diff --git a/all_results.json b/all_results.json index 047c4a7008f2ff07dc3319c8e924a9c7ca384c2f..d417069f16c233f3c46d6a8ce956827c58d83629 100644 --- a/all_results.json +++ b/all_results.json @@ -1,14 +1,8 @@ { "epoch": 2.0, - "eval_cer": 0.01165665167457964, - "eval_loss": 0.005274078343063593, - "eval_runtime": 1990.4275, - "eval_samples": 2000, - "eval_samples_per_second": 1.005, - "eval_steps_per_second": 0.251, - "train_loss": 0.016045775709704408, - "train_runtime": 206173.8627, - "train_samples": 2960086, - "train_samples_per_second": 28.714, - "train_steps_per_second": 0.897 + "train_loss": 0.013614018808192265, + "train_runtime": 415192.129, + "train_samples": 6342779, + "train_samples_per_second": 30.553, + "train_steps_per_second": 0.955 } \ No newline at end of file diff --git a/config.json b/config.json index c8a1c7ebd5ad984ff8c24dcd9ce0eb5ab27b0abe..4ba6e9d65f9a3489b31ec956ea4d653cc1fffd5e 100644 --- a/config.json +++ b/config.json @@ -69,7 +69,7 @@ } }, "torch_dtype": "float32", - "transformers_version": "4.27.3", + "transformers_version": "4.30.2", "use_cache": true, "vocab_size": 50265 } diff --git a/generation_config.json b/generation_config.json index 1b00ca7a8a32b8b903a86bab0b5731c499759fd5..6c794ebf7e6a23203b59fba0a81a7d3c84d1cd45 100644 --- a/generation_config.json +++ b/generation_config.json @@ -8,5 +8,5 @@ "no_repeat_ngram_size": 3, "num_beams": 4, "pad_token_id": 1, - "transformers_version": "4.27.3" + "transformers_version": "4.30.2" } diff --git a/merges.txt b/merges.txt index 6636bda4a1fd7a63653dffb22683b8162c8de956..226b0752cac7789c48f0cb3ec53eda48b7be36cc 100644 --- a/merges.txt +++ b/merges.txt @@ -1,4 +1,4 @@ -#version: 0.2 - Trained by `huggingface/tokenizers` +#version: 0.2 Ġ t Ġ a h e diff --git a/pytorch_model.bin b/pytorch_model.bin index 65249d4d581ed5891d506608f40512bd9df1d517..cb2a97963ba95d317243fa7bc9485ff977581b85 100644 --- a/pytorch_model.bin +++ b/pytorch_model.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:96696783fd7389a128057a8994d2b0151034ffed0645a6a6c5b271c1514f2b0b +oid sha256:6ed26ed7830bddb2e53106a9f1e2d9eac7db42270845f34d6f3315c387c147b5 size 557971229 diff --git a/tokenizer.json b/tokenizer.json index 53991fd16215ae49c709b8c7ff24bb94f1c76fac..b04fe5793a1d04928db9817b4a2f864956da53f9 100644 --- a/tokenizer.json +++ b/tokenizer.json @@ -87,6 +87,7 @@ "continuing_subword_prefix": "", "end_of_word_suffix": "", "fuse_unk": false, + "byte_fallback": false, "vocab": { "": 0, "": 1, diff --git a/tokenizer_config.json b/tokenizer_config.json index f57c2b5b04fe2aa5ce9993300ef9867d56704684..1cced8e6bdea9a67e88551545c3110bedcc06e95 100644 --- a/tokenizer_config.json +++ b/tokenizer_config.json @@ -1,6 +1,7 @@ { "add_prefix_space": false, "bos_token": "", + "clean_up_tokenization_spaces": true, "cls_token": "", "eos_token": "", "errors": "replace", @@ -8,7 +9,6 @@ "model_max_length": 1024, "pad_token": "", "sep_token": "", - "special_tokens_map_file": null, "tokenizer_class": "BartTokenizer", "trim_offsets": true, "unk_token": "" diff --git a/train_results.json b/train_results.json index 2bdacad677b8d784f7398fedc2ac6aeac30291fb..d417069f16c233f3c46d6a8ce956827c58d83629 100644 --- a/train_results.json +++ b/train_results.json @@ -1,8 +1,8 @@ { "epoch": 2.0, - "train_loss": 0.016045775709704408, - "train_runtime": 206173.8627, - "train_samples": 2960086, - "train_samples_per_second": 28.714, - "train_steps_per_second": 0.897 + "train_loss": 0.013614018808192265, + "train_runtime": 415192.129, + "train_samples": 6342779, + "train_samples_per_second": 30.553, + "train_steps_per_second": 0.955 } \ No newline at end of file diff --git a/trainer_state.json b/trainer_state.json index 3d6d3d8f391784b0fcb347a2a9fa638d828a5619..4625ccb9b4b27dfb586ee9d649b812a83b4c1a67 100644 --- a/trainer_state.json +++ b/trainer_state.json @@ -1,112690 +1,241441 @@ { - "best_metric": 0.9214921903908192, - "best_model_checkpoint": "./models/bart-base-spelling-nl-1m-3/checkpoint-177000", - "epoch": 1.999985135567007, - "global_step": 185004, + "best_metric": 0.9143955354015062, + "best_model_checkpoint": "./models/bart-base-spelling-nl-3m-3-2nd/checkpoint-390000", + "epoch": 1.999991171063792, + "global_step": 396422, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, - "learning_rate": 0.0002999837841343971, - "loss": 1.0202, + "learning_rate": 0.00029999243230698596, + "loss": 0.7347, "step": 10 }, { "epoch": 0.0, - "learning_rate": 0.00029996756826879416, - "loss": 0.2241, + "learning_rate": 0.00029998486461397194, + "loss": 0.2215, "step": 20 }, { "epoch": 0.0, - "learning_rate": 0.0002999513524031912, - "loss": 0.175, + "learning_rate": 0.0002999772969209579, + "loss": 0.1811, "step": 30 }, { "epoch": 0.0, - "learning_rate": 0.00029993513653758834, - "loss": 0.1532, + "learning_rate": 0.00029996972922794395, + "loss": 0.1745, "step": 40 }, { "epoch": 0.0, - "learning_rate": 0.00029991892067198546, - "loss": 0.1924, + "learning_rate": 0.00029996216153492994, + "loss": 0.1605, "step": 50 }, { "epoch": 0.0, - "learning_rate": 0.00029990270480638253, - "loss": 0.146, + "learning_rate": 0.0002999545938419159, + "loss": 0.1534, "step": 60 }, { "epoch": 0.0, - "learning_rate": 0.00029988648894077965, - "loss": 0.1704, + "learning_rate": 0.0002999470261489019, + "loss": 0.1525, "step": 70 }, { "epoch": 0.0, - "learning_rate": 0.0002998702730751767, - "loss": 0.157, + "learning_rate": 0.0002999394584558879, + "loss": 0.1273, "step": 80 }, { "epoch": 0.0, - "learning_rate": 0.00029985405720957384, - "loss": 0.1478, + "learning_rate": 0.00029993189076287386, + "loss": 0.144, "step": 90 }, { "epoch": 0.0, - "learning_rate": 0.00029983784134397096, - "loss": 0.1327, + "learning_rate": 0.0002999243230698599, + "loss": 0.172, "step": 100 }, { "epoch": 0.0, - "learning_rate": 0.000299821625478368, - "loss": 0.1403, + "learning_rate": 0.0002999167553768459, + "loss": 0.1288, "step": 110 }, { "epoch": 0.0, - "learning_rate": 0.0002998054096127651, - "loss": 0.1263, + "learning_rate": 0.00029990918768383186, + "loss": 0.1398, "step": 120 }, { "epoch": 0.0, - "learning_rate": 0.0002997891937471622, - "loss": 0.1305, + "learning_rate": 0.00029990161999081784, + "loss": 0.164, "step": 130 }, { "epoch": 0.0, - "learning_rate": 0.0002997729778815593, - "loss": 0.1128, + "learning_rate": 0.0002998940522978038, + "loss": 0.1436, "step": 140 }, { "epoch": 0.0, - "learning_rate": 0.0002997567620159564, + "learning_rate": 0.0002998864846047898, "loss": 0.1263, "step": 150 }, { "epoch": 0.0, - "learning_rate": 0.00029974054615035346, - "loss": 0.1136, + "learning_rate": 0.00029987891691177584, + "loss": 0.1235, "step": 160 }, { "epoch": 0.0, - "learning_rate": 0.0002997243302847506, - "loss": 0.1132, + "learning_rate": 0.0002998713492187618, + "loss": 0.1192, "step": 170 }, { "epoch": 0.0, - "learning_rate": 0.0002997081144191477, - "loss": 0.1185, + "learning_rate": 0.0002998637815257478, + "loss": 0.1067, "step": 180 }, { "epoch": 0.0, - "learning_rate": 0.00029969189855354476, - "loss": 0.1145, + "learning_rate": 0.0002998562138327338, + "loss": 0.1085, "step": 190 }, { "epoch": 0.0, - "learning_rate": 0.00029967568268794183, - "loss": 0.1166, + "learning_rate": 0.00029984864613971977, + "loss": 0.1203, "step": 200 }, { "epoch": 0.0, - "learning_rate": 0.00029965946682233895, - "loss": 0.1197, + "learning_rate": 0.00029984107844670575, + "loss": 0.1025, "step": 210 }, { "epoch": 0.0, - "learning_rate": 0.00029964325095673607, - "loss": 0.1119, + "learning_rate": 0.00029983351075369173, + "loss": 0.1044, "step": 220 }, { "epoch": 0.0, - "learning_rate": 0.00029962703509113313, - "loss": 0.1056, + "learning_rate": 0.00029982594306067776, + "loss": 0.0965, "step": 230 }, { "epoch": 0.0, - "learning_rate": 0.00029961081922553025, - "loss": 0.1087, + "learning_rate": 0.00029981837536766375, + "loss": 0.1083, "step": 240 }, { "epoch": 0.0, - "learning_rate": 0.0002995946033599273, - "loss": 0.109, + "learning_rate": 0.0002998108076746497, + "loss": 0.106, "step": 250 }, { "epoch": 0.0, - "learning_rate": 0.00029957838749432444, - "loss": 0.0968, + "learning_rate": 0.0002998032399816357, + "loss": 0.1017, "step": 260 }, { "epoch": 0.0, - "learning_rate": 0.0002995621716287215, - "loss": 0.1025, + "learning_rate": 0.0002997956722886217, + "loss": 0.1216, "step": 270 }, { "epoch": 0.0, - "learning_rate": 0.0002995459557631186, - "loss": 0.0981, + "learning_rate": 0.00029978810459560767, + "loss": 0.1059, "step": 280 }, { "epoch": 0.0, - "learning_rate": 0.0002995297398975157, - "loss": 0.1009, + "learning_rate": 0.0002997805369025937, + "loss": 0.0953, "step": 290 }, { "epoch": 0.0, - "learning_rate": 0.0002995135240319128, - "loss": 0.1017, + "learning_rate": 0.0002997729692095797, + "loss": 0.0948, "step": 300 }, { "epoch": 0.0, - "learning_rate": 0.0002994973081663099, - "loss": 0.1169, + "learning_rate": 0.00029976540151656567, + "loss": 0.1041, "step": 310 }, { "epoch": 0.0, - "learning_rate": 0.000299481092300707, - "loss": 0.1023, + "learning_rate": 0.00029975783382355165, + "loss": 0.0998, "step": 320 }, { "epoch": 0.0, - "learning_rate": 0.00029946487643510406, - "loss": 0.1122, + "learning_rate": 0.00029975026613053763, + "loss": 0.0976, "step": 330 }, { "epoch": 0.0, - "learning_rate": 0.0002994486605695012, - "loss": 0.0944, + "learning_rate": 0.0002997426984375236, + "loss": 0.1064, "step": 340 }, { "epoch": 0.0, - "learning_rate": 0.00029943244470389825, - "loss": 0.0995, + "learning_rate": 0.0002997351307445096, + "loss": 0.1054, "step": 350 }, { "epoch": 0.0, - "learning_rate": 0.00029941622883829537, - "loss": 0.0897, + "learning_rate": 0.00029972756305149563, + "loss": 0.084, "step": 360 }, { "epoch": 0.0, - "learning_rate": 0.0002994000129726925, - "loss": 0.0936, + "learning_rate": 0.0002997199953584816, + "loss": 0.0937, "step": 370 }, { "epoch": 0.0, - "learning_rate": 0.00029938379710708955, - "loss": 0.0905, + "learning_rate": 0.0002997124276654676, + "loss": 0.1096, "step": 380 }, { "epoch": 0.0, - "learning_rate": 0.0002993675812414866, - "loss": 0.0891, + "learning_rate": 0.0002997048599724536, + "loss": 0.1014, "step": 390 }, { "epoch": 0.0, - "learning_rate": 0.00029935136537588374, - "loss": 0.0886, + "learning_rate": 0.00029969729227943956, + "loss": 0.0946, "step": 400 }, { "epoch": 0.0, - "learning_rate": 0.00029933514951028086, - "loss": 0.0872, + "learning_rate": 0.00029968972458642554, + "loss": 0.0951, "step": 410 }, { "epoch": 0.0, - "learning_rate": 0.0002993189336446779, - "loss": 0.0874, + "learning_rate": 0.0002996821568934116, + "loss": 0.0892, "step": 420 }, { "epoch": 0.0, - "learning_rate": 0.000299302717779075, + "learning_rate": 0.00029967458920039756, "loss": 0.0945, "step": 430 }, { "epoch": 0.0, - "learning_rate": 0.0002992865019134721, - "loss": 0.1135, + "learning_rate": 0.00029966702150738354, + "loss": 0.0932, "step": 440 }, { "epoch": 0.0, - "learning_rate": 0.00029927028604786923, - "loss": 0.1259, + "learning_rate": 0.0002996594538143695, + "loss": 0.0833, "step": 450 }, { "epoch": 0.0, - "learning_rate": 0.0002992540701822663, - "loss": 0.1149, + "learning_rate": 0.0002996518861213555, + "loss": 0.0837, "step": 460 }, { - "epoch": 0.01, - "learning_rate": 0.00029923785431666336, - "loss": 0.1007, + "epoch": 0.0, + "learning_rate": 0.0002996443184283415, + "loss": 0.085, "step": 470 }, { - "epoch": 0.01, - "learning_rate": 0.0002992216384510605, - "loss": 0.1059, + "epoch": 0.0, + "learning_rate": 0.0002996367507353275, + "loss": 0.086, "step": 480 }, { - "epoch": 0.01, - "learning_rate": 0.0002992054225854576, - "loss": 0.1042, + "epoch": 0.0, + "learning_rate": 0.0002996291830423135, + "loss": 0.079, "step": 490 }, { - "epoch": 0.01, - "learning_rate": 0.00029918920671985467, - "loss": 0.1074, + "epoch": 0.0, + "learning_rate": 0.0002996216153492995, + "loss": 0.0793, "step": 500 }, { - "epoch": 0.01, - "learning_rate": 0.0002991729908542518, - "loss": 0.093, + "epoch": 0.0, + "learning_rate": 0.00029961404765628546, + "loss": 0.0857, "step": 510 }, { - "epoch": 0.01, - "learning_rate": 0.00029915677498864885, - "loss": 0.1079, + "epoch": 0.0, + "learning_rate": 0.00029960647996327144, + "loss": 0.0824, "step": 520 }, { - "epoch": 0.01, - "learning_rate": 0.00029914055912304597, - "loss": 0.0862, + "epoch": 0.0, + "learning_rate": 0.0002995989122702574, + "loss": 0.0853, "step": 530 }, { - "epoch": 0.01, - "learning_rate": 0.0002991243432574431, - "loss": 0.0947, + "epoch": 0.0, + "learning_rate": 0.0002995913445772434, + "loss": 0.0837, "step": 540 }, { - "epoch": 0.01, - "learning_rate": 0.00029910812739184016, - "loss": 0.0835, + "epoch": 0.0, + "learning_rate": 0.00029958377688422944, + "loss": 0.0743, "step": 550 }, { - "epoch": 0.01, - "learning_rate": 0.0002990919115262372, - "loss": 0.0931, + "epoch": 0.0, + "learning_rate": 0.0002995762091912154, + "loss": 0.0792, "step": 560 }, { - "epoch": 0.01, - "learning_rate": 0.00029907569566063434, - "loss": 0.0853, + "epoch": 0.0, + "learning_rate": 0.0002995686414982014, + "loss": 0.0767, "step": 570 }, { - "epoch": 0.01, - "learning_rate": 0.00029905947979503146, - "loss": 0.0821, + "epoch": 0.0, + "learning_rate": 0.0002995610738051874, + "loss": 0.0813, "step": 580 }, { - "epoch": 0.01, - "learning_rate": 0.0002990432639294285, - "loss": 0.0911, + "epoch": 0.0, + "learning_rate": 0.00029955350611217337, + "loss": 0.0869, "step": 590 }, { - "epoch": 0.01, - "learning_rate": 0.0002990270480638256, - "loss": 0.0821, + "epoch": 0.0, + "learning_rate": 0.00029954593841915935, + "loss": 0.0795, "step": 600 }, { - "epoch": 0.01, - "learning_rate": 0.0002990108321982227, - "loss": 0.0909, + "epoch": 0.0, + "learning_rate": 0.0002995383707261454, + "loss": 0.0784, "step": 610 }, { - "epoch": 0.01, - "learning_rate": 0.00029899461633261983, - "loss": 0.0887, + "epoch": 0.0, + "learning_rate": 0.00029953080303313137, + "loss": 0.0813, "step": 620 }, { - "epoch": 0.01, - "learning_rate": 0.0002989784004670169, - "loss": 0.0853, + "epoch": 0.0, + "learning_rate": 0.0002995232353401173, + "loss": 0.0906, "step": 630 }, { - "epoch": 0.01, - "learning_rate": 0.00029896218460141396, - "loss": 0.0791, + "epoch": 0.0, + "learning_rate": 0.0002995156676471033, + "loss": 0.0762, "step": 640 }, { - "epoch": 0.01, - "learning_rate": 0.0002989459687358111, - "loss": 0.0788, + "epoch": 0.0, + "learning_rate": 0.0002995080999540893, + "loss": 0.0874, "step": 650 }, { - "epoch": 0.01, - "learning_rate": 0.0002989297528702082, - "loss": 0.0836, + "epoch": 0.0, + "learning_rate": 0.0002995005322610753, + "loss": 0.0744, "step": 660 }, { - "epoch": 0.01, - "learning_rate": 0.00029891353700460527, - "loss": 0.081, + "epoch": 0.0, + "learning_rate": 0.00029949296456806127, + "loss": 0.0719, "step": 670 }, { - "epoch": 0.01, - "learning_rate": 0.0002988973211390024, - "loss": 0.0799, + "epoch": 0.0, + "learning_rate": 0.00029948539687504725, + "loss": 0.0757, "step": 680 }, { - "epoch": 0.01, - "learning_rate": 0.00029888110527339945, - "loss": 0.0832, + "epoch": 0.0, + "learning_rate": 0.00029947782918203324, + "loss": 0.0752, "step": 690 }, { - "epoch": 0.01, - "learning_rate": 0.0002988648894077966, - "loss": 0.0746, + "epoch": 0.0, + "learning_rate": 0.0002994702614890192, + "loss": 0.0854, "step": 700 }, { - "epoch": 0.01, - "learning_rate": 0.00029884867354219364, - "loss": 0.0846, + "epoch": 0.0, + "learning_rate": 0.00029946269379600525, + "loss": 0.0878, "step": 710 }, { - "epoch": 0.01, - "learning_rate": 0.00029883245767659076, - "loss": 0.084, + "epoch": 0.0, + "learning_rate": 0.00029945512610299123, + "loss": 0.0747, "step": 720 }, { - "epoch": 0.01, - "learning_rate": 0.0002988162418109878, - "loss": 0.0793, + "epoch": 0.0, + "learning_rate": 0.0002994475584099772, + "loss": 0.0783, "step": 730 }, { - "epoch": 0.01, - "learning_rate": 0.00029880002594538495, - "loss": 0.0761, + "epoch": 0.0, + "learning_rate": 0.0002994399907169632, + "loss": 0.0841, "step": 740 }, { - "epoch": 0.01, - "learning_rate": 0.00029878381007978207, - "loss": 0.0768, + "epoch": 0.0, + "learning_rate": 0.0002994324230239492, + "loss": 0.0798, "step": 750 }, { - "epoch": 0.01, - "learning_rate": 0.00029876759421417913, - "loss": 0.0829, + "epoch": 0.0, + "learning_rate": 0.00029942485533093516, + "loss": 0.0835, "step": 760 }, { - "epoch": 0.01, - "learning_rate": 0.0002987513783485762, - "loss": 0.0768, + "epoch": 0.0, + "learning_rate": 0.00029941728763792114, + "loss": 0.0709, "step": 770 }, { - "epoch": 0.01, - "learning_rate": 0.0002987351624829733, - "loss": 0.0708, + "epoch": 0.0, + "learning_rate": 0.0002994097199449072, + "loss": 0.0715, "step": 780 }, { - "epoch": 0.01, - "learning_rate": 0.00029871894661737044, - "loss": 0.0757, + "epoch": 0.0, + "learning_rate": 0.00029940215225189316, + "loss": 0.0859, "step": 790 }, { - "epoch": 0.01, - "learning_rate": 0.0002987027307517675, - "loss": 0.0762, + "epoch": 0.0, + "learning_rate": 0.00029939458455887914, + "loss": 0.0811, "step": 800 }, { - "epoch": 0.01, - "learning_rate": 0.0002986865148861646, - "loss": 0.0788, + "epoch": 0.0, + "learning_rate": 0.0002993870168658651, + "loss": 0.0768, "step": 810 }, { - "epoch": 0.01, - "learning_rate": 0.0002986702990205617, - "loss": 0.0722, + "epoch": 0.0, + "learning_rate": 0.0002993794491728511, + "loss": 0.0736, "step": 820 }, { - "epoch": 0.01, - "learning_rate": 0.0002986540831549588, - "loss": 0.0891, + "epoch": 0.0, + "learning_rate": 0.0002993718814798371, + "loss": 0.0673, "step": 830 }, { - "epoch": 0.01, - "learning_rate": 0.00029863786728935587, - "loss": 0.0776, + "epoch": 0.0, + "learning_rate": 0.0002993643137868231, + "loss": 0.0703, "step": 840 }, { - "epoch": 0.01, - "learning_rate": 0.000298621651423753, - "loss": 0.0764, + "epoch": 0.0, + "learning_rate": 0.0002993567460938091, + "loss": 0.0774, "step": 850 }, { - "epoch": 0.01, - "learning_rate": 0.00029860543555815006, - "loss": 0.0751, + "epoch": 0.0, + "learning_rate": 0.0002993491784007951, + "loss": 0.0795, "step": 860 }, { - "epoch": 0.01, - "learning_rate": 0.0002985892196925472, - "loss": 0.0762, + "epoch": 0.0, + "learning_rate": 0.00029934161070778106, + "loss": 0.0833, "step": 870 }, { - "epoch": 0.01, - "learning_rate": 0.00029857300382694424, - "loss": 0.0757, + "epoch": 0.0, + "learning_rate": 0.00029933404301476705, + "loss": 0.077, "step": 880 }, { - "epoch": 0.01, - "learning_rate": 0.00029855678796134136, - "loss": 0.0718, + "epoch": 0.0, + "learning_rate": 0.000299326475321753, + "loss": 0.0724, "step": 890 }, { - "epoch": 0.01, - "learning_rate": 0.00029854057209573843, - "loss": 0.0736, + "epoch": 0.0, + "learning_rate": 0.000299318907628739, + "loss": 0.0766, "step": 900 }, { - "epoch": 0.01, - "learning_rate": 0.00029852435623013555, - "loss": 0.078, + "epoch": 0.0, + "learning_rate": 0.00029931133993572504, + "loss": 0.0849, "step": 910 }, { - "epoch": 0.01, - "learning_rate": 0.0002985081403645326, - "loss": 0.0774, + "epoch": 0.0, + "learning_rate": 0.000299303772242711, + "loss": 0.0761, "step": 920 }, { - "epoch": 0.01, - "learning_rate": 0.00029849192449892973, - "loss": 0.0727, + "epoch": 0.0, + "learning_rate": 0.000299296204549697, + "loss": 0.0725, "step": 930 }, { - "epoch": 0.01, - "learning_rate": 0.0002984757086333268, - "loss": 0.0834, + "epoch": 0.0, + "learning_rate": 0.000299288636856683, + "loss": 0.0778, "step": 940 }, { - "epoch": 0.01, - "learning_rate": 0.0002984594927677239, - "loss": 0.0811, + "epoch": 0.0, + "learning_rate": 0.00029928106916366897, + "loss": 0.0758, "step": 950 }, { - "epoch": 0.01, - "learning_rate": 0.000298443276902121, - "loss": 0.0768, + "epoch": 0.0, + "learning_rate": 0.00029927350147065495, + "loss": 0.0794, "step": 960 }, { - "epoch": 0.01, - "learning_rate": 0.0002984270610365181, - "loss": 0.0764, + "epoch": 0.0, + "learning_rate": 0.000299265933777641, + "loss": 0.0707, "step": 970 }, { - "epoch": 0.01, - "learning_rate": 0.0002984108451709152, - "loss": 0.0817, + "epoch": 0.0, + "learning_rate": 0.00029925836608462697, + "loss": 0.0737, "step": 980 }, { - "epoch": 0.01, - "learning_rate": 0.0002983946293053123, - "loss": 0.0856, + "epoch": 0.0, + "learning_rate": 0.00029925079839161295, + "loss": 0.0756, "step": 990 }, { "epoch": 0.01, - "learning_rate": 0.00029837841343970936, - "loss": 0.0834, + "learning_rate": 0.00029924323069859893, + "loss": 0.0794, "step": 1000 }, { "epoch": 0.01, - "eval_cer": 0.9216337726727086, - "eval_loss": 0.060326751321554184, - "eval_runtime": 121.7661, - "eval_samples_per_second": 16.425, - "eval_steps_per_second": 4.106, + "eval_cer": 0.914636193640606, + "eval_loss": 0.057572510093450546, + "eval_runtime": 117.4563, + "eval_samples_per_second": 17.028, + "eval_steps_per_second": 4.257, "step": 1000 }, { "epoch": 0.01, - "learning_rate": 0.0002983621975741065, - "loss": 0.0711, + "learning_rate": 0.0002992356630055849, + "loss": 0.0786, "step": 1010 }, { "epoch": 0.01, - "learning_rate": 0.0002983459817085036, - "loss": 0.0706, + "learning_rate": 0.0002992280953125709, + "loss": 0.0757, "step": 1020 }, { "epoch": 0.01, - "learning_rate": 0.00029832976584290066, - "loss": 0.0661, + "learning_rate": 0.00029922052761955693, + "loss": 0.079, "step": 1030 }, { "epoch": 0.01, - "learning_rate": 0.00029831354997729773, - "loss": 0.0843, + "learning_rate": 0.0002992129599265429, + "loss": 0.0718, "step": 1040 }, { "epoch": 0.01, - "learning_rate": 0.00029829733411169485, - "loss": 0.0696, + "learning_rate": 0.0002992053922335289, + "loss": 0.083, "step": 1050 }, { "epoch": 0.01, - "learning_rate": 0.00029828111824609197, - "loss": 0.0796, + "learning_rate": 0.0002991978245405149, + "loss": 0.0785, "step": 1060 }, { "epoch": 0.01, - "learning_rate": 0.00029826490238048903, - "loss": 0.0737, + "learning_rate": 0.00029919025684750086, + "loss": 0.0776, "step": 1070 }, { "epoch": 0.01, - "learning_rate": 0.00029824868651488615, - "loss": 0.073, + "learning_rate": 0.00029918268915448684, + "loss": 0.0747, "step": 1080 }, { "epoch": 0.01, - "learning_rate": 0.0002982324706492832, - "loss": 0.0668, + "learning_rate": 0.0002991751214614728, + "loss": 0.082, "step": 1090 }, { "epoch": 0.01, - "learning_rate": 0.00029821625478368034, - "loss": 0.076, + "learning_rate": 0.00029916755376845885, + "loss": 0.073, "step": 1100 }, { "epoch": 0.01, - "learning_rate": 0.00029820003891807746, - "loss": 0.0771, + "learning_rate": 0.00029915998607544484, + "loss": 0.0719, "step": 1110 }, { "epoch": 0.01, - "learning_rate": 0.0002981838230524745, - "loss": 0.0652, + "learning_rate": 0.0002991524183824308, + "loss": 0.0861, "step": 1120 }, { "epoch": 0.01, - "learning_rate": 0.0002981676071868716, - "loss": 0.0713, + "learning_rate": 0.0002991448506894168, + "loss": 0.0647, "step": 1130 }, { "epoch": 0.01, - "learning_rate": 0.0002981513913212687, - "loss": 0.0709, + "learning_rate": 0.0002991372829964028, + "loss": 0.0666, "step": 1140 }, { "epoch": 0.01, - "learning_rate": 0.00029813517545566583, - "loss": 0.0741, + "learning_rate": 0.00029912971530338876, + "loss": 0.0736, "step": 1150 }, { "epoch": 0.01, - "learning_rate": 0.0002981189595900629, - "loss": 0.073, + "learning_rate": 0.0002991221476103748, + "loss": 0.0638, "step": 1160 }, { "epoch": 0.01, - "learning_rate": 0.00029810274372445996, - "loss": 0.063, + "learning_rate": 0.0002991145799173608, + "loss": 0.0711, "step": 1170 }, { "epoch": 0.01, - "learning_rate": 0.0002980865278588571, - "loss": 0.0682, + "learning_rate": 0.00029910701222434676, + "loss": 0.0683, "step": 1180 }, { "epoch": 0.01, - "learning_rate": 0.0002980703119932542, - "loss": 0.0699, + "learning_rate": 0.00029909944453133274, + "loss": 0.0695, "step": 1190 }, { "epoch": 0.01, - "learning_rate": 0.00029805409612765127, - "loss": 0.0667, + "learning_rate": 0.0002990918768383187, + "loss": 0.0733, "step": 1200 }, { "epoch": 0.01, - "learning_rate": 0.00029803788026204833, - "loss": 0.0717, + "learning_rate": 0.0002990843091453047, + "loss": 0.0736, "step": 1210 }, { "epoch": 0.01, - "learning_rate": 0.00029802166439644545, - "loss": 0.0657, + "learning_rate": 0.00029907674145229074, + "loss": 0.0725, "step": 1220 }, { "epoch": 0.01, - "learning_rate": 0.00029800544853084257, - "loss": 0.0761, + "learning_rate": 0.0002990691737592767, + "loss": 0.0629, "step": 1230 }, { "epoch": 0.01, - "learning_rate": 0.00029798923266523964, - "loss": 0.0801, + "learning_rate": 0.0002990616060662627, + "loss": 0.061, "step": 1240 }, { "epoch": 0.01, - "learning_rate": 0.00029797301679963676, - "loss": 0.0712, + "learning_rate": 0.0002990540383732487, + "loss": 0.059, "step": 1250 }, { "epoch": 0.01, - "learning_rate": 0.0002979568009340338, - "loss": 0.068, + "learning_rate": 0.00029904647068023467, + "loss": 0.0654, "step": 1260 }, { "epoch": 0.01, - "learning_rate": 0.00029794058506843094, - "loss": 0.0628, + "learning_rate": 0.00029903890298722065, + "loss": 0.0563, "step": 1270 }, { "epoch": 0.01, - "learning_rate": 0.000297924369202828, - "loss": 0.0705, + "learning_rate": 0.00029903133529420663, + "loss": 0.0666, "step": 1280 }, { "epoch": 0.01, - "learning_rate": 0.00029790815333722513, - "loss": 0.0692, + "learning_rate": 0.00029902376760119266, + "loss": 0.0655, "step": 1290 }, { "epoch": 0.01, - "learning_rate": 0.0002978919374716222, - "loss": 0.0786, + "learning_rate": 0.00029901619990817865, + "loss": 0.0569, "step": 1300 }, { "epoch": 0.01, - "learning_rate": 0.0002978757216060193, - "loss": 0.0775, + "learning_rate": 0.0002990086322151646, + "loss": 0.0673, "step": 1310 }, { "epoch": 0.01, - "learning_rate": 0.0002978595057404164, - "loss": 0.0664, + "learning_rate": 0.0002990010645221506, + "loss": 0.0653, "step": 1320 }, { "epoch": 0.01, - "learning_rate": 0.0002978432898748135, - "loss": 0.0603, + "learning_rate": 0.0002989934968291366, + "loss": 0.0668, "step": 1330 }, { "epoch": 0.01, - "learning_rate": 0.00029782707400921056, - "loss": 0.0608, + "learning_rate": 0.00029898592913612257, + "loss": 0.0727, "step": 1340 }, { "epoch": 0.01, - "learning_rate": 0.0002978108581436077, - "loss": 0.0627, + "learning_rate": 0.0002989783614431086, + "loss": 0.0714, "step": 1350 }, { "epoch": 0.01, - "learning_rate": 0.00029779464227800475, - "loss": 0.0677, + "learning_rate": 0.0002989707937500946, + "loss": 0.0657, "step": 1360 }, { "epoch": 0.01, - "learning_rate": 0.00029777842641240187, - "loss": 0.0728, + "learning_rate": 0.00029896322605708057, + "loss": 0.0631, "step": 1370 }, { "epoch": 0.01, - "learning_rate": 0.000297762210546799, - "loss": 0.0751, + "learning_rate": 0.00029895565836406655, + "loss": 0.0658, "step": 1380 }, { - "epoch": 0.02, - "learning_rate": 0.00029774599468119605, - "loss": 0.0666, + "epoch": 0.01, + "learning_rate": 0.00029894809067105253, + "loss": 0.0652, "step": 1390 }, { - "epoch": 0.02, - "learning_rate": 0.0002977297788155931, - "loss": 0.0664, + "epoch": 0.01, + "learning_rate": 0.0002989405229780385, + "loss": 0.0743, "step": 1400 }, { - "epoch": 0.02, - "learning_rate": 0.00029771356294999024, - "loss": 0.0645, + "epoch": 0.01, + "learning_rate": 0.0002989329552850245, + "loss": 0.0639, "step": 1410 }, { - "epoch": 0.02, - "learning_rate": 0.00029769734708438736, - "loss": 0.0714, + "epoch": 0.01, + "learning_rate": 0.00029892538759201053, + "loss": 0.0642, "step": 1420 }, { - "epoch": 0.02, - "learning_rate": 0.0002976811312187844, - "loss": 0.0743, + "epoch": 0.01, + "learning_rate": 0.0002989178198989965, + "loss": 0.0706, "step": 1430 }, { - "epoch": 0.02, - "learning_rate": 0.00029766491535318155, - "loss": 0.0631, + "epoch": 0.01, + "learning_rate": 0.0002989102522059825, + "loss": 0.0656, "step": 1440 }, { - "epoch": 0.02, - "learning_rate": 0.0002976486994875786, - "loss": 0.0612, + "epoch": 0.01, + "learning_rate": 0.0002989026845129685, + "loss": 0.0714, "step": 1450 }, { - "epoch": 0.02, - "learning_rate": 0.00029763248362197573, - "loss": 0.0598, + "epoch": 0.01, + "learning_rate": 0.00029889511681995446, + "loss": 0.0703, "step": 1460 }, { - "epoch": 0.02, - "learning_rate": 0.0002976162677563728, - "loss": 0.058, + "epoch": 0.01, + "learning_rate": 0.00029888754912694044, + "loss": 0.0675, "step": 1470 }, { - "epoch": 0.02, - "learning_rate": 0.0002976000518907699, - "loss": 0.064, + "epoch": 0.01, + "learning_rate": 0.0002988799814339265, + "loss": 0.0703, "step": 1480 }, { - "epoch": 0.02, - "learning_rate": 0.000297583836025167, - "loss": 0.0575, + "epoch": 0.01, + "learning_rate": 0.00029887241374091246, + "loss": 0.0671, "step": 1490 }, { - "epoch": 0.02, - "learning_rate": 0.0002975676201595641, - "loss": 0.0634, + "epoch": 0.01, + "learning_rate": 0.00029886484604789844, + "loss": 0.0668, "step": 1500 }, { - "epoch": 0.02, - "learning_rate": 0.00029755140429396117, - "loss": 0.06, + "epoch": 0.01, + "learning_rate": 0.0002988572783548844, + "loss": 0.0688, "step": 1510 }, { - "epoch": 0.02, - "learning_rate": 0.0002975351884283583, - "loss": 0.0562, + "epoch": 0.01, + "learning_rate": 0.0002988497106618704, + "loss": 0.065, "step": 1520 }, { - "epoch": 0.02, - "learning_rate": 0.00029751897256275535, - "loss": 0.0716, + "epoch": 0.01, + "learning_rate": 0.0002988421429688564, + "loss": 0.0656, "step": 1530 }, { - "epoch": 0.02, - "learning_rate": 0.0002975027566971525, - "loss": 0.0696, + "epoch": 0.01, + "learning_rate": 0.0002988345752758424, + "loss": 0.0695, "step": 1540 }, { - "epoch": 0.02, - "learning_rate": 0.0002974865408315496, - "loss": 0.0671, + "epoch": 0.01, + "learning_rate": 0.0002988270075828284, + "loss": 0.0732, "step": 1550 }, { - "epoch": 0.02, - "learning_rate": 0.00029747032496594666, - "loss": 0.0796, + "epoch": 0.01, + "learning_rate": 0.0002988194398898144, + "loss": 0.0693, "step": 1560 }, { - "epoch": 0.02, - "learning_rate": 0.0002974541091003437, - "loss": 0.0591, + "epoch": 0.01, + "learning_rate": 0.00029881187219680036, + "loss": 0.0653, "step": 1570 }, { - "epoch": 0.02, - "learning_rate": 0.00029743789323474084, - "loss": 0.0684, + "epoch": 0.01, + "learning_rate": 0.00029880430450378634, + "loss": 0.0652, "step": 1580 }, { - "epoch": 0.02, - "learning_rate": 0.00029742167736913796, - "loss": 0.0634, + "epoch": 0.01, + "learning_rate": 0.0002987967368107723, + "loss": 0.0775, "step": 1590 }, { - "epoch": 0.02, - "learning_rate": 0.00029740546150353503, - "loss": 0.0703, + "epoch": 0.01, + "learning_rate": 0.0002987891691177583, + "loss": 0.069, "step": 1600 }, { - "epoch": 0.02, - "learning_rate": 0.0002973892456379321, - "loss": 0.0554, + "epoch": 0.01, + "learning_rate": 0.00029878160142474434, + "loss": 0.0666, "step": 1610 }, { - "epoch": 0.02, - "learning_rate": 0.0002973730297723292, - "loss": 0.0745, + "epoch": 0.01, + "learning_rate": 0.0002987740337317303, + "loss": 0.0642, "step": 1620 }, { - "epoch": 0.02, - "learning_rate": 0.00029735681390672633, - "loss": 0.0601, + "epoch": 0.01, + "learning_rate": 0.0002987664660387163, + "loss": 0.0659, "step": 1630 }, { - "epoch": 0.02, - "learning_rate": 0.0002973405980411234, - "loss": 0.0676, + "epoch": 0.01, + "learning_rate": 0.0002987588983457023, + "loss": 0.0657, "step": 1640 }, { - "epoch": 0.02, - "learning_rate": 0.00029732438217552047, - "loss": 0.0643, + "epoch": 0.01, + "learning_rate": 0.00029875133065268827, + "loss": 0.0655, "step": 1650 }, { - "epoch": 0.02, - "learning_rate": 0.0002973081663099176, - "loss": 0.0646, + "epoch": 0.01, + "learning_rate": 0.00029874376295967425, + "loss": 0.0605, "step": 1660 }, { - "epoch": 0.02, - "learning_rate": 0.0002972919504443147, - "loss": 0.0567, + "epoch": 0.01, + "learning_rate": 0.0002987361952666603, + "loss": 0.0676, "step": 1670 }, { - "epoch": 0.02, - "learning_rate": 0.0002972757345787118, - "loss": 0.0657, + "epoch": 0.01, + "learning_rate": 0.00029872862757364627, + "loss": 0.0536, "step": 1680 }, { - "epoch": 0.02, - "learning_rate": 0.0002972595187131089, - "loss": 0.0624, + "epoch": 0.01, + "learning_rate": 0.00029872105988063225, + "loss": 0.059, "step": 1690 }, { - "epoch": 0.02, - "learning_rate": 0.00029724330284750596, - "loss": 0.0657, + "epoch": 0.01, + "learning_rate": 0.00029871349218761823, + "loss": 0.059, "step": 1700 }, { - "epoch": 0.02, - "learning_rate": 0.0002972270869819031, - "loss": 0.0537, + "epoch": 0.01, + "learning_rate": 0.0002987059244946042, + "loss": 0.0586, "step": 1710 }, { - "epoch": 0.02, - "learning_rate": 0.0002972108711163002, - "loss": 0.0571, + "epoch": 0.01, + "learning_rate": 0.0002986983568015902, + "loss": 0.0583, "step": 1720 }, { - "epoch": 0.02, - "learning_rate": 0.00029719465525069726, - "loss": 0.0607, + "epoch": 0.01, + "learning_rate": 0.0002986907891085762, + "loss": 0.0589, "step": 1730 }, { - "epoch": 0.02, - "learning_rate": 0.00029717843938509433, - "loss": 0.0585, + "epoch": 0.01, + "learning_rate": 0.0002986832214155622, + "loss": 0.0582, "step": 1740 }, { - "epoch": 0.02, - "learning_rate": 0.00029716222351949145, - "loss": 0.0573, + "epoch": 0.01, + "learning_rate": 0.0002986756537225482, + "loss": 0.0708, "step": 1750 }, { - "epoch": 0.02, - "learning_rate": 0.00029714600765388857, - "loss": 0.0684, + "epoch": 0.01, + "learning_rate": 0.00029866808602953417, + "loss": 0.0637, "step": 1760 }, { - "epoch": 0.02, - "learning_rate": 0.00029712979178828563, - "loss": 0.0589, + "epoch": 0.01, + "learning_rate": 0.00029866051833652015, + "loss": 0.0645, "step": 1770 }, { - "epoch": 0.02, - "learning_rate": 0.0002971135759226827, - "loss": 0.0581, + "epoch": 0.01, + "learning_rate": 0.00029865295064350613, + "loss": 0.0582, "step": 1780 }, { - "epoch": 0.02, - "learning_rate": 0.0002970973600570798, - "loss": 0.0578, + "epoch": 0.01, + "learning_rate": 0.0002986453829504921, + "loss": 0.058, "step": 1790 }, { - "epoch": 0.02, - "learning_rate": 0.00029708114419147694, - "loss": 0.0646, + "epoch": 0.01, + "learning_rate": 0.00029863781525747815, + "loss": 0.0606, "step": 1800 }, { - "epoch": 0.02, - "learning_rate": 0.000297064928325874, - "loss": 0.0542, + "epoch": 0.01, + "learning_rate": 0.00029863024756446413, + "loss": 0.0569, "step": 1810 }, { - "epoch": 0.02, - "learning_rate": 0.0002970487124602711, - "loss": 0.0683, + "epoch": 0.01, + "learning_rate": 0.0002986226798714501, + "loss": 0.0622, "step": 1820 }, { - "epoch": 0.02, - "learning_rate": 0.0002970324965946682, - "loss": 0.0626, + "epoch": 0.01, + "learning_rate": 0.0002986151121784361, + "loss": 0.0669, "step": 1830 }, { - "epoch": 0.02, - "learning_rate": 0.0002970162807290653, - "loss": 0.0561, + "epoch": 0.01, + "learning_rate": 0.0002986075444854221, + "loss": 0.0735, "step": 1840 }, { - "epoch": 0.02, - "learning_rate": 0.0002970000648634624, - "loss": 0.0681, + "epoch": 0.01, + "learning_rate": 0.00029859997679240806, + "loss": 0.0759, "step": 1850 }, { - "epoch": 0.02, - "learning_rate": 0.0002969838489978595, - "loss": 0.0608, + "epoch": 0.01, + "learning_rate": 0.0002985924090993941, + "loss": 0.0636, "step": 1860 }, { - "epoch": 0.02, - "learning_rate": 0.00029696763313225656, - "loss": 0.057, + "epoch": 0.01, + "learning_rate": 0.0002985848414063801, + "loss": 0.0633, "step": 1870 }, { - "epoch": 0.02, - "learning_rate": 0.0002969514172666537, - "loss": 0.0527, + "epoch": 0.01, + "learning_rate": 0.00029857727371336606, + "loss": 0.064, "step": 1880 }, { - "epoch": 0.02, - "learning_rate": 0.00029693520140105075, - "loss": 0.0584, + "epoch": 0.01, + "learning_rate": 0.000298569706020352, + "loss": 0.0751, "step": 1890 }, { - "epoch": 0.02, - "learning_rate": 0.00029691898553544787, - "loss": 0.0569, + "epoch": 0.01, + "learning_rate": 0.000298562138327338, + "loss": 0.0611, "step": 1900 }, { - "epoch": 0.02, - "learning_rate": 0.00029690276966984493, - "loss": 0.0585, + "epoch": 0.01, + "learning_rate": 0.000298554570634324, + "loss": 0.0672, "step": 1910 }, { - "epoch": 0.02, - "learning_rate": 0.00029688655380424205, - "loss": 0.0538, + "epoch": 0.01, + "learning_rate": 0.00029854700294131, + "loss": 0.0659, "step": 1920 }, { - "epoch": 0.02, - "learning_rate": 0.0002968703379386391, - "loss": 0.0621, + "epoch": 0.01, + "learning_rate": 0.00029853943524829596, + "loss": 0.0645, "step": 1930 }, { - "epoch": 0.02, - "learning_rate": 0.00029685412207303624, - "loss": 0.0637, + "epoch": 0.01, + "learning_rate": 0.00029853186755528195, + "loss": 0.0679, "step": 1940 }, { - "epoch": 0.02, - "learning_rate": 0.0002968379062074333, - "loss": 0.0613, + "epoch": 0.01, + "learning_rate": 0.0002985242998622679, + "loss": 0.0619, "step": 1950 }, { - "epoch": 0.02, - "learning_rate": 0.0002968216903418304, - "loss": 0.0589, + "epoch": 0.01, + "learning_rate": 0.00029851673216925396, + "loss": 0.0564, "step": 1960 }, { - "epoch": 0.02, - "learning_rate": 0.0002968054744762275, - "loss": 0.0596, + "epoch": 0.01, + "learning_rate": 0.00029850916447623994, + "loss": 0.053, "step": 1970 }, { - "epoch": 0.02, - "learning_rate": 0.0002967892586106246, - "loss": 0.0617, + "epoch": 0.01, + "learning_rate": 0.0002985015967832259, + "loss": 0.0625, "step": 1980 }, { - "epoch": 0.02, - "learning_rate": 0.00029677304274502173, - "loss": 0.0621, + "epoch": 0.01, + "learning_rate": 0.0002984940290902119, + "loss": 0.063, "step": 1990 }, { - "epoch": 0.02, - "learning_rate": 0.0002967568268794188, - "loss": 0.0566, + "epoch": 0.01, + "learning_rate": 0.0002984864613971979, + "loss": 0.0629, "step": 2000 }, { - "epoch": 0.02, - "eval_cer": 0.9216580935554872, - "eval_loss": 0.04665278643369675, - "eval_runtime": 120.2206, - "eval_samples_per_second": 16.636, - "eval_steps_per_second": 4.159, + "epoch": 0.01, + "eval_cer": 0.9145119829365546, + "eval_loss": 0.04564144089818001, + "eval_runtime": 117.4132, + "eval_samples_per_second": 17.034, + "eval_steps_per_second": 4.258, "step": 2000 }, { - "epoch": 0.02, - "learning_rate": 0.00029674061101381586, - "loss": 0.0507, + "epoch": 0.01, + "learning_rate": 0.00029847889370418387, + "loss": 0.052, "step": 2010 }, { - "epoch": 0.02, - "learning_rate": 0.000296724395148213, - "loss": 0.0582, + "epoch": 0.01, + "learning_rate": 0.00029847132601116985, + "loss": 0.0563, "step": 2020 }, { - "epoch": 0.02, - "learning_rate": 0.0002967081792826101, - "loss": 0.0521, + "epoch": 0.01, + "learning_rate": 0.0002984637583181559, + "loss": 0.0644, "step": 2030 }, { - "epoch": 0.02, - "learning_rate": 0.00029669196341700716, - "loss": 0.052, + "epoch": 0.01, + "learning_rate": 0.00029845619062514187, + "loss": 0.0555, "step": 2040 }, { - "epoch": 0.02, - "learning_rate": 0.00029667574755140423, - "loss": 0.0567, + "epoch": 0.01, + "learning_rate": 0.00029844862293212785, + "loss": 0.0578, "step": 2050 }, { - "epoch": 0.02, - "learning_rate": 0.00029665953168580135, - "loss": 0.0617, + "epoch": 0.01, + "learning_rate": 0.00029844105523911383, + "loss": 0.0626, "step": 2060 }, { - "epoch": 0.02, - "learning_rate": 0.00029664331582019847, - "loss": 0.055, + "epoch": 0.01, + "learning_rate": 0.0002984334875460998, + "loss": 0.0582, "step": 2070 }, { - "epoch": 0.02, - "learning_rate": 0.00029662709995459554, - "loss": 0.0628, + "epoch": 0.01, + "learning_rate": 0.0002984259198530858, + "loss": 0.0599, "step": 2080 }, { - "epoch": 0.02, - "learning_rate": 0.00029661088408899266, - "loss": 0.0618, + "epoch": 0.01, + "learning_rate": 0.00029841835216007183, + "loss": 0.0776, "step": 2090 }, { - "epoch": 0.02, - "learning_rate": 0.0002965946682233897, - "loss": 0.0605, + "epoch": 0.01, + "learning_rate": 0.0002984107844670578, + "loss": 0.0647, "step": 2100 }, { - "epoch": 0.02, - "learning_rate": 0.00029657845235778684, - "loss": 0.0616, + "epoch": 0.01, + "learning_rate": 0.0002984032167740438, + "loss": 0.0603, "step": 2110 }, { - "epoch": 0.02, - "learning_rate": 0.00029656223649218396, - "loss": 0.0598, + "epoch": 0.01, + "learning_rate": 0.0002983956490810298, + "loss": 0.0652, "step": 2120 }, { - "epoch": 0.02, - "learning_rate": 0.000296546020626581, - "loss": 0.0571, + "epoch": 0.01, + "learning_rate": 0.00029838808138801576, + "loss": 0.0623, "step": 2130 }, { - "epoch": 0.02, - "learning_rate": 0.0002965298047609781, - "loss": 0.057, + "epoch": 0.01, + "learning_rate": 0.00029838051369500174, + "loss": 0.0579, "step": 2140 }, { - "epoch": 0.02, - "learning_rate": 0.0002965135888953752, - "loss": 0.0558, + "epoch": 0.01, + "learning_rate": 0.0002983729460019877, + "loss": 0.0577, "step": 2150 }, { - "epoch": 0.02, - "learning_rate": 0.00029649737302977233, - "loss": 0.0622, + "epoch": 0.01, + "learning_rate": 0.00029836537830897375, + "loss": 0.0613, "step": 2160 }, { - "epoch": 0.02, - "learning_rate": 0.0002964811571641694, - "loss": 0.0626, + "epoch": 0.01, + "learning_rate": 0.00029835781061595974, + "loss": 0.0641, "step": 2170 }, { - "epoch": 0.02, - "learning_rate": 0.00029646494129856646, - "loss": 0.0616, + "epoch": 0.01, + "learning_rate": 0.0002983502429229457, + "loss": 0.0597, "step": 2180 }, { - "epoch": 0.02, - "learning_rate": 0.0002964487254329636, - "loss": 0.0608, + "epoch": 0.01, + "learning_rate": 0.0002983426752299317, + "loss": 0.0632, "step": 2190 }, { - "epoch": 0.02, - "learning_rate": 0.0002964325095673607, - "loss": 0.0878, + "epoch": 0.01, + "learning_rate": 0.0002983351075369177, + "loss": 0.0626, "step": 2200 }, { - "epoch": 0.02, - "learning_rate": 0.00029641629370175777, - "loss": 0.0637, + "epoch": 0.01, + "learning_rate": 0.00029832753984390366, + "loss": 0.0596, "step": 2210 }, { - "epoch": 0.02, - "learning_rate": 0.00029640007783615483, - "loss": 0.0616, + "epoch": 0.01, + "learning_rate": 0.0002983199721508897, + "loss": 0.0594, "step": 2220 }, { - "epoch": 0.02, - "learning_rate": 0.00029638386197055195, - "loss": 0.0678, + "epoch": 0.01, + "learning_rate": 0.0002983124044578757, + "loss": 0.0628, "step": 2230 }, { - "epoch": 0.02, - "learning_rate": 0.0002963676461049491, - "loss": 0.0612, + "epoch": 0.01, + "learning_rate": 0.00029830483676486166, + "loss": 0.0622, "step": 2240 }, { - "epoch": 0.02, - "learning_rate": 0.00029635143023934614, - "loss": 0.0623, + "epoch": 0.01, + "learning_rate": 0.00029829726907184764, + "loss": 0.07, "step": 2250 }, { - "epoch": 0.02, - "learning_rate": 0.00029633521437374326, - "loss": 0.0631, + "epoch": 0.01, + "learning_rate": 0.0002982897013788336, + "loss": 0.0618, "step": 2260 }, { - "epoch": 0.02, - "learning_rate": 0.0002963189985081403, - "loss": 0.0651, + "epoch": 0.01, + "learning_rate": 0.0002982821336858196, + "loss": 0.0629, "step": 2270 }, { - "epoch": 0.02, - "learning_rate": 0.00029630278264253744, - "loss": 0.0596, + "epoch": 0.01, + "learning_rate": 0.00029827456599280564, + "loss": 0.0638, "step": 2280 }, { - "epoch": 0.02, - "learning_rate": 0.00029628656677693456, - "loss": 0.0705, + "epoch": 0.01, + "learning_rate": 0.0002982669982997916, + "loss": 0.0545, "step": 2290 }, { - "epoch": 0.02, - "learning_rate": 0.00029627035091133163, - "loss": 0.0786, + "epoch": 0.01, + "learning_rate": 0.0002982594306067776, + "loss": 0.0578, "step": 2300 }, { - "epoch": 0.02, - "learning_rate": 0.0002962541350457287, - "loss": 0.0724, + "epoch": 0.01, + "learning_rate": 0.0002982518629137636, + "loss": 0.0553, "step": 2310 }, { - "epoch": 0.03, - "learning_rate": 0.0002962379191801258, - "loss": 0.0981, + "epoch": 0.01, + "learning_rate": 0.00029824429522074957, + "loss": 0.0535, "step": 2320 }, { - "epoch": 0.03, - "learning_rate": 0.00029622170331452294, - "loss": 0.0646, + "epoch": 0.01, + "learning_rate": 0.00029823672752773555, + "loss": 0.0537, "step": 2330 }, { - "epoch": 0.03, - "learning_rate": 0.00029620548744892, - "loss": 0.0593, + "epoch": 0.01, + "learning_rate": 0.00029822915983472153, + "loss": 0.05, "step": 2340 }, { - "epoch": 0.03, - "learning_rate": 0.00029618927158331707, - "loss": 0.0509, + "epoch": 0.01, + "learning_rate": 0.00029822159214170756, + "loss": 0.0571, "step": 2350 }, { - "epoch": 0.03, - "learning_rate": 0.0002961730557177142, - "loss": 0.0699, + "epoch": 0.01, + "learning_rate": 0.00029821402444869355, + "loss": 0.0539, "step": 2360 }, { - "epoch": 0.03, - "learning_rate": 0.0002961568398521113, - "loss": 0.0686, + "epoch": 0.01, + "learning_rate": 0.00029820645675567953, + "loss": 0.0569, "step": 2370 }, { - "epoch": 0.03, - "learning_rate": 0.00029614062398650837, - "loss": 0.0529, + "epoch": 0.01, + "learning_rate": 0.0002981988890626655, + "loss": 0.0556, "step": 2380 }, { - "epoch": 0.03, - "learning_rate": 0.0002961244081209055, - "loss": 0.0706, + "epoch": 0.01, + "learning_rate": 0.0002981913213696515, + "loss": 0.0565, "step": 2390 }, { - "epoch": 0.03, - "learning_rate": 0.00029610819225530256, - "loss": 0.0655, + "epoch": 0.01, + "learning_rate": 0.00029818375367663747, + "loss": 0.0538, "step": 2400 }, { - "epoch": 0.03, - "learning_rate": 0.0002960919763896997, - "loss": 0.0581, + "epoch": 0.01, + "learning_rate": 0.0002981761859836235, + "loss": 0.0501, "step": 2410 }, { - "epoch": 0.03, - "learning_rate": 0.00029607576052409674, - "loss": 0.0604, + "epoch": 0.01, + "learning_rate": 0.0002981686182906095, + "loss": 0.0545, "step": 2420 }, { - "epoch": 0.03, - "learning_rate": 0.00029605954465849386, - "loss": 0.0583, + "epoch": 0.01, + "learning_rate": 0.00029816105059759547, + "loss": 0.0578, "step": 2430 }, { - "epoch": 0.03, - "learning_rate": 0.00029604332879289093, - "loss": 0.0576, + "epoch": 0.01, + "learning_rate": 0.00029815348290458145, + "loss": 0.052, "step": 2440 }, { - "epoch": 0.03, - "learning_rate": 0.00029602711292728805, - "loss": 0.0636, + "epoch": 0.01, + "learning_rate": 0.00029814591521156743, + "loss": 0.0606, "step": 2450 }, { - "epoch": 0.03, - "learning_rate": 0.0002960108970616851, - "loss": 0.0678, + "epoch": 0.01, + "learning_rate": 0.0002981383475185534, + "loss": 0.0619, "step": 2460 }, { - "epoch": 0.03, - "learning_rate": 0.00029599468119608223, - "loss": 0.0663, + "epoch": 0.01, + "learning_rate": 0.00029813077982553945, + "loss": 0.0514, "step": 2470 }, { - "epoch": 0.03, - "learning_rate": 0.0002959784653304793, - "loss": 0.0704, + "epoch": 0.01, + "learning_rate": 0.00029812321213252543, + "loss": 0.0585, "step": 2480 }, { - "epoch": 0.03, - "learning_rate": 0.0002959622494648764, - "loss": 0.0627, + "epoch": 0.01, + "learning_rate": 0.0002981156444395114, + "loss": 0.0566, "step": 2490 }, { - "epoch": 0.03, - "learning_rate": 0.0002959460335992735, - "loss": 0.0652, + "epoch": 0.01, + "learning_rate": 0.0002981080767464974, + "loss": 0.05, "step": 2500 }, { - "epoch": 0.03, - "learning_rate": 0.0002959298177336706, - "loss": 0.107, + "epoch": 0.01, + "learning_rate": 0.0002981005090534834, + "loss": 0.0573, "step": 2510 }, { - "epoch": 0.03, - "learning_rate": 0.00029591360186806767, - "loss": 0.0693, + "epoch": 0.01, + "learning_rate": 0.00029809294136046936, + "loss": 0.0556, "step": 2520 }, { - "epoch": 0.03, - "learning_rate": 0.0002958973860024648, - "loss": 0.0684, + "epoch": 0.01, + "learning_rate": 0.00029808537366745534, + "loss": 0.0588, "step": 2530 }, { - "epoch": 0.03, - "learning_rate": 0.00029588117013686186, - "loss": 0.0637, + "epoch": 0.01, + "learning_rate": 0.0002980778059744414, + "loss": 0.0521, "step": 2540 }, { - "epoch": 0.03, - "learning_rate": 0.000295864954271259, - "loss": 0.0638, + "epoch": 0.01, + "learning_rate": 0.00029807023828142736, + "loss": 0.0625, "step": 2550 }, { - "epoch": 0.03, - "learning_rate": 0.0002958487384056561, - "loss": 0.0628, + "epoch": 0.01, + "learning_rate": 0.00029806267058841334, + "loss": 0.077, "step": 2560 }, { - "epoch": 0.03, - "learning_rate": 0.00029583252254005316, - "loss": 0.0535, + "epoch": 0.01, + "learning_rate": 0.0002980551028953993, + "loss": 0.0558, "step": 2570 }, { - "epoch": 0.03, - "learning_rate": 0.0002958163066744502, - "loss": 0.0551, + "epoch": 0.01, + "learning_rate": 0.0002980475352023853, + "loss": 0.0603, "step": 2580 }, { - "epoch": 0.03, - "learning_rate": 0.00029580009080884735, - "loss": 0.059, + "epoch": 0.01, + "learning_rate": 0.0002980399675093713, + "loss": 0.0523, "step": 2590 }, { - "epoch": 0.03, - "learning_rate": 0.00029578387494324447, - "loss": 0.0605, + "epoch": 0.01, + "learning_rate": 0.0002980323998163573, + "loss": 0.0529, "step": 2600 }, { - "epoch": 0.03, - "learning_rate": 0.00029576765907764153, - "loss": 0.0634, + "epoch": 0.01, + "learning_rate": 0.0002980248321233433, + "loss": 0.0549, "step": 2610 }, { - "epoch": 0.03, - "learning_rate": 0.0002957514432120386, - "loss": 0.0554, + "epoch": 0.01, + "learning_rate": 0.0002980172644303293, + "loss": 0.0527, "step": 2620 }, { - "epoch": 0.03, - "learning_rate": 0.0002957352273464357, - "loss": 0.0548, + "epoch": 0.01, + "learning_rate": 0.00029800969673731526, + "loss": 0.0494, "step": 2630 }, { - "epoch": 0.03, - "learning_rate": 0.00029571901148083284, - "loss": 0.069, + "epoch": 0.01, + "learning_rate": 0.00029800212904430124, + "loss": 0.0557, "step": 2640 }, { - "epoch": 0.03, - "learning_rate": 0.0002957027956152299, - "loss": 0.0634, + "epoch": 0.01, + "learning_rate": 0.0002979945613512872, + "loss": 0.056, "step": 2650 }, { - "epoch": 0.03, - "learning_rate": 0.00029568657974962697, - "loss": 0.0618, + "epoch": 0.01, + "learning_rate": 0.0002979869936582732, + "loss": 0.0545, "step": 2660 }, { - "epoch": 0.03, - "learning_rate": 0.0002956703638840241, - "loss": 0.0575, + "epoch": 0.01, + "learning_rate": 0.00029797942596525924, + "loss": 0.0517, "step": 2670 }, { - "epoch": 0.03, - "learning_rate": 0.0002956541480184212, - "loss": 0.0509, + "epoch": 0.01, + "learning_rate": 0.0002979718582722452, + "loss": 0.052, "step": 2680 }, { - "epoch": 0.03, - "learning_rate": 0.00029563793215281833, - "loss": 0.0528, + "epoch": 0.01, + "learning_rate": 0.0002979642905792312, + "loss": 0.0551, "step": 2690 }, { - "epoch": 0.03, - "learning_rate": 0.0002956217162872154, - "loss": 0.0606, + "epoch": 0.01, + "learning_rate": 0.0002979567228862172, + "loss": 0.0493, "step": 2700 }, { - "epoch": 0.03, - "learning_rate": 0.00029560550042161246, - "loss": 0.0648, + "epoch": 0.01, + "learning_rate": 0.00029794915519320317, + "loss": 0.0518, "step": 2710 }, { - "epoch": 0.03, - "learning_rate": 0.0002955892845560096, - "loss": 0.0544, + "epoch": 0.01, + "learning_rate": 0.00029794158750018915, + "loss": 0.0528, "step": 2720 }, { - "epoch": 0.03, - "learning_rate": 0.0002955730686904067, - "loss": 0.0568, + "epoch": 0.01, + "learning_rate": 0.0002979340198071752, + "loss": 0.0472, "step": 2730 }, { - "epoch": 0.03, - "learning_rate": 0.00029555685282480376, - "loss": 0.0553, + "epoch": 0.01, + "learning_rate": 0.00029792645211416117, + "loss": 0.0541, "step": 2740 }, { - "epoch": 0.03, - "learning_rate": 0.00029554063695920083, - "loss": 0.0549, + "epoch": 0.01, + "learning_rate": 0.00029791888442114715, + "loss": 0.0504, "step": 2750 }, { - "epoch": 0.03, - "learning_rate": 0.00029552442109359795, - "loss": 0.0879, + "epoch": 0.01, + "learning_rate": 0.00029791131672813313, + "loss": 0.0628, "step": 2760 }, { - "epoch": 0.03, - "learning_rate": 0.00029550820522799507, - "loss": 0.0844, + "epoch": 0.01, + "learning_rate": 0.0002979037490351191, + "loss": 0.0572, "step": 2770 }, { - "epoch": 0.03, - "learning_rate": 0.00029549198936239214, - "loss": 0.0894, + "epoch": 0.01, + "learning_rate": 0.0002978961813421051, + "loss": 0.0541, "step": 2780 }, { - "epoch": 0.03, - "learning_rate": 0.0002954757734967892, - "loss": 0.0779, + "epoch": 0.01, + "learning_rate": 0.00029788861364909113, + "loss": 0.0556, "step": 2790 }, { - "epoch": 0.03, - "learning_rate": 0.0002954595576311863, - "loss": 0.0667, + "epoch": 0.01, + "learning_rate": 0.0002978810459560771, + "loss": 0.0557, "step": 2800 }, { - "epoch": 0.03, - "learning_rate": 0.00029544334176558344, - "loss": 0.0704, + "epoch": 0.01, + "learning_rate": 0.0002978734782630631, + "loss": 0.0725, "step": 2810 }, { - "epoch": 0.03, - "learning_rate": 0.0002954271258999805, - "loss": 0.0616, + "epoch": 0.01, + "learning_rate": 0.00029786591057004907, + "loss": 0.0681, "step": 2820 }, { - "epoch": 0.03, - "learning_rate": 0.0002954109100343776, - "loss": 0.0584, + "epoch": 0.01, + "learning_rate": 0.00029785834287703505, + "loss": 0.0572, "step": 2830 }, { - "epoch": 0.03, - "learning_rate": 0.0002953946941687747, - "loss": 0.0918, + "epoch": 0.01, + "learning_rate": 0.00029785077518402103, + "loss": 0.0536, "step": 2840 }, { - "epoch": 0.03, - "learning_rate": 0.0002953784783031718, - "loss": 0.0701, + "epoch": 0.01, + "learning_rate": 0.000297843207491007, + "loss": 0.0545, "step": 2850 }, { - "epoch": 0.03, - "learning_rate": 0.0002953622624375689, - "loss": 0.0725, + "epoch": 0.01, + "learning_rate": 0.00029783563979799305, + "loss": 0.0573, "step": 2860 }, { - "epoch": 0.03, - "learning_rate": 0.000295346046571966, - "loss": 0.0636, + "epoch": 0.01, + "learning_rate": 0.00029782807210497903, + "loss": 0.0519, "step": 2870 }, { - "epoch": 0.03, - "learning_rate": 0.00029532983070636306, - "loss": 0.0612, + "epoch": 0.01, + "learning_rate": 0.000297820504411965, + "loss": 0.0539, "step": 2880 }, { - "epoch": 0.03, - "learning_rate": 0.0002953136148407602, - "loss": 0.0669, + "epoch": 0.01, + "learning_rate": 0.000297812936718951, + "loss": 0.0611, "step": 2890 }, { - "epoch": 0.03, - "learning_rate": 0.0002952973989751573, - "loss": 0.0568, + "epoch": 0.01, + "learning_rate": 0.000297805369025937, + "loss": 0.0533, "step": 2900 }, { - "epoch": 0.03, - "learning_rate": 0.00029528118310955437, - "loss": 0.0551, + "epoch": 0.01, + "learning_rate": 0.00029779780133292296, + "loss": 0.0537, "step": 2910 }, { - "epoch": 0.03, - "learning_rate": 0.00029526496724395143, - "loss": 0.0648, + "epoch": 0.01, + "learning_rate": 0.000297790233639909, + "loss": 0.0529, "step": 2920 }, { - "epoch": 0.03, - "learning_rate": 0.00029524875137834855, - "loss": 0.061, + "epoch": 0.01, + "learning_rate": 0.000297782665946895, + "loss": 0.0539, "step": 2930 }, { - "epoch": 0.03, - "learning_rate": 0.0002952325355127457, - "loss": 0.0547, + "epoch": 0.01, + "learning_rate": 0.00029777509825388096, + "loss": 0.0511, "step": 2940 }, { - "epoch": 0.03, - "learning_rate": 0.00029521631964714274, - "loss": 0.0637, + "epoch": 0.01, + "learning_rate": 0.00029776753056086694, + "loss": 0.0568, "step": 2950 }, { - "epoch": 0.03, - "learning_rate": 0.0002952001037815398, - "loss": 0.0606, + "epoch": 0.01, + "learning_rate": 0.0002977599628678529, + "loss": 0.0534, "step": 2960 }, { - "epoch": 0.03, - "learning_rate": 0.0002951838879159369, - "loss": 0.0546, + "epoch": 0.01, + "learning_rate": 0.0002977523951748389, + "loss": 0.0514, "step": 2970 }, { - "epoch": 0.03, - "learning_rate": 0.00029516767205033404, - "loss": 0.0545, + "epoch": 0.02, + "learning_rate": 0.00029774482748182494, + "loss": 0.059, "step": 2980 }, { - "epoch": 0.03, - "learning_rate": 0.0002951514561847311, - "loss": 0.0598, + "epoch": 0.02, + "learning_rate": 0.0002977372597888109, + "loss": 0.06, "step": 2990 }, { - "epoch": 0.03, - "learning_rate": 0.00029513524031912823, - "loss": 0.0534, + "epoch": 0.02, + "learning_rate": 0.0002977296920957969, + "loss": 0.071, "step": 3000 }, { - "epoch": 0.03, - "eval_cer": 0.921613794804712, - "eval_loss": 0.04357113689184189, - "eval_runtime": 120.9669, - "eval_samples_per_second": 16.533, - "eval_steps_per_second": 4.133, + "epoch": 0.02, + "eval_cer": 0.9145605027428246, + "eval_loss": 0.04296322166919708, + "eval_runtime": 117.3539, + "eval_samples_per_second": 17.042, + "eval_steps_per_second": 4.261, "step": 3000 }, { - "epoch": 0.03, - "learning_rate": 0.0002951190244535253, - "loss": 0.0794, + "epoch": 0.02, + "learning_rate": 0.0002977221244027829, + "loss": 0.0634, "step": 3010 }, { - "epoch": 0.03, - "learning_rate": 0.0002951028085879224, - "loss": 0.0604, + "epoch": 0.02, + "learning_rate": 0.00029771455670976886, + "loss": 0.055, "step": 3020 }, { - "epoch": 0.03, - "learning_rate": 0.0002950865927223195, - "loss": 0.0512, + "epoch": 0.02, + "learning_rate": 0.00029770698901675484, + "loss": 0.0572, "step": 3030 }, { - "epoch": 0.03, - "learning_rate": 0.0002950703768567166, - "loss": 0.0569, + "epoch": 0.02, + "learning_rate": 0.0002976994213237408, + "loss": 0.0522, "step": 3040 }, { - "epoch": 0.03, - "learning_rate": 0.00029505416099111367, - "loss": 0.0507, + "epoch": 0.02, + "learning_rate": 0.00029769185363072686, + "loss": 0.0582, "step": 3050 }, { - "epoch": 0.03, - "learning_rate": 0.0002950379451255108, - "loss": 0.0652, + "epoch": 0.02, + "learning_rate": 0.00029768428593771284, + "loss": 0.0513, "step": 3060 }, { - "epoch": 0.03, - "learning_rate": 0.00029502172925990785, - "loss": 0.0545, + "epoch": 0.02, + "learning_rate": 0.0002976767182446988, + "loss": 0.0565, "step": 3070 }, { - "epoch": 0.03, - "learning_rate": 0.00029500551339430497, - "loss": 0.0499, + "epoch": 0.02, + "learning_rate": 0.0002976691505516848, + "loss": 0.0509, "step": 3080 }, { - "epoch": 0.03, - "learning_rate": 0.00029498929752870204, - "loss": 0.0525, + "epoch": 0.02, + "learning_rate": 0.0002976615828586708, + "loss": 0.0587, "step": 3090 }, { - "epoch": 0.03, - "learning_rate": 0.00029497308166309916, - "loss": 0.0599, + "epoch": 0.02, + "learning_rate": 0.00029765401516565677, + "loss": 0.0504, "step": 3100 }, { - "epoch": 0.03, - "learning_rate": 0.0002949568657974962, - "loss": 0.0604, + "epoch": 0.02, + "learning_rate": 0.0002976464474726428, + "loss": 0.053, "step": 3110 }, { - "epoch": 0.03, - "learning_rate": 0.00029494064993189334, - "loss": 0.0561, + "epoch": 0.02, + "learning_rate": 0.0002976388797796288, + "loss": 0.0575, "step": 3120 }, { - "epoch": 0.03, - "learning_rate": 0.00029492443406629046, - "loss": 0.0602, + "epoch": 0.02, + "learning_rate": 0.00029763131208661477, + "loss": 0.069, "step": 3130 }, { - "epoch": 0.03, - "learning_rate": 0.00029490821820068753, - "loss": 0.0542, + "epoch": 0.02, + "learning_rate": 0.00029762374439360075, + "loss": 0.0556, "step": 3140 }, { - "epoch": 0.03, - "learning_rate": 0.0002948920023350846, - "loss": 0.0548, + "epoch": 0.02, + "learning_rate": 0.00029761617670058673, + "loss": 0.0563, "step": 3150 }, { - "epoch": 0.03, - "learning_rate": 0.0002948757864694817, - "loss": 0.0596, + "epoch": 0.02, + "learning_rate": 0.0002976086090075727, + "loss": 0.0533, "step": 3160 }, { - "epoch": 0.03, - "learning_rate": 0.00029485957060387883, - "loss": 0.063, + "epoch": 0.02, + "learning_rate": 0.0002976010413145587, + "loss": 0.0604, "step": 3170 }, { - "epoch": 0.03, - "learning_rate": 0.0002948433547382759, - "loss": 0.0487, + "epoch": 0.02, + "learning_rate": 0.0002975934736215447, + "loss": 0.0548, "step": 3180 }, { - "epoch": 0.03, - "learning_rate": 0.00029482713887267297, - "loss": 0.0576, + "epoch": 0.02, + "learning_rate": 0.00029758590592853066, + "loss": 0.0575, "step": 3190 }, { - "epoch": 0.03, - "learning_rate": 0.0002948109230070701, - "loss": 0.0473, + "epoch": 0.02, + "learning_rate": 0.00029757833823551664, + "loss": 0.0544, "step": 3200 }, { - "epoch": 0.03, - "learning_rate": 0.0002947947071414672, - "loss": 0.0506, + "epoch": 0.02, + "learning_rate": 0.0002975707705425026, + "loss": 0.0557, "step": 3210 }, { - "epoch": 0.03, - "learning_rate": 0.00029477849127586427, - "loss": 0.0471, + "epoch": 0.02, + "learning_rate": 0.00029756320284948865, + "loss": 0.0545, "step": 3220 }, { - "epoch": 0.03, - "learning_rate": 0.00029476227541026134, - "loss": 0.0512, + "epoch": 0.02, + "learning_rate": 0.00029755563515647464, + "loss": 0.0549, "step": 3230 }, { - "epoch": 0.04, - "learning_rate": 0.00029474605954465846, - "loss": 0.0533, + "epoch": 0.02, + "learning_rate": 0.0002975480674634606, + "loss": 0.0504, "step": 3240 }, { - "epoch": 0.04, - "learning_rate": 0.0002947298436790556, - "loss": 0.0494, + "epoch": 0.02, + "learning_rate": 0.0002975404997704466, + "loss": 0.0501, "step": 3250 }, { - "epoch": 0.04, - "learning_rate": 0.00029471362781345264, - "loss": 0.0542, + "epoch": 0.02, + "learning_rate": 0.0002975329320774326, + "loss": 0.0545, "step": 3260 }, { - "epoch": 0.04, - "learning_rate": 0.00029469741194784976, - "loss": 0.0538, + "epoch": 0.02, + "learning_rate": 0.00029752536438441856, + "loss": 0.0453, "step": 3270 }, { - "epoch": 0.04, - "learning_rate": 0.00029468119608224683, - "loss": 0.0462, + "epoch": 0.02, + "learning_rate": 0.0002975177966914046, + "loss": 0.0476, "step": 3280 }, { - "epoch": 0.04, - "learning_rate": 0.00029466498021664395, - "loss": 0.058, + "epoch": 0.02, + "learning_rate": 0.0002975102289983906, + "loss": 0.0596, "step": 3290 }, { - "epoch": 0.04, - "learning_rate": 0.00029464876435104107, - "loss": 0.0448, + "epoch": 0.02, + "learning_rate": 0.00029750266130537656, + "loss": 0.06, "step": 3300 }, { - "epoch": 0.04, - "learning_rate": 0.00029463254848543813, - "loss": 0.0527, + "epoch": 0.02, + "learning_rate": 0.00029749509361236254, + "loss": 0.0556, "step": 3310 }, { - "epoch": 0.04, - "learning_rate": 0.0002946163326198352, - "loss": 0.0513, + "epoch": 0.02, + "learning_rate": 0.0002974875259193485, + "loss": 0.0532, "step": 3320 }, { - "epoch": 0.04, - "learning_rate": 0.0002946001167542323, - "loss": 0.0503, + "epoch": 0.02, + "learning_rate": 0.0002974799582263345, + "loss": 0.0508, "step": 3330 }, { - "epoch": 0.04, - "learning_rate": 0.00029458390088862944, - "loss": 0.0506, + "epoch": 0.02, + "learning_rate": 0.00029747239053332054, + "loss": 0.0553, "step": 3340 }, { - "epoch": 0.04, - "learning_rate": 0.0002945676850230265, - "loss": 0.0514, + "epoch": 0.02, + "learning_rate": 0.0002974648228403065, + "loss": 0.0571, "step": 3350 }, { - "epoch": 0.04, - "learning_rate": 0.00029455146915742357, - "loss": 0.0524, + "epoch": 0.02, + "learning_rate": 0.0002974572551472925, + "loss": 0.0518, "step": 3360 }, { - "epoch": 0.04, - "learning_rate": 0.0002945352532918207, - "loss": 0.0501, + "epoch": 0.02, + "learning_rate": 0.0002974496874542785, + "loss": 0.0596, "step": 3370 }, { - "epoch": 0.04, - "learning_rate": 0.0002945190374262178, - "loss": 0.0514, + "epoch": 0.02, + "learning_rate": 0.00029744211976126447, + "loss": 0.0473, "step": 3380 }, { - "epoch": 0.04, - "learning_rate": 0.0002945028215606149, - "loss": 0.0543, + "epoch": 0.02, + "learning_rate": 0.00029743455206825045, + "loss": 0.0541, "step": 3390 }, { - "epoch": 0.04, - "learning_rate": 0.000294486605695012, - "loss": 0.0464, + "epoch": 0.02, + "learning_rate": 0.00029742698437523643, + "loss": 0.0475, "step": 3400 }, { - "epoch": 0.04, - "learning_rate": 0.00029447038982940906, - "loss": 0.053, + "epoch": 0.02, + "learning_rate": 0.00029741941668222246, + "loss": 0.0535, "step": 3410 }, { - "epoch": 0.04, - "learning_rate": 0.0002944541739638062, - "loss": 0.0567, + "epoch": 0.02, + "learning_rate": 0.00029741184898920845, + "loss": 0.0912, "step": 3420 }, { - "epoch": 0.04, - "learning_rate": 0.00029443795809820325, - "loss": 0.0575, + "epoch": 0.02, + "learning_rate": 0.00029740428129619443, + "loss": 0.0654, "step": 3430 }, { - "epoch": 0.04, - "learning_rate": 0.00029442174223260037, - "loss": 0.0517, + "epoch": 0.02, + "learning_rate": 0.0002973967136031804, + "loss": 0.1074, "step": 3440 }, { - "epoch": 0.04, - "learning_rate": 0.00029440552636699743, - "loss": 0.0567, + "epoch": 0.02, + "learning_rate": 0.0002973891459101664, + "loss": 0.0576, "step": 3450 }, { - "epoch": 0.04, - "learning_rate": 0.00029438931050139455, - "loss": 0.0462, + "epoch": 0.02, + "learning_rate": 0.00029738157821715237, + "loss": 0.0517, "step": 3460 }, { - "epoch": 0.04, - "learning_rate": 0.0002943730946357916, - "loss": 0.0662, + "epoch": 0.02, + "learning_rate": 0.0002973740105241384, + "loss": 0.0604, "step": 3470 }, { - "epoch": 0.04, - "learning_rate": 0.00029435687877018874, - "loss": 0.0505, + "epoch": 0.02, + "learning_rate": 0.0002973664428311244, + "loss": 0.0488, "step": 3480 }, { - "epoch": 0.04, - "learning_rate": 0.0002943406629045858, - "loss": 0.0458, + "epoch": 0.02, + "learning_rate": 0.00029735887513811037, + "loss": 0.0484, "step": 3490 }, { - "epoch": 0.04, - "learning_rate": 0.0002943244470389829, - "loss": 0.0491, + "epoch": 0.02, + "learning_rate": 0.00029735130744509635, + "loss": 0.0547, "step": 3500 }, { - "epoch": 0.04, - "learning_rate": 0.00029430823117338, - "loss": 0.054, + "epoch": 0.02, + "learning_rate": 0.00029734373975208233, + "loss": 0.0545, "step": 3510 }, { - "epoch": 0.04, - "learning_rate": 0.0002942920153077771, - "loss": 0.0461, + "epoch": 0.02, + "learning_rate": 0.0002973361720590683, + "loss": 0.0482, "step": 3520 }, { - "epoch": 0.04, - "learning_rate": 0.0002942757994421742, - "loss": 0.0514, + "epoch": 0.02, + "learning_rate": 0.00029732860436605435, + "loss": 0.0554, "step": 3530 }, { - "epoch": 0.04, - "learning_rate": 0.0002942595835765713, - "loss": 0.0542, + "epoch": 0.02, + "learning_rate": 0.00029732103667304033, + "loss": 0.0561, "step": 3540 }, { - "epoch": 0.04, - "learning_rate": 0.00029424336771096836, - "loss": 0.0551, + "epoch": 0.02, + "learning_rate": 0.0002973134689800263, + "loss": 0.0556, "step": 3550 }, { - "epoch": 0.04, - "learning_rate": 0.0002942271518453655, - "loss": 0.0516, + "epoch": 0.02, + "learning_rate": 0.0002973059012870123, + "loss": 0.0797, "step": 3560 }, { - "epoch": 0.04, - "learning_rate": 0.0002942109359797626, - "loss": 0.0505, + "epoch": 0.02, + "learning_rate": 0.0002972983335939983, + "loss": 0.0609, "step": 3570 }, { - "epoch": 0.04, - "learning_rate": 0.00029419472011415966, - "loss": 0.0451, + "epoch": 0.02, + "learning_rate": 0.00029729076590098426, + "loss": 0.1602, "step": 3580 }, { - "epoch": 0.04, - "learning_rate": 0.00029417850424855673, - "loss": 0.0477, + "epoch": 0.02, + "learning_rate": 0.00029728319820797024, + "loss": 0.0635, "step": 3590 }, { - "epoch": 0.04, - "learning_rate": 0.00029416228838295385, - "loss": 0.0485, + "epoch": 0.02, + "learning_rate": 0.0002972756305149563, + "loss": 0.0597, "step": 3600 }, { - "epoch": 0.04, - "learning_rate": 0.00029414607251735097, - "loss": 0.0523, + "epoch": 0.02, + "learning_rate": 0.00029726806282194226, + "loss": 0.0554, "step": 3610 }, { - "epoch": 0.04, - "learning_rate": 0.00029412985665174803, - "loss": 0.0448, + "epoch": 0.02, + "learning_rate": 0.00029726049512892824, + "loss": 0.0558, "step": 3620 }, { - "epoch": 0.04, - "learning_rate": 0.00029411364078614515, - "loss": 0.0512, + "epoch": 0.02, + "learning_rate": 0.0002972529274359142, + "loss": 0.0559, "step": 3630 }, { - "epoch": 0.04, - "learning_rate": 0.0002940974249205422, - "loss": 0.0461, + "epoch": 0.02, + "learning_rate": 0.0002972453597429002, + "loss": 0.0551, "step": 3640 }, { - "epoch": 0.04, - "learning_rate": 0.00029408120905493934, - "loss": 0.0471, + "epoch": 0.02, + "learning_rate": 0.0002972377920498862, + "loss": 0.0566, "step": 3650 }, { - "epoch": 0.04, - "learning_rate": 0.0002940649931893364, - "loss": 0.0474, + "epoch": 0.02, + "learning_rate": 0.0002972302243568722, + "loss": 0.0545, "step": 3660 }, { - "epoch": 0.04, - "learning_rate": 0.0002940487773237335, - "loss": 0.0832, + "epoch": 0.02, + "learning_rate": 0.0002972226566638582, + "loss": 0.0498, "step": 3670 }, { - "epoch": 0.04, - "learning_rate": 0.0002940325614581306, - "loss": 0.0521, + "epoch": 0.02, + "learning_rate": 0.0002972150889708442, + "loss": 0.052, "step": 3680 }, { - "epoch": 0.04, - "learning_rate": 0.0002940163455925277, - "loss": 0.0659, + "epoch": 0.02, + "learning_rate": 0.00029720752127783016, + "loss": 0.0546, "step": 3690 }, { - "epoch": 0.04, - "learning_rate": 0.00029400012972692483, - "loss": 0.0498, + "epoch": 0.02, + "learning_rate": 0.00029719995358481614, + "loss": 0.0547, "step": 3700 }, { - "epoch": 0.04, - "learning_rate": 0.0002939839138613219, - "loss": 0.0465, + "epoch": 0.02, + "learning_rate": 0.0002971923858918021, + "loss": 0.0474, "step": 3710 }, { - "epoch": 0.04, - "learning_rate": 0.00029396769799571896, - "loss": 0.0456, + "epoch": 0.02, + "learning_rate": 0.0002971848181987881, + "loss": 0.0519, "step": 3720 }, { - "epoch": 0.04, - "learning_rate": 0.0002939514821301161, - "loss": 0.0468, + "epoch": 0.02, + "learning_rate": 0.00029717725050577414, + "loss": 0.0477, "step": 3730 }, { - "epoch": 0.04, - "learning_rate": 0.0002939352662645132, - "loss": 0.0467, + "epoch": 0.02, + "learning_rate": 0.0002971696828127601, + "loss": 0.0469, "step": 3740 }, { - "epoch": 0.04, - "learning_rate": 0.00029391905039891027, - "loss": 0.0446, + "epoch": 0.02, + "learning_rate": 0.0002971621151197461, + "loss": 0.0513, "step": 3750 }, { - "epoch": 0.04, - "learning_rate": 0.00029390283453330733, - "loss": 0.0486, + "epoch": 0.02, + "learning_rate": 0.0002971545474267321, + "loss": 0.0462, "step": 3760 }, { - "epoch": 0.04, - "learning_rate": 0.00029388661866770445, - "loss": 0.0536, + "epoch": 0.02, + "learning_rate": 0.00029714697973371807, + "loss": 0.0553, "step": 3770 }, { - "epoch": 0.04, - "learning_rate": 0.00029387040280210157, - "loss": 0.0519, + "epoch": 0.02, + "learning_rate": 0.00029713941204070405, + "loss": 0.0615, "step": 3780 }, { - "epoch": 0.04, - "learning_rate": 0.00029385418693649864, - "loss": 0.0512, + "epoch": 0.02, + "learning_rate": 0.0002971318443476901, + "loss": 0.0498, "step": 3790 }, { - "epoch": 0.04, - "learning_rate": 0.0002938379710708957, - "loss": 0.0444, + "epoch": 0.02, + "learning_rate": 0.00029712427665467607, + "loss": 0.0577, "step": 3800 }, { - "epoch": 0.04, - "learning_rate": 0.0002938217552052928, - "loss": 0.0525, + "epoch": 0.02, + "learning_rate": 0.00029711670896166205, + "loss": 0.0521, "step": 3810 }, { - "epoch": 0.04, - "learning_rate": 0.00029380553933968994, - "loss": 0.0557, + "epoch": 0.02, + "learning_rate": 0.00029710914126864803, + "loss": 0.0528, "step": 3820 }, { - "epoch": 0.04, - "learning_rate": 0.000293789323474087, - "loss": 0.0452, + "epoch": 0.02, + "learning_rate": 0.000297101573575634, + "loss": 0.0476, "step": 3830 }, { - "epoch": 0.04, - "learning_rate": 0.00029377310760848413, - "loss": 0.0489, + "epoch": 0.02, + "learning_rate": 0.00029709400588262, + "loss": 0.0474, "step": 3840 }, { - "epoch": 0.04, - "learning_rate": 0.0002937568917428812, - "loss": 0.0488, + "epoch": 0.02, + "learning_rate": 0.00029708643818960603, + "loss": 0.0548, "step": 3850 }, { - "epoch": 0.04, - "learning_rate": 0.0002937406758772783, - "loss": 0.0529, + "epoch": 0.02, + "learning_rate": 0.000297078870496592, + "loss": 0.0538, "step": 3860 }, { - "epoch": 0.04, - "learning_rate": 0.00029372446001167543, - "loss": 0.0482, + "epoch": 0.02, + "learning_rate": 0.000297071302803578, + "loss": 0.0453, "step": 3870 }, { - "epoch": 0.04, - "learning_rate": 0.0002937082441460725, - "loss": 0.049, + "epoch": 0.02, + "learning_rate": 0.00029706373511056397, + "loss": 0.052, "step": 3880 }, { - "epoch": 0.04, - "learning_rate": 0.00029369202828046957, - "loss": 0.0559, + "epoch": 0.02, + "learning_rate": 0.00029705616741754995, + "loss": 0.0486, "step": 3890 }, { - "epoch": 0.04, - "learning_rate": 0.0002936758124148667, - "loss": 0.0563, + "epoch": 0.02, + "learning_rate": 0.00029704859972453593, + "loss": 0.0462, "step": 3900 }, { - "epoch": 0.04, - "learning_rate": 0.0002936595965492638, - "loss": 0.0492, + "epoch": 0.02, + "learning_rate": 0.0002970410320315219, + "loss": 0.0425, "step": 3910 }, { - "epoch": 0.04, - "learning_rate": 0.00029364338068366087, - "loss": 0.0468, + "epoch": 0.02, + "learning_rate": 0.00029703346433850795, + "loss": 0.0561, "step": 3920 }, { - "epoch": 0.04, - "learning_rate": 0.00029362716481805794, - "loss": 0.0459, + "epoch": 0.02, + "learning_rate": 0.00029702589664549393, + "loss": 0.0472, "step": 3930 }, { - "epoch": 0.04, - "learning_rate": 0.00029361094895245506, - "loss": 0.051, + "epoch": 0.02, + "learning_rate": 0.0002970183289524799, + "loss": 0.0526, "step": 3940 }, { - "epoch": 0.04, - "learning_rate": 0.0002935947330868522, - "loss": 0.0491, + "epoch": 0.02, + "learning_rate": 0.0002970107612594659, + "loss": 0.047, "step": 3950 }, { - "epoch": 0.04, - "learning_rate": 0.00029357851722124924, - "loss": 0.049, + "epoch": 0.02, + "learning_rate": 0.0002970031935664519, + "loss": 0.051, "step": 3960 }, { - "epoch": 0.04, - "learning_rate": 0.0002935623013556463, - "loss": 0.0447, + "epoch": 0.02, + "learning_rate": 0.00029699562587343786, + "loss": 0.0456, "step": 3970 }, { - "epoch": 0.04, - "learning_rate": 0.00029354608549004343, - "loss": 0.0549, + "epoch": 0.02, + "learning_rate": 0.0002969880581804239, + "loss": 0.0425, "step": 3980 }, { - "epoch": 0.04, - "learning_rate": 0.00029352986962444055, - "loss": 0.059, + "epoch": 0.02, + "learning_rate": 0.0002969804904874099, + "loss": 0.0543, "step": 3990 }, { - "epoch": 0.04, - "learning_rate": 0.0002935136537588376, - "loss": 0.0461, + "epoch": 0.02, + "learning_rate": 0.00029697292279439586, + "loss": 0.0542, "step": 4000 }, { - "epoch": 0.04, - "eval_cer": 0.9216346412756651, - "eval_loss": 0.03921321779489517, - "eval_runtime": 120.7862, - "eval_samples_per_second": 16.558, - "eval_steps_per_second": 4.14, + "epoch": 0.02, + "eval_cer": 0.9145430356125674, + "eval_loss": 0.038954902440309525, + "eval_runtime": 117.4435, + "eval_samples_per_second": 17.029, + "eval_steps_per_second": 4.257, "step": 4000 }, { - "epoch": 0.04, - "learning_rate": 0.00029349743789323473, - "loss": 0.0531, + "epoch": 0.02, + "learning_rate": 0.00029696535510138184, + "loss": 0.0502, "step": 4010 }, { - "epoch": 0.04, - "learning_rate": 0.0002934812220276318, - "loss": 0.0441, + "epoch": 0.02, + "learning_rate": 0.0002969577874083678, + "loss": 0.0453, "step": 4020 }, { - "epoch": 0.04, - "learning_rate": 0.0002934650061620289, - "loss": 0.0453, + "epoch": 0.02, + "learning_rate": 0.0002969502197153538, + "loss": 0.0519, "step": 4030 }, { - "epoch": 0.04, - "learning_rate": 0.000293448790296426, - "loss": 0.0461, + "epoch": 0.02, + "learning_rate": 0.00029694265202233984, + "loss": 0.0464, "step": 4040 }, { - "epoch": 0.04, - "learning_rate": 0.0002934325744308231, - "loss": 0.0509, + "epoch": 0.02, + "learning_rate": 0.0002969350843293258, + "loss": 0.0494, "step": 4050 }, { - "epoch": 0.04, - "learning_rate": 0.00029341635856522017, - "loss": 0.0471, + "epoch": 0.02, + "learning_rate": 0.0002969275166363118, + "loss": 0.0455, "step": 4060 }, { - "epoch": 0.04, - "learning_rate": 0.0002934001426996173, - "loss": 0.0445, + "epoch": 0.02, + "learning_rate": 0.0002969199489432978, + "loss": 0.0543, "step": 4070 }, { - "epoch": 0.04, - "learning_rate": 0.00029338392683401436, - "loss": 0.0531, + "epoch": 0.02, + "learning_rate": 0.00029691238125028376, + "loss": 0.0464, "step": 4080 }, { - "epoch": 0.04, - "learning_rate": 0.0002933677109684115, - "loss": 0.0472, + "epoch": 0.02, + "learning_rate": 0.00029690481355726974, + "loss": 0.0518, "step": 4090 }, { - "epoch": 0.04, - "learning_rate": 0.00029335149510280854, - "loss": 0.041, + "epoch": 0.02, + "learning_rate": 0.0002968972458642557, + "loss": 0.0526, "step": 4100 }, { - "epoch": 0.04, - "learning_rate": 0.00029333527923720566, - "loss": 0.0445, + "epoch": 0.02, + "learning_rate": 0.00029688967817124176, + "loss": 0.0541, "step": 4110 }, { - "epoch": 0.04, - "learning_rate": 0.0002933190633716027, - "loss": 0.0518, + "epoch": 0.02, + "learning_rate": 0.00029688211047822774, + "loss": 0.0511, "step": 4120 }, { - "epoch": 0.04, - "learning_rate": 0.00029330284750599985, - "loss": 0.0531, + "epoch": 0.02, + "learning_rate": 0.0002968745427852137, + "loss": 0.0495, "step": 4130 }, { - "epoch": 0.04, - "learning_rate": 0.00029328663164039697, - "loss": 0.0456, + "epoch": 0.02, + "learning_rate": 0.0002968669750921997, + "loss": 0.0424, "step": 4140 }, { - "epoch": 0.04, - "learning_rate": 0.00029327041577479403, - "loss": 0.0544, + "epoch": 0.02, + "learning_rate": 0.0002968594073991857, + "loss": 0.0516, "step": 4150 }, { - "epoch": 0.04, - "learning_rate": 0.0002932541999091911, - "loss": 0.0403, + "epoch": 0.02, + "learning_rate": 0.00029685183970617167, + "loss": 0.0454, "step": 4160 }, { - "epoch": 0.05, - "learning_rate": 0.0002932379840435882, - "loss": 0.0537, + "epoch": 0.02, + "learning_rate": 0.0002968442720131577, + "loss": 0.0522, "step": 4170 }, { - "epoch": 0.05, - "learning_rate": 0.00029322176817798534, - "loss": 0.0502, + "epoch": 0.02, + "learning_rate": 0.0002968367043201437, + "loss": 0.0516, "step": 4180 }, { - "epoch": 0.05, - "learning_rate": 0.0002932055523123824, - "loss": 0.0509, + "epoch": 0.02, + "learning_rate": 0.00029682913662712967, + "loss": 0.0462, "step": 4190 }, { - "epoch": 0.05, - "learning_rate": 0.00029318933644677947, - "loss": 0.0528, + "epoch": 0.02, + "learning_rate": 0.00029682156893411565, + "loss": 0.0546, "step": 4200 }, { - "epoch": 0.05, - "learning_rate": 0.0002931731205811766, - "loss": 0.0469, + "epoch": 0.02, + "learning_rate": 0.00029681400124110163, + "loss": 0.0444, "step": 4210 }, { - "epoch": 0.05, - "learning_rate": 0.0002931569047155737, - "loss": 0.0511, + "epoch": 0.02, + "learning_rate": 0.0002968064335480876, + "loss": 0.0504, "step": 4220 }, { - "epoch": 0.05, - "learning_rate": 0.0002931406888499708, - "loss": 0.0527, + "epoch": 0.02, + "learning_rate": 0.0002967988658550736, + "loss": 0.0566, "step": 4230 }, { - "epoch": 0.05, - "learning_rate": 0.00029312447298436784, - "loss": 0.0511, + "epoch": 0.02, + "learning_rate": 0.00029679129816205963, + "loss": 0.0473, "step": 4240 }, { - "epoch": 0.05, - "learning_rate": 0.00029310825711876496, - "loss": 0.0454, + "epoch": 0.02, + "learning_rate": 0.0002967837304690456, + "loss": 0.048, "step": 4250 }, { - "epoch": 0.05, - "learning_rate": 0.0002930920412531621, - "loss": 0.0483, + "epoch": 0.02, + "learning_rate": 0.0002967761627760316, + "loss": 0.049, "step": 4260 }, { - "epoch": 0.05, - "learning_rate": 0.00029307582538755914, - "loss": 0.049, + "epoch": 0.02, + "learning_rate": 0.0002967685950830176, + "loss": 0.0518, "step": 4270 }, { - "epoch": 0.05, - "learning_rate": 0.00029305960952195626, - "loss": 0.0488, + "epoch": 0.02, + "learning_rate": 0.00029676102739000355, + "loss": 0.0496, "step": 4280 }, { - "epoch": 0.05, - "learning_rate": 0.00029304339365635333, - "loss": 0.0539, + "epoch": 0.02, + "learning_rate": 0.00029675345969698954, + "loss": 0.0528, "step": 4290 }, { - "epoch": 0.05, - "learning_rate": 0.00029302717779075045, - "loss": 0.059, + "epoch": 0.02, + "learning_rate": 0.00029674589200397557, + "loss": 0.0442, "step": 4300 }, { - "epoch": 0.05, - "learning_rate": 0.00029301096192514757, - "loss": 0.0471, + "epoch": 0.02, + "learning_rate": 0.00029673832431096155, + "loss": 0.0463, "step": 4310 }, { - "epoch": 0.05, - "learning_rate": 0.00029299474605954464, - "loss": 0.0492, + "epoch": 0.02, + "learning_rate": 0.00029673075661794753, + "loss": 0.0494, "step": 4320 }, { - "epoch": 0.05, - "learning_rate": 0.0002929785301939417, - "loss": 0.0466, + "epoch": 0.02, + "learning_rate": 0.0002967231889249335, + "loss": 0.0448, "step": 4330 }, { - "epoch": 0.05, - "learning_rate": 0.0002929623143283388, - "loss": 0.0499, + "epoch": 0.02, + "learning_rate": 0.0002967156212319195, + "loss": 0.0654, "step": 4340 }, { - "epoch": 0.05, - "learning_rate": 0.00029294609846273594, - "loss": 0.0442, + "epoch": 0.02, + "learning_rate": 0.0002967080535389055, + "loss": 0.0627, "step": 4350 }, { - "epoch": 0.05, - "learning_rate": 0.000292929882597133, - "loss": 0.0472, + "epoch": 0.02, + "learning_rate": 0.0002967004858458915, + "loss": 0.0456, "step": 4360 }, { - "epoch": 0.05, - "learning_rate": 0.00029291366673153007, - "loss": 0.0456, + "epoch": 0.02, + "learning_rate": 0.0002966929181528775, + "loss": 0.0504, "step": 4370 }, { - "epoch": 0.05, - "learning_rate": 0.0002928974508659272, - "loss": 0.0503, + "epoch": 0.02, + "learning_rate": 0.0002966853504598635, + "loss": 0.046, "step": 4380 }, { - "epoch": 0.05, - "learning_rate": 0.0002928812350003243, - "loss": 0.0479, + "epoch": 0.02, + "learning_rate": 0.00029667778276684946, + "loss": 0.046, "step": 4390 }, { - "epoch": 0.05, - "learning_rate": 0.0002928650191347214, - "loss": 0.0441, + "epoch": 0.02, + "learning_rate": 0.00029667021507383544, + "loss": 0.0498, "step": 4400 }, { - "epoch": 0.05, - "learning_rate": 0.0002928488032691185, - "loss": 0.048, + "epoch": 0.02, + "learning_rate": 0.0002966626473808214, + "loss": 0.0465, "step": 4410 }, { - "epoch": 0.05, - "learning_rate": 0.00029283258740351556, - "loss": 0.04, + "epoch": 0.02, + "learning_rate": 0.0002966550796878074, + "loss": 0.0443, "step": 4420 }, { - "epoch": 0.05, - "learning_rate": 0.0002928163715379127, - "loss": 0.0527, + "epoch": 0.02, + "learning_rate": 0.0002966475119947934, + "loss": 0.0482, "step": 4430 }, { - "epoch": 0.05, - "learning_rate": 0.0002928001556723098, - "loss": 0.046, + "epoch": 0.02, + "learning_rate": 0.00029663994430177937, + "loss": 0.0453, "step": 4440 }, { - "epoch": 0.05, - "learning_rate": 0.00029278393980670687, - "loss": 0.0489, + "epoch": 0.02, + "learning_rate": 0.00029663237660876535, + "loss": 0.0473, "step": 4450 }, { - "epoch": 0.05, - "learning_rate": 0.00029276772394110393, - "loss": 0.0411, + "epoch": 0.02, + "learning_rate": 0.00029662480891575133, + "loss": 0.0463, "step": 4460 }, { - "epoch": 0.05, - "learning_rate": 0.00029275150807550105, - "loss": 0.0473, + "epoch": 0.02, + "learning_rate": 0.00029661724122273736, + "loss": 0.0426, "step": 4470 }, { - "epoch": 0.05, - "learning_rate": 0.0002927352922098982, - "loss": 0.0436, + "epoch": 0.02, + "learning_rate": 0.00029660967352972335, + "loss": 0.045, "step": 4480 }, { - "epoch": 0.05, - "learning_rate": 0.00029271907634429524, - "loss": 0.0471, + "epoch": 0.02, + "learning_rate": 0.00029660210583670933, + "loss": 0.0493, "step": 4490 }, { - "epoch": 0.05, - "learning_rate": 0.0002927028604786923, - "loss": 0.0477, + "epoch": 0.02, + "learning_rate": 0.0002965945381436953, + "loss": 0.0462, "step": 4500 }, { - "epoch": 0.05, - "learning_rate": 0.0002926866446130894, - "loss": 0.0545, + "epoch": 0.02, + "learning_rate": 0.0002965869704506813, + "loss": 0.047, "step": 4510 }, { - "epoch": 0.05, - "learning_rate": 0.00029267042874748654, - "loss": 0.0489, + "epoch": 0.02, + "learning_rate": 0.00029657940275766727, + "loss": 0.048, "step": 4520 }, { - "epoch": 0.05, - "learning_rate": 0.0002926542128818836, - "loss": 0.0493, + "epoch": 0.02, + "learning_rate": 0.0002965718350646533, + "loss": 0.0553, "step": 4530 }, { - "epoch": 0.05, - "learning_rate": 0.0002926379970162807, - "loss": 0.049, + "epoch": 0.02, + "learning_rate": 0.0002965642673716393, + "loss": 0.0486, "step": 4540 }, { - "epoch": 0.05, - "learning_rate": 0.0002926217811506778, - "loss": 0.0423, + "epoch": 0.02, + "learning_rate": 0.00029655669967862527, + "loss": 0.0472, "step": 4550 }, { - "epoch": 0.05, - "learning_rate": 0.0002926055652850749, - "loss": 0.0466, + "epoch": 0.02, + "learning_rate": 0.00029654913198561125, + "loss": 0.0441, "step": 4560 }, { - "epoch": 0.05, - "learning_rate": 0.000292589349419472, - "loss": 0.051, + "epoch": 0.02, + "learning_rate": 0.00029654156429259723, + "loss": 0.0496, "step": 4570 }, { - "epoch": 0.05, - "learning_rate": 0.0002925731335538691, - "loss": 0.0509, + "epoch": 0.02, + "learning_rate": 0.0002965339965995832, + "loss": 0.0417, "step": 4580 }, { - "epoch": 0.05, - "learning_rate": 0.00029255691768826617, - "loss": 0.0412, + "epoch": 0.02, + "learning_rate": 0.00029652642890656925, + "loss": 0.0459, "step": 4590 }, { - "epoch": 0.05, - "learning_rate": 0.0002925407018226633, - "loss": 0.0459, + "epoch": 0.02, + "learning_rate": 0.00029651886121355523, + "loss": 0.0412, "step": 4600 }, { - "epoch": 0.05, - "learning_rate": 0.00029252448595706035, - "loss": 0.0398, + "epoch": 0.02, + "learning_rate": 0.0002965112935205412, + "loss": 0.0461, "step": 4610 }, { - "epoch": 0.05, - "learning_rate": 0.00029250827009145747, - "loss": 0.0373, + "epoch": 0.02, + "learning_rate": 0.0002965037258275272, + "loss": 0.0502, "step": 4620 }, { - "epoch": 0.05, - "learning_rate": 0.00029249205422585454, - "loss": 0.0445, + "epoch": 0.02, + "learning_rate": 0.0002964961581345132, + "loss": 0.0614, "step": 4630 }, { - "epoch": 0.05, - "learning_rate": 0.00029247583836025166, - "loss": 0.0438, + "epoch": 0.02, + "learning_rate": 0.00029648859044149916, + "loss": 0.0506, "step": 4640 }, { - "epoch": 0.05, - "learning_rate": 0.0002924596224946487, - "loss": 0.0398, + "epoch": 0.02, + "learning_rate": 0.00029648102274848514, + "loss": 0.0487, "step": 4650 }, { - "epoch": 0.05, - "learning_rate": 0.00029244340662904584, - "loss": 0.0407, + "epoch": 0.02, + "learning_rate": 0.0002964734550554712, + "loss": 0.0505, "step": 4660 }, { - "epoch": 0.05, - "learning_rate": 0.0002924271907634429, - "loss": 0.0467, + "epoch": 0.02, + "learning_rate": 0.00029646588736245716, + "loss": 0.0527, "step": 4670 }, { - "epoch": 0.05, - "learning_rate": 0.00029241097489784003, - "loss": 0.0414, + "epoch": 0.02, + "learning_rate": 0.00029645831966944314, + "loss": 0.0573, "step": 4680 }, { - "epoch": 0.05, - "learning_rate": 0.0002923947590322371, - "loss": 0.0451, + "epoch": 0.02, + "learning_rate": 0.0002964507519764291, + "loss": 0.0635, "step": 4690 }, { - "epoch": 0.05, - "learning_rate": 0.0002923785431666342, - "loss": 0.0493, + "epoch": 0.02, + "learning_rate": 0.0002964431842834151, + "loss": 0.0447, "step": 4700 }, { - "epoch": 0.05, - "learning_rate": 0.00029236232730103133, - "loss": 0.0478, + "epoch": 0.02, + "learning_rate": 0.0002964356165904011, + "loss": 0.0517, "step": 4710 }, { - "epoch": 0.05, - "learning_rate": 0.0002923461114354284, - "loss": 0.0434, + "epoch": 0.02, + "learning_rate": 0.0002964280488973871, + "loss": 0.0665, "step": 4720 }, { - "epoch": 0.05, - "learning_rate": 0.00029232989556982546, - "loss": 0.0426, + "epoch": 0.02, + "learning_rate": 0.0002964204812043731, + "loss": 0.0506, "step": 4730 }, { - "epoch": 0.05, - "learning_rate": 0.0002923136797042226, - "loss": 0.042, + "epoch": 0.02, + "learning_rate": 0.0002964129135113591, + "loss": 0.0562, "step": 4740 }, { - "epoch": 0.05, - "learning_rate": 0.0002922974638386197, - "loss": 0.045, + "epoch": 0.02, + "learning_rate": 0.00029640534581834506, + "loss": 0.052, "step": 4750 }, { - "epoch": 0.05, - "learning_rate": 0.00029228124797301677, - "loss": 0.0395, + "epoch": 0.02, + "learning_rate": 0.00029639777812533104, + "loss": 0.0505, "step": 4760 }, { - "epoch": 0.05, - "learning_rate": 0.00029226503210741384, - "loss": 0.0432, + "epoch": 0.02, + "learning_rate": 0.000296390210432317, + "loss": 0.0509, "step": 4770 }, { - "epoch": 0.05, - "learning_rate": 0.00029224881624181096, - "loss": 0.0433, + "epoch": 0.02, + "learning_rate": 0.000296382642739303, + "loss": 0.046, "step": 4780 }, { - "epoch": 0.05, - "learning_rate": 0.0002922326003762081, - "loss": 0.0499, + "epoch": 0.02, + "learning_rate": 0.00029637507504628904, + "loss": 0.0936, "step": 4790 }, { - "epoch": 0.05, - "learning_rate": 0.00029221638451060514, - "loss": 0.0486, + "epoch": 0.02, + "learning_rate": 0.000296367507353275, + "loss": 0.0593, "step": 4800 }, { - "epoch": 0.05, - "learning_rate": 0.0002922001686450022, - "loss": 0.0388, + "epoch": 0.02, + "learning_rate": 0.000296359939660261, + "loss": 0.0514, "step": 4810 }, { - "epoch": 0.05, - "learning_rate": 0.0002921839527793993, - "loss": 0.0411, + "epoch": 0.02, + "learning_rate": 0.000296352371967247, + "loss": 0.0491, "step": 4820 }, { - "epoch": 0.05, - "learning_rate": 0.00029216773691379645, - "loss": 0.0402, + "epoch": 0.02, + "learning_rate": 0.00029634480427423297, + "loss": 0.0521, "step": 4830 }, { - "epoch": 0.05, - "learning_rate": 0.0002921515210481935, - "loss": 0.0417, + "epoch": 0.02, + "learning_rate": 0.00029633723658121895, + "loss": 0.0521, "step": 4840 }, { - "epoch": 0.05, - "learning_rate": 0.00029213530518259063, - "loss": 0.0431, + "epoch": 0.02, + "learning_rate": 0.000296329668888205, + "loss": 0.0527, "step": 4850 }, { - "epoch": 0.05, - "learning_rate": 0.0002921190893169877, - "loss": 0.0408, + "epoch": 0.02, + "learning_rate": 0.00029632210119519097, + "loss": 0.0649, "step": 4860 }, { - "epoch": 0.05, - "learning_rate": 0.0002921028734513848, - "loss": 0.0398, + "epoch": 0.02, + "learning_rate": 0.00029631453350217695, + "loss": 0.0527, "step": 4870 }, { - "epoch": 0.05, - "learning_rate": 0.00029208665758578194, - "loss": 0.0566, + "epoch": 0.02, + "learning_rate": 0.00029630696580916293, + "loss": 0.0539, "step": 4880 }, { - "epoch": 0.05, - "learning_rate": 0.000292070441720179, - "loss": 0.0453, + "epoch": 0.02, + "learning_rate": 0.0002962993981161489, + "loss": 0.0478, "step": 4890 }, { - "epoch": 0.05, - "learning_rate": 0.00029205422585457607, - "loss": 0.044, + "epoch": 0.02, + "learning_rate": 0.0002962918304231349, + "loss": 0.0465, "step": 4900 }, { - "epoch": 0.05, - "learning_rate": 0.0002920380099889732, - "loss": 0.0461, + "epoch": 0.02, + "learning_rate": 0.00029628426273012093, + "loss": 0.0743, "step": 4910 }, { - "epoch": 0.05, - "learning_rate": 0.0002920217941233703, - "loss": 0.0415, + "epoch": 0.02, + "learning_rate": 0.0002962766950371069, + "loss": 0.073, "step": 4920 }, { - "epoch": 0.05, - "learning_rate": 0.0002920055782577674, - "loss": 0.0386, + "epoch": 0.02, + "learning_rate": 0.0002962691273440929, + "loss": 0.0692, "step": 4930 }, { - "epoch": 0.05, - "learning_rate": 0.00029198936239216444, - "loss": 0.0555, + "epoch": 0.02, + "learning_rate": 0.00029626155965107887, + "loss": 0.044, "step": 4940 }, { - "epoch": 0.05, - "learning_rate": 0.00029197314652656156, - "loss": 0.046, + "epoch": 0.02, + "learning_rate": 0.00029625399195806485, + "loss": 0.0441, "step": 4950 }, { - "epoch": 0.05, - "learning_rate": 0.0002919569306609587, - "loss": 0.0481, + "epoch": 0.03, + "learning_rate": 0.00029624642426505083, + "loss": 0.0501, "step": 4960 }, { - "epoch": 0.05, - "learning_rate": 0.00029194071479535574, - "loss": 0.0429, + "epoch": 0.03, + "learning_rate": 0.0002962388565720368, + "loss": 0.0458, "step": 4970 }, { - "epoch": 0.05, - "learning_rate": 0.0002919244989297528, - "loss": 0.0439, + "epoch": 0.03, + "learning_rate": 0.00029623128887902285, + "loss": 0.0422, "step": 4980 }, { - "epoch": 0.05, - "learning_rate": 0.00029190828306414993, - "loss": 0.0493, + "epoch": 0.03, + "learning_rate": 0.00029622372118600883, + "loss": 0.0495, "step": 4990 }, { - "epoch": 0.05, - "learning_rate": 0.00029189206719854705, - "loss": 0.0416, + "epoch": 0.03, + "learning_rate": 0.0002962161534929948, + "loss": 0.0464, "step": 5000 }, { - "epoch": 0.05, - "eval_cer": 0.9216007657603663, - "eval_loss": 0.03539329394698143, - "eval_runtime": 120.0814, - "eval_samples_per_second": 16.655, - "eval_steps_per_second": 4.164, + "epoch": 0.03, + "eval_cer": 0.9145071309559275, + "eval_loss": 0.03470829501748085, + "eval_runtime": 117.4598, + "eval_samples_per_second": 17.027, + "eval_steps_per_second": 4.257, "step": 5000 }, { - "epoch": 0.05, - "learning_rate": 0.0002918758513329441, - "loss": 0.0472, + "epoch": 0.03, + "learning_rate": 0.0002962085857999808, + "loss": 0.0427, "step": 5010 }, { - "epoch": 0.05, - "learning_rate": 0.00029185963546734124, - "loss": 0.0482, + "epoch": 0.03, + "learning_rate": 0.0002962010181069668, + "loss": 0.0465, "step": 5020 }, { - "epoch": 0.05, - "learning_rate": 0.0002918434196017383, - "loss": 0.0447, + "epoch": 0.03, + "learning_rate": 0.00029619345041395276, + "loss": 0.0453, "step": 5030 }, { - "epoch": 0.05, - "learning_rate": 0.0002918272037361354, - "loss": 0.0431, + "epoch": 0.03, + "learning_rate": 0.0002961858827209388, + "loss": 0.0415, "step": 5040 }, { - "epoch": 0.05, - "learning_rate": 0.00029181098787053254, - "loss": 0.0441, + "epoch": 0.03, + "learning_rate": 0.0002961783150279248, + "loss": 0.0476, "step": 5050 }, { - "epoch": 0.05, - "learning_rate": 0.0002917947720049296, - "loss": 0.0499, + "epoch": 0.03, + "learning_rate": 0.00029617074733491076, + "loss": 0.0447, "step": 5060 }, { - "epoch": 0.05, - "learning_rate": 0.00029177855613932667, - "loss": 0.0428, + "epoch": 0.03, + "learning_rate": 0.00029616317964189674, + "loss": 0.0512, "step": 5070 }, { - "epoch": 0.05, - "learning_rate": 0.0002917623402737238, - "loss": 0.0488, + "epoch": 0.03, + "learning_rate": 0.0002961556119488827, + "loss": 0.0486, "step": 5080 }, { - "epoch": 0.06, - "learning_rate": 0.0002917461244081209, - "loss": 0.0466, + "epoch": 0.03, + "learning_rate": 0.0002961480442558687, + "loss": 0.0486, "step": 5090 }, { - "epoch": 0.06, - "learning_rate": 0.000291729908542518, - "loss": 0.0459, + "epoch": 0.03, + "learning_rate": 0.00029614047656285474, + "loss": 0.0493, "step": 5100 }, { - "epoch": 0.06, - "learning_rate": 0.00029171369267691504, - "loss": 0.0492, + "epoch": 0.03, + "learning_rate": 0.0002961329088698407, + "loss": 0.0504, "step": 5110 }, { - "epoch": 0.06, - "learning_rate": 0.00029169747681131216, - "loss": 0.0482, + "epoch": 0.03, + "learning_rate": 0.0002961253411768267, + "loss": 0.0528, "step": 5120 }, { - "epoch": 0.06, - "learning_rate": 0.0002916812609457093, - "loss": 0.0454, + "epoch": 0.03, + "learning_rate": 0.0002961177734838127, + "loss": 0.046, "step": 5130 }, { - "epoch": 0.06, - "learning_rate": 0.00029166504508010635, - "loss": 0.0446, + "epoch": 0.03, + "learning_rate": 0.00029611020579079866, + "loss": 0.0519, "step": 5140 }, { - "epoch": 0.06, - "learning_rate": 0.00029164882921450347, - "loss": 0.0412, + "epoch": 0.03, + "learning_rate": 0.00029610263809778465, + "loss": 0.0498, "step": 5150 }, { - "epoch": 0.06, - "learning_rate": 0.00029163261334890053, - "loss": 0.042, + "epoch": 0.03, + "learning_rate": 0.0002960950704047706, + "loss": 0.0432, "step": 5160 }, { - "epoch": 0.06, - "learning_rate": 0.00029161639748329765, - "loss": 0.046, + "epoch": 0.03, + "learning_rate": 0.00029608750271175666, + "loss": 0.0501, "step": 5170 }, { - "epoch": 0.06, - "learning_rate": 0.0002916001816176947, - "loss": 0.0467, + "epoch": 0.03, + "learning_rate": 0.00029607993501874264, + "loss": 0.0449, "step": 5180 }, { - "epoch": 0.06, - "learning_rate": 0.00029158396575209184, - "loss": 0.0554, + "epoch": 0.03, + "learning_rate": 0.0002960723673257286, + "loss": 0.0499, "step": 5190 }, { - "epoch": 0.06, - "learning_rate": 0.0002915677498864889, - "loss": 0.0482, + "epoch": 0.03, + "learning_rate": 0.0002960647996327146, + "loss": 0.0484, "step": 5200 }, { - "epoch": 0.06, - "learning_rate": 0.000291551534020886, - "loss": 0.0492, + "epoch": 0.03, + "learning_rate": 0.0002960572319397006, + "loss": 0.0483, "step": 5210 }, { - "epoch": 0.06, - "learning_rate": 0.0002915353181552831, - "loss": 0.043, + "epoch": 0.03, + "learning_rate": 0.00029604966424668657, + "loss": 0.0518, "step": 5220 }, { - "epoch": 0.06, - "learning_rate": 0.0002915191022896802, - "loss": 0.0457, + "epoch": 0.03, + "learning_rate": 0.0002960420965536726, + "loss": 0.0527, "step": 5230 }, { - "epoch": 0.06, - "learning_rate": 0.0002915028864240773, - "loss": 0.0424, + "epoch": 0.03, + "learning_rate": 0.0002960345288606586, + "loss": 0.0436, "step": 5240 }, { - "epoch": 0.06, - "learning_rate": 0.0002914866705584744, - "loss": 0.0433, + "epoch": 0.03, + "learning_rate": 0.00029602696116764457, + "loss": 0.0591, "step": 5250 }, { - "epoch": 0.06, - "learning_rate": 0.00029147045469287146, - "loss": 0.0459, + "epoch": 0.03, + "learning_rate": 0.00029601939347463055, + "loss": 0.0473, "step": 5260 }, { - "epoch": 0.06, - "learning_rate": 0.0002914542388272686, - "loss": 0.0491, + "epoch": 0.03, + "learning_rate": 0.00029601182578161653, + "loss": 0.0429, "step": 5270 }, { - "epoch": 0.06, - "learning_rate": 0.00029143802296166565, - "loss": 0.0447, + "epoch": 0.03, + "learning_rate": 0.0002960042580886025, + "loss": 0.0483, "step": 5280 }, { - "epoch": 0.06, - "learning_rate": 0.00029142180709606277, - "loss": 0.0389, + "epoch": 0.03, + "learning_rate": 0.0002959966903955885, + "loss": 0.0446, "step": 5290 }, { - "epoch": 0.06, - "learning_rate": 0.00029140559123045983, - "loss": 0.0483, + "epoch": 0.03, + "learning_rate": 0.00029598912270257453, + "loss": 0.0484, "step": 5300 }, { - "epoch": 0.06, - "learning_rate": 0.00029138937536485695, - "loss": 0.0449, + "epoch": 0.03, + "learning_rate": 0.0002959815550095605, + "loss": 0.0453, "step": 5310 }, { - "epoch": 0.06, - "learning_rate": 0.00029137315949925407, - "loss": 0.0527, + "epoch": 0.03, + "learning_rate": 0.0002959739873165465, + "loss": 0.0419, "step": 5320 }, { - "epoch": 0.06, - "learning_rate": 0.00029135694363365114, - "loss": 0.0421, + "epoch": 0.03, + "learning_rate": 0.0002959664196235325, + "loss": 0.0449, "step": 5330 }, { - "epoch": 0.06, - "learning_rate": 0.0002913407277680482, - "loss": 0.0414, + "epoch": 0.03, + "learning_rate": 0.00029595885193051846, + "loss": 0.0401, "step": 5340 }, { - "epoch": 0.06, - "learning_rate": 0.0002913245119024453, - "loss": 0.0417, + "epoch": 0.03, + "learning_rate": 0.00029595128423750444, + "loss": 0.0498, "step": 5350 }, { - "epoch": 0.06, - "learning_rate": 0.00029130829603684244, - "loss": 0.0466, + "epoch": 0.03, + "learning_rate": 0.00029594371654449047, + "loss": 0.0448, "step": 5360 }, { - "epoch": 0.06, - "learning_rate": 0.0002912920801712395, - "loss": 0.0411, + "epoch": 0.03, + "learning_rate": 0.00029593614885147645, + "loss": 0.0476, "step": 5370 }, { - "epoch": 0.06, - "learning_rate": 0.0002912758643056366, - "loss": 0.0472, + "epoch": 0.03, + "learning_rate": 0.00029592858115846244, + "loss": 0.0491, "step": 5380 }, { - "epoch": 0.06, - "learning_rate": 0.0002912596484400337, - "loss": 0.0413, + "epoch": 0.03, + "learning_rate": 0.0002959210134654484, + "loss": 0.0471, "step": 5390 }, { - "epoch": 0.06, - "learning_rate": 0.0002912434325744308, - "loss": 0.0415, + "epoch": 0.03, + "learning_rate": 0.0002959134457724344, + "loss": 0.0448, "step": 5400 }, { - "epoch": 0.06, - "learning_rate": 0.0002912272167088279, - "loss": 0.0382, + "epoch": 0.03, + "learning_rate": 0.0002959058780794204, + "loss": 0.0648, "step": 5410 }, { - "epoch": 0.06, - "learning_rate": 0.000291211000843225, - "loss": 0.0447, + "epoch": 0.03, + "learning_rate": 0.0002958983103864064, + "loss": 0.0482, "step": 5420 }, { - "epoch": 0.06, - "learning_rate": 0.00029119478497762207, - "loss": 0.0448, + "epoch": 0.03, + "learning_rate": 0.0002958907426933924, + "loss": 0.0484, "step": 5430 }, { - "epoch": 0.06, - "learning_rate": 0.0002911785691120192, - "loss": 0.0493, + "epoch": 0.03, + "learning_rate": 0.0002958831750003784, + "loss": 0.0545, "step": 5440 }, { - "epoch": 0.06, - "learning_rate": 0.0002911623532464163, - "loss": 0.0477, + "epoch": 0.03, + "learning_rate": 0.00029587560730736436, + "loss": 0.0501, "step": 5450 }, { - "epoch": 0.06, - "learning_rate": 0.00029114613738081337, - "loss": 0.0433, + "epoch": 0.03, + "learning_rate": 0.00029586803961435034, + "loss": 0.0431, "step": 5460 }, { - "epoch": 0.06, - "learning_rate": 0.00029112992151521044, - "loss": 0.0509, + "epoch": 0.03, + "learning_rate": 0.0002958604719213363, + "loss": 0.0424, "step": 5470 }, { - "epoch": 0.06, - "learning_rate": 0.00029111370564960756, - "loss": 0.0432, + "epoch": 0.03, + "learning_rate": 0.0002958529042283223, + "loss": 0.0434, "step": 5480 }, { - "epoch": 0.06, - "learning_rate": 0.0002910974897840047, - "loss": 0.0506, + "epoch": 0.03, + "learning_rate": 0.00029584533653530834, + "loss": 0.0432, "step": 5490 }, { - "epoch": 0.06, - "learning_rate": 0.00029108127391840174, - "loss": 0.0524, + "epoch": 0.03, + "learning_rate": 0.0002958377688422943, + "loss": 0.0436, "step": 5500 }, { - "epoch": 0.06, - "learning_rate": 0.0002910650580527988, - "loss": 0.0488, + "epoch": 0.03, + "learning_rate": 0.0002958302011492803, + "loss": 0.0486, "step": 5510 }, { - "epoch": 0.06, - "learning_rate": 0.0002910488421871959, - "loss": 0.0429, + "epoch": 0.03, + "learning_rate": 0.0002958226334562663, + "loss": 0.0478, "step": 5520 }, { - "epoch": 0.06, - "learning_rate": 0.00029103262632159305, - "loss": 0.0477, + "epoch": 0.03, + "learning_rate": 0.00029581506576325227, + "loss": 0.0438, "step": 5530 }, { - "epoch": 0.06, - "learning_rate": 0.0002910164104559901, - "loss": 0.0474, + "epoch": 0.03, + "learning_rate": 0.00029580749807023825, + "loss": 0.0386, "step": 5540 }, { - "epoch": 0.06, - "learning_rate": 0.0002910001945903872, - "loss": 0.0439, + "epoch": 0.03, + "learning_rate": 0.0002957999303772243, + "loss": 0.0411, "step": 5550 }, { - "epoch": 0.06, - "learning_rate": 0.0002909839787247843, - "loss": 0.049, + "epoch": 0.03, + "learning_rate": 0.00029579236268421026, + "loss": 0.0462, "step": 5560 }, { - "epoch": 0.06, - "learning_rate": 0.0002909677628591814, - "loss": 0.0469, + "epoch": 0.03, + "learning_rate": 0.00029578479499119625, + "loss": 0.0436, "step": 5570 }, { - "epoch": 0.06, - "learning_rate": 0.0002909515469935785, - "loss": 0.044, + "epoch": 0.03, + "learning_rate": 0.0002957772272981822, + "loss": 0.0457, "step": 5580 }, { - "epoch": 0.06, - "learning_rate": 0.0002909353311279756, - "loss": 0.0446, + "epoch": 0.03, + "learning_rate": 0.0002957696596051682, + "loss": 0.0425, "step": 5590 }, { - "epoch": 0.06, - "learning_rate": 0.00029091911526237267, - "loss": 0.0424, + "epoch": 0.03, + "learning_rate": 0.0002957620919121542, + "loss": 0.0486, "step": 5600 }, { - "epoch": 0.06, - "learning_rate": 0.0002909028993967698, - "loss": 0.0494, + "epoch": 0.03, + "learning_rate": 0.0002957545242191402, + "loss": 0.0496, "step": 5610 }, { - "epoch": 0.06, - "learning_rate": 0.00029088668353116685, - "loss": 0.0461, + "epoch": 0.03, + "learning_rate": 0.0002957469565261262, + "loss": 0.0534, "step": 5620 }, { - "epoch": 0.06, - "learning_rate": 0.000290870467665564, - "loss": 0.0435, + "epoch": 0.03, + "learning_rate": 0.0002957393888331122, + "loss": 0.0385, "step": 5630 }, { - "epoch": 0.06, - "learning_rate": 0.00029085425179996104, - "loss": 0.0497, + "epoch": 0.03, + "learning_rate": 0.00029573182114009817, + "loss": 0.0467, "step": 5640 }, { - "epoch": 0.06, - "learning_rate": 0.00029083803593435816, - "loss": 0.0534, + "epoch": 0.03, + "learning_rate": 0.00029572425344708415, + "loss": 0.0478, "step": 5650 }, { - "epoch": 0.06, - "learning_rate": 0.0002908218200687552, - "loss": 0.0461, + "epoch": 0.03, + "learning_rate": 0.00029571668575407013, + "loss": 0.0406, "step": 5660 }, { - "epoch": 0.06, - "learning_rate": 0.00029080560420315235, - "loss": 0.05, + "epoch": 0.03, + "learning_rate": 0.0002957091180610561, + "loss": 0.0493, "step": 5670 }, { - "epoch": 0.06, - "learning_rate": 0.0002907893883375494, - "loss": 0.0438, + "epoch": 0.03, + "learning_rate": 0.0002957015503680421, + "loss": 0.0448, "step": 5680 }, { - "epoch": 0.06, - "learning_rate": 0.00029077317247194653, - "loss": 0.041, + "epoch": 0.03, + "learning_rate": 0.0002956939826750281, + "loss": 0.0465, "step": 5690 }, { - "epoch": 0.06, - "learning_rate": 0.0002907569566063436, - "loss": 0.0456, + "epoch": 0.03, + "learning_rate": 0.00029568641498201406, + "loss": 0.0485, "step": 5700 }, { - "epoch": 0.06, - "learning_rate": 0.0002907407407407407, - "loss": 0.0466, + "epoch": 0.03, + "learning_rate": 0.00029567884728900004, + "loss": 0.044, "step": 5710 }, { - "epoch": 0.06, - "learning_rate": 0.00029072452487513784, - "loss": 0.0462, + "epoch": 0.03, + "learning_rate": 0.0002956712795959861, + "loss": 0.0454, "step": 5720 }, { - "epoch": 0.06, - "learning_rate": 0.0002907083090095349, - "loss": 0.0439, + "epoch": 0.03, + "learning_rate": 0.00029566371190297206, + "loss": 0.0488, "step": 5730 }, { - "epoch": 0.06, - "learning_rate": 0.00029069209314393197, - "loss": 0.0481, + "epoch": 0.03, + "learning_rate": 0.00029565614420995804, + "loss": 0.042, "step": 5740 }, { - "epoch": 0.06, - "learning_rate": 0.0002906758772783291, - "loss": 0.0511, + "epoch": 0.03, + "learning_rate": 0.000295648576516944, + "loss": 0.046, "step": 5750 }, { - "epoch": 0.06, - "learning_rate": 0.0002906596614127262, - "loss": 0.0538, + "epoch": 0.03, + "learning_rate": 0.00029564100882393, + "loss": 0.0447, "step": 5760 }, { - "epoch": 0.06, - "learning_rate": 0.00029064344554712327, - "loss": 0.0438, + "epoch": 0.03, + "learning_rate": 0.000295633441130916, + "loss": 0.043, "step": 5770 }, { - "epoch": 0.06, - "learning_rate": 0.0002906272296815204, - "loss": 0.0465, + "epoch": 0.03, + "learning_rate": 0.000295625873437902, + "loss": 0.0484, "step": 5780 }, { - "epoch": 0.06, - "learning_rate": 0.00029061101381591746, - "loss": 0.0422, + "epoch": 0.03, + "learning_rate": 0.000295618305744888, + "loss": 0.0468, "step": 5790 }, { - "epoch": 0.06, - "learning_rate": 0.0002905947979503146, - "loss": 0.046, + "epoch": 0.03, + "learning_rate": 0.000295610738051874, + "loss": 0.0498, "step": 5800 }, { - "epoch": 0.06, - "learning_rate": 0.00029057858208471164, - "loss": 0.0476, + "epoch": 0.03, + "learning_rate": 0.00029560317035885996, + "loss": 0.0474, "step": 5810 }, { - "epoch": 0.06, - "learning_rate": 0.00029056236621910876, - "loss": 0.0465, + "epoch": 0.03, + "learning_rate": 0.00029559560266584594, + "loss": 0.045, "step": 5820 }, { - "epoch": 0.06, - "learning_rate": 0.00029054615035350583, - "loss": 0.0452, + "epoch": 0.03, + "learning_rate": 0.0002955880349728319, + "loss": 0.0471, "step": 5830 }, { - "epoch": 0.06, - "learning_rate": 0.00029052993448790295, - "loss": 0.0539, + "epoch": 0.03, + "learning_rate": 0.00029558046727981796, + "loss": 0.0414, "step": 5840 }, { - "epoch": 0.06, - "learning_rate": 0.0002905137186223, - "loss": 0.0472, + "epoch": 0.03, + "learning_rate": 0.00029557289958680394, + "loss": 0.0423, "step": 5850 }, { - "epoch": 0.06, - "learning_rate": 0.00029049750275669713, - "loss": 0.0496, + "epoch": 0.03, + "learning_rate": 0.0002955653318937899, + "loss": 0.0437, "step": 5860 }, { - "epoch": 0.06, - "learning_rate": 0.0002904812868910942, - "loss": 0.0466, + "epoch": 0.03, + "learning_rate": 0.0002955577642007759, + "loss": 0.0409, "step": 5870 }, { - "epoch": 0.06, - "learning_rate": 0.0002904650710254913, - "loss": 0.0423, + "epoch": 0.03, + "learning_rate": 0.0002955501965077619, + "loss": 0.0462, "step": 5880 }, { - "epoch": 0.06, - "learning_rate": 0.00029044885515988844, - "loss": 0.0423, + "epoch": 0.03, + "learning_rate": 0.00029554262881474787, + "loss": 0.0426, "step": 5890 }, { - "epoch": 0.06, - "learning_rate": 0.0002904326392942855, - "loss": 0.0551, + "epoch": 0.03, + "learning_rate": 0.00029553506112173385, + "loss": 0.0413, "step": 5900 }, { - "epoch": 0.06, - "learning_rate": 0.00029041642342868257, - "loss": 0.0518, + "epoch": 0.03, + "learning_rate": 0.0002955274934287199, + "loss": 0.0397, "step": 5910 }, { - "epoch": 0.06, - "learning_rate": 0.0002904002075630797, - "loss": 0.0499, + "epoch": 0.03, + "learning_rate": 0.00029551992573570587, + "loss": 0.0427, "step": 5920 }, { - "epoch": 0.06, - "learning_rate": 0.0002903839916974768, - "loss": 0.0686, + "epoch": 0.03, + "learning_rate": 0.00029551235804269185, + "loss": 0.0414, "step": 5930 }, { - "epoch": 0.06, - "learning_rate": 0.0002903677758318739, - "loss": 0.0467, + "epoch": 0.03, + "learning_rate": 0.00029550479034967783, + "loss": 0.0402, "step": 5940 }, { - "epoch": 0.06, - "learning_rate": 0.00029035155996627094, - "loss": 0.044, + "epoch": 0.03, + "learning_rate": 0.0002954972226566638, + "loss": 0.0468, "step": 5950 }, { - "epoch": 0.06, - "learning_rate": 0.00029033534410066806, - "loss": 0.0512, + "epoch": 0.03, + "learning_rate": 0.0002954896549636498, + "loss": 0.0353, "step": 5960 }, { - "epoch": 0.06, - "learning_rate": 0.0002903191282350652, - "loss": 0.0445, + "epoch": 0.03, + "learning_rate": 0.00029548208727063583, + "loss": 0.0466, "step": 5970 }, { - "epoch": 0.06, - "learning_rate": 0.00029030291236946225, - "loss": 0.0489, + "epoch": 0.03, + "learning_rate": 0.0002954745195776218, + "loss": 0.0469, "step": 5980 }, { - "epoch": 0.06, - "learning_rate": 0.0002902866965038593, - "loss": 0.0366, + "epoch": 0.03, + "learning_rate": 0.0002954669518846078, + "loss": 0.0437, "step": 5990 }, { - "epoch": 0.06, - "learning_rate": 0.00029027048063825643, - "loss": 0.0433, + "epoch": 0.03, + "learning_rate": 0.00029545938419159377, + "loss": 0.0402, "step": 6000 }, { - "epoch": 0.06, - "eval_cer": 0.9216250866431449, - "eval_loss": 0.033627625554800034, - "eval_runtime": 121.2057, - "eval_samples_per_second": 16.501, - "eval_steps_per_second": 4.125, + "epoch": 0.03, + "eval_cer": 0.9144964565985481, + "eval_loss": 0.03346065431833267, + "eval_runtime": 117.4862, + "eval_samples_per_second": 17.023, + "eval_steps_per_second": 4.256, "step": 6000 }, { - "epoch": 0.06, - "learning_rate": 0.00029025426477265355, - "loss": 0.0386, + "epoch": 0.03, + "learning_rate": 0.00029545181649857975, + "loss": 0.0513, "step": 6010 }, { - "epoch": 0.07, - "learning_rate": 0.00029023804890705067, - "loss": 0.0464, + "epoch": 0.03, + "learning_rate": 0.00029544424880556574, + "loss": 0.0432, "step": 6020 }, { - "epoch": 0.07, - "learning_rate": 0.00029022183304144774, - "loss": 0.0433, + "epoch": 0.03, + "learning_rate": 0.0002954366811125517, + "loss": 0.0466, "step": 6030 }, { - "epoch": 0.07, - "learning_rate": 0.0002902056171758448, - "loss": 0.0471, + "epoch": 0.03, + "learning_rate": 0.00029542911341953775, + "loss": 0.0424, "step": 6040 }, { - "epoch": 0.07, - "learning_rate": 0.0002901894013102419, - "loss": 0.0426, + "epoch": 0.03, + "learning_rate": 0.00029542154572652373, + "loss": 0.0389, "step": 6050 }, { - "epoch": 0.07, - "learning_rate": 0.00029017318544463904, - "loss": 0.0427, + "epoch": 0.03, + "learning_rate": 0.0002954139780335097, + "loss": 0.0377, "step": 6060 }, { - "epoch": 0.07, - "learning_rate": 0.0002901569695790361, - "loss": 0.0403, + "epoch": 0.03, + "learning_rate": 0.0002954064103404957, + "loss": 0.0425, "step": 6070 }, { - "epoch": 0.07, - "learning_rate": 0.0002901407537134332, - "loss": 0.0447, + "epoch": 0.03, + "learning_rate": 0.0002953988426474817, + "loss": 0.0406, "step": 6080 }, { - "epoch": 0.07, - "learning_rate": 0.0002901245378478303, - "loss": 0.044, + "epoch": 0.03, + "learning_rate": 0.00029539127495446766, + "loss": 0.0465, "step": 6090 }, { - "epoch": 0.07, - "learning_rate": 0.0002901083219822274, - "loss": 0.0468, + "epoch": 0.03, + "learning_rate": 0.0002953837072614537, + "loss": 0.0463, "step": 6100 }, { - "epoch": 0.07, - "learning_rate": 0.0002900921061166245, - "loss": 0.0402, + "epoch": 0.03, + "learning_rate": 0.0002953761395684397, + "loss": 0.0954, "step": 6110 }, { - "epoch": 0.07, - "learning_rate": 0.00029007589025102155, - "loss": 0.0405, + "epoch": 0.03, + "learning_rate": 0.00029536857187542566, + "loss": 0.068, "step": 6120 }, { - "epoch": 0.07, - "learning_rate": 0.00029005967438541867, - "loss": 0.0496, + "epoch": 0.03, + "learning_rate": 0.00029536100418241164, + "loss": 0.0656, "step": 6130 }, { - "epoch": 0.07, - "learning_rate": 0.0002900434585198158, - "loss": 0.0491, + "epoch": 0.03, + "learning_rate": 0.0002953534364893976, + "loss": 0.066, "step": 6140 }, { - "epoch": 0.07, - "learning_rate": 0.00029002724265421285, - "loss": 0.0556, + "epoch": 0.03, + "learning_rate": 0.0002953458687963836, + "loss": 0.0541, "step": 6150 }, { - "epoch": 0.07, - "learning_rate": 0.00029001102678860997, - "loss": 0.0431, + "epoch": 0.03, + "learning_rate": 0.00029533830110336964, + "loss": 0.0574, "step": 6160 }, { - "epoch": 0.07, - "learning_rate": 0.00028999481092300704, - "loss": 0.0403, + "epoch": 0.03, + "learning_rate": 0.0002953307334103556, + "loss": 0.0532, "step": 6170 }, { - "epoch": 0.07, - "learning_rate": 0.00028997859505740416, - "loss": 0.0448, + "epoch": 0.03, + "learning_rate": 0.0002953231657173416, + "loss": 0.0622, "step": 6180 }, { - "epoch": 0.07, - "learning_rate": 0.0002899623791918012, - "loss": 0.0421, + "epoch": 0.03, + "learning_rate": 0.0002953155980243276, + "loss": 0.0538, "step": 6190 }, { - "epoch": 0.07, - "learning_rate": 0.00028994616332619834, - "loss": 0.0453, + "epoch": 0.03, + "learning_rate": 0.00029530803033131356, + "loss": 0.0555, "step": 6200 }, { - "epoch": 0.07, - "learning_rate": 0.0002899299474605954, - "loss": 0.0418, + "epoch": 0.03, + "learning_rate": 0.00029530046263829955, + "loss": 0.0598, "step": 6210 }, { - "epoch": 0.07, - "learning_rate": 0.00028991373159499253, - "loss": 0.0475, + "epoch": 0.03, + "learning_rate": 0.0002952928949452855, + "loss": 0.046, "step": 6220 }, { - "epoch": 0.07, - "learning_rate": 0.0002898975157293896, - "loss": 0.0407, + "epoch": 0.03, + "learning_rate": 0.00029528532725227156, + "loss": 0.0497, "step": 6230 }, { - "epoch": 0.07, - "learning_rate": 0.0002898812998637867, - "loss": 0.046, + "epoch": 0.03, + "learning_rate": 0.00029527775955925754, + "loss": 0.0507, "step": 6240 }, { - "epoch": 0.07, - "learning_rate": 0.0002898650839981838, - "loss": 0.0442, + "epoch": 0.03, + "learning_rate": 0.0002952701918662435, + "loss": 0.0494, "step": 6250 }, { - "epoch": 0.07, - "learning_rate": 0.0002898488681325809, - "loss": 0.0435, + "epoch": 0.03, + "learning_rate": 0.0002952626241732295, + "loss": 0.0491, "step": 6260 }, { - "epoch": 0.07, - "learning_rate": 0.00028983265226697796, - "loss": 0.0422, + "epoch": 0.03, + "learning_rate": 0.0002952550564802155, + "loss": 0.0548, "step": 6270 }, { - "epoch": 0.07, - "learning_rate": 0.0002898164364013751, - "loss": 0.0409, + "epoch": 0.03, + "learning_rate": 0.00029524748878720147, + "loss": 0.0527, "step": 6280 }, { - "epoch": 0.07, - "learning_rate": 0.00028980022053577215, - "loss": 0.041, + "epoch": 0.03, + "learning_rate": 0.0002952399210941875, + "loss": 0.0517, "step": 6290 }, { - "epoch": 0.07, - "learning_rate": 0.00028978400467016927, - "loss": 0.0356, + "epoch": 0.03, + "learning_rate": 0.0002952323534011735, + "loss": 0.0451, "step": 6300 }, { - "epoch": 0.07, - "learning_rate": 0.00028976778880456634, - "loss": 0.0383, + "epoch": 0.03, + "learning_rate": 0.00029522478570815947, + "loss": 0.0527, "step": 6310 }, { - "epoch": 0.07, - "learning_rate": 0.00028975157293896345, - "loss": 0.0382, + "epoch": 0.03, + "learning_rate": 0.00029521721801514545, + "loss": 0.0539, "step": 6320 }, { - "epoch": 0.07, - "learning_rate": 0.0002897353570733606, - "loss": 0.0409, + "epoch": 0.03, + "learning_rate": 0.00029520965032213143, + "loss": 0.0477, "step": 6330 }, { - "epoch": 0.07, - "learning_rate": 0.00028971914120775764, - "loss": 0.0401, + "epoch": 0.03, + "learning_rate": 0.0002952020826291174, + "loss": 0.0627, "step": 6340 }, { - "epoch": 0.07, - "learning_rate": 0.0002897029253421547, - "loss": 0.0427, + "epoch": 0.03, + "learning_rate": 0.00029519451493610345, + "loss": 0.0474, "step": 6350 }, { - "epoch": 0.07, - "learning_rate": 0.0002896867094765518, - "loss": 0.0416, + "epoch": 0.03, + "learning_rate": 0.00029518694724308943, + "loss": 0.0467, "step": 6360 }, { - "epoch": 0.07, - "learning_rate": 0.00028967049361094895, - "loss": 0.0402, + "epoch": 0.03, + "learning_rate": 0.0002951793795500754, + "loss": 0.0516, "step": 6370 }, { - "epoch": 0.07, - "learning_rate": 0.000289654277745346, - "loss": 0.0507, + "epoch": 0.03, + "learning_rate": 0.0002951718118570614, + "loss": 0.0443, "step": 6380 }, { - "epoch": 0.07, - "learning_rate": 0.0002896380618797431, - "loss": 0.0411, + "epoch": 0.03, + "learning_rate": 0.0002951642441640474, + "loss": 0.048, "step": 6390 }, { - "epoch": 0.07, - "learning_rate": 0.0002896218460141402, - "loss": 0.0436, + "epoch": 0.03, + "learning_rate": 0.00029515667647103336, + "loss": 0.0481, "step": 6400 }, { - "epoch": 0.07, - "learning_rate": 0.0002896056301485373, - "loss": 0.043, + "epoch": 0.03, + "learning_rate": 0.00029514910877801934, + "loss": 0.0468, "step": 6410 }, { - "epoch": 0.07, - "learning_rate": 0.0002895894142829344, - "loss": 0.0404, + "epoch": 0.03, + "learning_rate": 0.00029514154108500537, + "loss": 0.0453, "step": 6420 }, { - "epoch": 0.07, - "learning_rate": 0.0002895731984173315, - "loss": 0.0423, + "epoch": 0.03, + "learning_rate": 0.00029513397339199135, + "loss": 0.0819, "step": 6430 }, { - "epoch": 0.07, - "learning_rate": 0.00028955698255172857, - "loss": 0.0436, + "epoch": 0.03, + "learning_rate": 0.00029512640569897734, + "loss": 0.0532, "step": 6440 }, { - "epoch": 0.07, - "learning_rate": 0.0002895407666861257, - "loss": 0.0377, + "epoch": 0.03, + "learning_rate": 0.0002951188380059633, + "loss": 0.0467, "step": 6450 }, { - "epoch": 0.07, - "learning_rate": 0.0002895245508205228, - "loss": 0.0412, + "epoch": 0.03, + "learning_rate": 0.0002951112703129493, + "loss": 0.048, "step": 6460 }, { - "epoch": 0.07, - "learning_rate": 0.0002895083349549199, - "loss": 0.0372, + "epoch": 0.03, + "learning_rate": 0.0002951037026199353, + "loss": 0.0522, "step": 6470 }, { - "epoch": 0.07, - "learning_rate": 0.00028949211908931694, - "loss": 0.0448, + "epoch": 0.03, + "learning_rate": 0.0002950961349269213, + "loss": 0.0526, "step": 6480 }, { - "epoch": 0.07, - "learning_rate": 0.00028947590322371406, - "loss": 0.0421, + "epoch": 0.03, + "learning_rate": 0.0002950885672339073, + "loss": 0.0431, "step": 6490 }, { - "epoch": 0.07, - "learning_rate": 0.0002894596873581112, - "loss": 0.0396, + "epoch": 0.03, + "learning_rate": 0.0002950809995408933, + "loss": 0.0413, "step": 6500 }, { - "epoch": 0.07, - "learning_rate": 0.00028944347149250824, - "loss": 0.0402, + "epoch": 0.03, + "learning_rate": 0.00029507343184787926, + "loss": 0.0447, "step": 6510 }, { - "epoch": 0.07, - "learning_rate": 0.0002894272556269053, - "loss": 0.0447, + "epoch": 0.03, + "learning_rate": 0.00029506586415486524, + "loss": 0.0429, "step": 6520 }, { - "epoch": 0.07, - "learning_rate": 0.00028941103976130243, - "loss": 0.0376, + "epoch": 0.03, + "learning_rate": 0.0002950582964618512, + "loss": 0.0491, "step": 6530 }, { - "epoch": 0.07, - "learning_rate": 0.00028939482389569955, - "loss": 0.046, + "epoch": 0.03, + "learning_rate": 0.0002950507287688372, + "loss": 0.0441, "step": 6540 }, { - "epoch": 0.07, - "learning_rate": 0.0002893786080300966, - "loss": 0.04, + "epoch": 0.03, + "learning_rate": 0.00029504316107582324, + "loss": 0.047, "step": 6550 }, { - "epoch": 0.07, - "learning_rate": 0.0002893623921644937, - "loss": 0.0441, + "epoch": 0.03, + "learning_rate": 0.0002950355933828092, + "loss": 0.0478, "step": 6560 }, { - "epoch": 0.07, - "learning_rate": 0.0002893461762988908, - "loss": 0.0379, + "epoch": 0.03, + "learning_rate": 0.0002950280256897952, + "loss": 0.0459, "step": 6570 }, { - "epoch": 0.07, - "learning_rate": 0.0002893299604332879, - "loss": 0.0483, + "epoch": 0.03, + "learning_rate": 0.0002950204579967812, + "loss": 0.0422, "step": 6580 }, { - "epoch": 0.07, - "learning_rate": 0.000289313744567685, - "loss": 0.0427, + "epoch": 0.03, + "learning_rate": 0.00029501289030376717, + "loss": 0.044, "step": 6590 }, { - "epoch": 0.07, - "learning_rate": 0.0002892975287020821, - "loss": 0.0446, + "epoch": 0.03, + "learning_rate": 0.00029500532261075315, + "loss": 0.0382, "step": 6600 }, { - "epoch": 0.07, - "learning_rate": 0.00028928131283647917, - "loss": 0.0445, + "epoch": 0.03, + "learning_rate": 0.0002949977549177392, + "loss": 0.0437, "step": 6610 }, { - "epoch": 0.07, - "learning_rate": 0.0002892650969708763, - "loss": 0.0454, + "epoch": 0.03, + "learning_rate": 0.00029499018722472516, + "loss": 0.0372, "step": 6620 }, { - "epoch": 0.07, - "learning_rate": 0.0002892488811052734, - "loss": 0.0423, + "epoch": 0.03, + "learning_rate": 0.00029498261953171115, + "loss": 0.0367, "step": 6630 }, { - "epoch": 0.07, - "learning_rate": 0.0002892326652396705, - "loss": 0.0465, + "epoch": 0.03, + "learning_rate": 0.0002949750518386971, + "loss": 0.0394, "step": 6640 }, { - "epoch": 0.07, - "learning_rate": 0.00028921644937406754, - "loss": 0.0435, + "epoch": 0.03, + "learning_rate": 0.0002949674841456831, + "loss": 0.0373, "step": 6650 }, { - "epoch": 0.07, - "learning_rate": 0.00028920023350846466, - "loss": 0.0428, + "epoch": 0.03, + "learning_rate": 0.0002949599164526691, + "loss": 0.0447, "step": 6660 }, { - "epoch": 0.07, - "learning_rate": 0.0002891840176428618, - "loss": 0.041, + "epoch": 0.03, + "learning_rate": 0.0002949523487596551, + "loss": 0.0398, "step": 6670 }, { - "epoch": 0.07, - "learning_rate": 0.00028916780177725885, - "loss": 0.0383, + "epoch": 0.03, + "learning_rate": 0.0002949447810666411, + "loss": 0.0366, "step": 6680 }, { - "epoch": 0.07, - "learning_rate": 0.0002891515859116559, - "loss": 0.0424, + "epoch": 0.03, + "learning_rate": 0.0002949372133736271, + "loss": 0.0432, "step": 6690 }, { - "epoch": 0.07, - "learning_rate": 0.00028913537004605303, - "loss": 0.0369, + "epoch": 0.03, + "learning_rate": 0.00029492964568061307, + "loss": 0.0436, "step": 6700 }, { - "epoch": 0.07, - "learning_rate": 0.00028911915418045015, - "loss": 0.0459, + "epoch": 0.03, + "learning_rate": 0.00029492207798759905, + "loss": 0.0411, "step": 6710 }, { - "epoch": 0.07, - "learning_rate": 0.0002891029383148472, - "loss": 0.0438, + "epoch": 0.03, + "learning_rate": 0.00029491451029458503, + "loss": 0.0417, "step": 6720 }, { - "epoch": 0.07, - "learning_rate": 0.00028908672244924434, - "loss": 0.0379, + "epoch": 0.03, + "learning_rate": 0.000294906942601571, + "loss": 0.0432, "step": 6730 }, { - "epoch": 0.07, - "learning_rate": 0.0002890705065836414, - "loss": 0.0418, + "epoch": 0.03, + "learning_rate": 0.00029489937490855705, + "loss": 0.0392, "step": 6740 }, { - "epoch": 0.07, - "learning_rate": 0.0002890542907180385, - "loss": 0.0438, + "epoch": 0.03, + "learning_rate": 0.00029489180721554303, + "loss": 0.0403, "step": 6750 }, { - "epoch": 0.07, - "learning_rate": 0.0002890380748524356, - "loss": 0.0431, + "epoch": 0.03, + "learning_rate": 0.000294884239522529, + "loss": 0.0409, "step": 6760 }, { - "epoch": 0.07, - "learning_rate": 0.0002890218589868327, - "loss": 0.0471, + "epoch": 0.03, + "learning_rate": 0.000294876671829515, + "loss": 0.0413, "step": 6770 }, { - "epoch": 0.07, - "learning_rate": 0.0002890056431212298, - "loss": 0.0387, + "epoch": 0.03, + "learning_rate": 0.000294869104136501, + "loss": 0.0445, "step": 6780 }, { - "epoch": 0.07, - "learning_rate": 0.0002889894272556269, - "loss": 0.0363, + "epoch": 0.03, + "learning_rate": 0.00029486153644348696, + "loss": 0.0415, "step": 6790 }, { - "epoch": 0.07, - "learning_rate": 0.00028897321139002396, - "loss": 0.0371, + "epoch": 0.03, + "learning_rate": 0.000294853968750473, + "loss": 0.0381, "step": 6800 }, { - "epoch": 0.07, - "learning_rate": 0.0002889569955244211, - "loss": 0.0421, + "epoch": 0.03, + "learning_rate": 0.000294846401057459, + "loss": 0.042, "step": 6810 }, { - "epoch": 0.07, - "learning_rate": 0.00028894077965881815, - "loss": 0.0421, + "epoch": 0.03, + "learning_rate": 0.00029483883336444496, + "loss": 0.0454, "step": 6820 }, { - "epoch": 0.07, - "learning_rate": 0.00028892456379321527, - "loss": 0.0368, + "epoch": 0.03, + "learning_rate": 0.00029483126567143094, + "loss": 0.0434, "step": 6830 }, { - "epoch": 0.07, - "learning_rate": 0.00028890834792761233, - "loss": 0.0374, + "epoch": 0.03, + "learning_rate": 0.0002948236979784169, + "loss": 0.0438, "step": 6840 }, { - "epoch": 0.07, - "learning_rate": 0.00028889213206200945, - "loss": 0.0407, + "epoch": 0.03, + "learning_rate": 0.0002948161302854029, + "loss": 0.0494, "step": 6850 }, { - "epoch": 0.07, - "learning_rate": 0.0002888759161964065, - "loss": 0.0466, + "epoch": 0.03, + "learning_rate": 0.00029480856259238894, + "loss": 0.0552, "step": 6860 }, { - "epoch": 0.07, - "learning_rate": 0.00028885970033080364, - "loss": 0.0418, + "epoch": 0.03, + "learning_rate": 0.0002948009948993749, + "loss": 0.0457, "step": 6870 }, { - "epoch": 0.07, - "learning_rate": 0.0002888434844652007, - "loss": 0.0449, + "epoch": 0.03, + "learning_rate": 0.0002947934272063609, + "loss": 0.0391, "step": 6880 }, { - "epoch": 0.07, - "learning_rate": 0.0002888272685995978, - "loss": 0.0395, + "epoch": 0.03, + "learning_rate": 0.0002947858595133469, + "loss": 0.0444, "step": 6890 }, { - "epoch": 0.07, - "learning_rate": 0.00028881105273399494, - "loss": 0.0423, + "epoch": 0.03, + "learning_rate": 0.00029477829182033286, + "loss": 0.0453, "step": 6900 }, { - "epoch": 0.07, - "learning_rate": 0.000288794836868392, - "loss": 0.0399, + "epoch": 0.03, + "learning_rate": 0.00029477072412731884, + "loss": 0.045, "step": 6910 }, { - "epoch": 0.07, - "learning_rate": 0.0002887786210027891, - "loss": 0.0372, + "epoch": 0.03, + "learning_rate": 0.0002947631564343048, + "loss": 0.0388, "step": 6920 }, { - "epoch": 0.07, - "learning_rate": 0.0002887624051371862, - "loss": 0.0448, + "epoch": 0.03, + "learning_rate": 0.0002947555887412908, + "loss": 0.0405, "step": 6930 }, { - "epoch": 0.08, - "learning_rate": 0.0002887461892715833, - "loss": 0.0411, + "epoch": 0.04, + "learning_rate": 0.0002947480210482768, + "loss": 0.0415, "step": 6940 }, { - "epoch": 0.08, - "learning_rate": 0.0002887299734059804, - "loss": 0.0476, + "epoch": 0.04, + "learning_rate": 0.00029474045335526277, + "loss": 0.0424, "step": 6950 }, { - "epoch": 0.08, - "learning_rate": 0.00028871375754037744, - "loss": 0.0365, + "epoch": 0.04, + "learning_rate": 0.00029473288566224875, + "loss": 0.0373, "step": 6960 }, { - "epoch": 0.08, - "learning_rate": 0.00028869754167477456, - "loss": 0.0408, + "epoch": 0.04, + "learning_rate": 0.0002947253179692348, + "loss": 0.0375, "step": 6970 }, { - "epoch": 0.08, - "learning_rate": 0.0002886813258091717, - "loss": 0.0426, + "epoch": 0.04, + "learning_rate": 0.00029471775027622077, + "loss": 0.0396, "step": 6980 }, { - "epoch": 0.08, - "learning_rate": 0.00028866510994356875, - "loss": 0.0357, + "epoch": 0.04, + "learning_rate": 0.00029471018258320675, + "loss": 0.0405, "step": 6990 }, { - "epoch": 0.08, - "learning_rate": 0.0002886488940779658, - "loss": 0.045, + "epoch": 0.04, + "learning_rate": 0.00029470261489019273, + "loss": 0.0927, "step": 7000 }, { - "epoch": 0.08, - "eval_cer": 0.9216294296579268, - "eval_loss": 0.03147590905427933, - "eval_runtime": 120.5116, - "eval_samples_per_second": 16.596, - "eval_steps_per_second": 4.149, + "epoch": 0.04, + "eval_cer": 0.9144498775845288, + "eval_loss": 0.03059179149568081, + "eval_runtime": 117.5676, + "eval_samples_per_second": 17.011, + "eval_steps_per_second": 4.253, "step": 7000 }, { - "epoch": 0.08, - "learning_rate": 0.00028863267821236294, - "loss": 0.0435, + "epoch": 0.04, + "learning_rate": 0.0002946950471971787, + "loss": 0.0505, "step": 7010 }, { - "epoch": 0.08, - "learning_rate": 0.00028861646234676006, - "loss": 0.0446, + "epoch": 0.04, + "learning_rate": 0.0002946874795041647, + "loss": 0.0615, "step": 7020 }, { - "epoch": 0.08, - "learning_rate": 0.0002886002464811572, - "loss": 0.0447, + "epoch": 0.04, + "learning_rate": 0.00029467991181115073, + "loss": 0.0509, "step": 7030 }, { - "epoch": 0.08, - "learning_rate": 0.00028858403061555424, - "loss": 0.0341, + "epoch": 0.04, + "learning_rate": 0.0002946723441181367, + "loss": 0.0462, "step": 7040 }, { - "epoch": 0.08, - "learning_rate": 0.0002885678147499513, - "loss": 0.0362, + "epoch": 0.04, + "learning_rate": 0.0002946647764251227, + "loss": 0.0421, "step": 7050 }, { - "epoch": 0.08, - "learning_rate": 0.0002885515988843484, - "loss": 0.0411, + "epoch": 0.04, + "learning_rate": 0.00029465720873210867, + "loss": 0.0414, "step": 7060 }, { - "epoch": 0.08, - "learning_rate": 0.00028853538301874555, - "loss": 0.0467, + "epoch": 0.04, + "learning_rate": 0.00029464964103909465, + "loss": 0.0405, "step": 7070 }, { - "epoch": 0.08, - "learning_rate": 0.0002885191671531426, - "loss": 0.0403, + "epoch": 0.04, + "learning_rate": 0.00029464207334608064, + "loss": 0.0436, "step": 7080 }, { - "epoch": 0.08, - "learning_rate": 0.0002885029512875397, - "loss": 0.0409, + "epoch": 0.04, + "learning_rate": 0.0002946345056530666, + "loss": 0.0425, "step": 7090 }, { - "epoch": 0.08, - "learning_rate": 0.0002884867354219368, - "loss": 0.0412, + "epoch": 0.04, + "learning_rate": 0.00029462693796005265, + "loss": 0.0442, "step": 7100 }, { - "epoch": 0.08, - "learning_rate": 0.0002884705195563339, - "loss": 0.0408, + "epoch": 0.04, + "learning_rate": 0.00029461937026703863, + "loss": 0.0411, "step": 7110 }, { - "epoch": 0.08, - "learning_rate": 0.000288454303690731, - "loss": 0.0475, + "epoch": 0.04, + "learning_rate": 0.0002946118025740246, + "loss": 0.0409, "step": 7120 }, { - "epoch": 0.08, - "learning_rate": 0.00028843808782512805, - "loss": 0.0398, + "epoch": 0.04, + "learning_rate": 0.0002946042348810106, + "loss": 0.0415, "step": 7130 }, { - "epoch": 0.08, - "learning_rate": 0.00028842187195952517, - "loss": 0.0436, + "epoch": 0.04, + "learning_rate": 0.0002945966671879966, + "loss": 0.0379, "step": 7140 }, { - "epoch": 0.08, - "learning_rate": 0.0002884056560939223, - "loss": 0.0405, + "epoch": 0.04, + "learning_rate": 0.00029458909949498256, + "loss": 0.0438, "step": 7150 }, { - "epoch": 0.08, - "learning_rate": 0.00028838944022831935, - "loss": 0.0405, + "epoch": 0.04, + "learning_rate": 0.0002945815318019686, + "loss": 0.0488, "step": 7160 }, { - "epoch": 0.08, - "learning_rate": 0.0002883732243627165, - "loss": 0.0364, + "epoch": 0.04, + "learning_rate": 0.0002945739641089546, + "loss": 0.0399, "step": 7170 }, { - "epoch": 0.08, - "learning_rate": 0.00028835700849711354, - "loss": 0.037, + "epoch": 0.04, + "learning_rate": 0.00029456639641594056, + "loss": 0.0477, "step": 7180 }, { - "epoch": 0.08, - "learning_rate": 0.00028834079263151066, - "loss": 0.0437, + "epoch": 0.04, + "learning_rate": 0.00029455882872292654, + "loss": 0.0425, "step": 7190 }, { - "epoch": 0.08, - "learning_rate": 0.0002883245767659078, - "loss": 0.0445, + "epoch": 0.04, + "learning_rate": 0.0002945512610299125, + "loss": 0.0436, "step": 7200 }, { - "epoch": 0.08, - "learning_rate": 0.00028830836090030484, - "loss": 0.0442, + "epoch": 0.04, + "learning_rate": 0.0002945436933368985, + "loss": 0.0417, "step": 7210 }, { - "epoch": 0.08, - "learning_rate": 0.0002882921450347019, - "loss": 0.0418, + "epoch": 0.04, + "learning_rate": 0.00029453612564388454, + "loss": 0.0403, "step": 7220 }, { - "epoch": 0.08, - "learning_rate": 0.00028827592916909903, - "loss": 0.0386, + "epoch": 0.04, + "learning_rate": 0.0002945285579508705, + "loss": 0.0378, "step": 7230 }, { - "epoch": 0.08, - "learning_rate": 0.00028825971330349615, - "loss": 0.035, + "epoch": 0.04, + "learning_rate": 0.0002945209902578565, + "loss": 0.045, "step": 7240 }, { - "epoch": 0.08, - "learning_rate": 0.0002882434974378932, - "loss": 0.0475, + "epoch": 0.04, + "learning_rate": 0.0002945134225648425, + "loss": 0.0385, "step": 7250 }, { - "epoch": 0.08, - "learning_rate": 0.0002882272815722903, - "loss": 0.0443, + "epoch": 0.04, + "learning_rate": 0.00029450585487182846, + "loss": 0.0402, "step": 7260 }, { - "epoch": 0.08, - "learning_rate": 0.0002882110657066874, - "loss": 0.0397, + "epoch": 0.04, + "learning_rate": 0.00029449828717881445, + "loss": 0.0473, "step": 7270 }, { - "epoch": 0.08, - "learning_rate": 0.0002881948498410845, - "loss": 0.04, + "epoch": 0.04, + "learning_rate": 0.0002944907194858004, + "loss": 0.0433, "step": 7280 }, { - "epoch": 0.08, - "learning_rate": 0.0002881786339754816, - "loss": 0.0455, + "epoch": 0.04, + "learning_rate": 0.00029448315179278646, + "loss": 0.0402, "step": 7290 }, { - "epoch": 0.08, - "learning_rate": 0.00028816241810987865, - "loss": 0.0381, + "epoch": 0.04, + "learning_rate": 0.00029447558409977244, + "loss": 0.04, "step": 7300 }, { - "epoch": 0.08, - "learning_rate": 0.00028814620224427577, - "loss": 0.0367, + "epoch": 0.04, + "learning_rate": 0.0002944680164067584, + "loss": 0.0422, "step": 7310 }, { - "epoch": 0.08, - "learning_rate": 0.0002881299863786729, - "loss": 0.04, + "epoch": 0.04, + "learning_rate": 0.0002944604487137444, + "loss": 0.043, "step": 7320 }, { - "epoch": 0.08, - "learning_rate": 0.00028811377051306996, - "loss": 0.0424, + "epoch": 0.04, + "learning_rate": 0.0002944528810207304, + "loss": 0.0423, "step": 7330 }, { - "epoch": 0.08, - "learning_rate": 0.0002880975546474671, - "loss": 0.0459, + "epoch": 0.04, + "learning_rate": 0.00029444531332771637, + "loss": 0.0394, "step": 7340 }, { - "epoch": 0.08, - "learning_rate": 0.00028808133878186414, - "loss": 0.0368, + "epoch": 0.04, + "learning_rate": 0.0002944377456347024, + "loss": 0.0409, "step": 7350 }, { - "epoch": 0.08, - "learning_rate": 0.00028806512291626126, - "loss": 0.0415, + "epoch": 0.04, + "learning_rate": 0.0002944301779416884, + "loss": 0.038, "step": 7360 }, { - "epoch": 0.08, - "learning_rate": 0.00028804890705065833, - "loss": 0.0438, + "epoch": 0.04, + "learning_rate": 0.00029442261024867437, + "loss": 0.0363, "step": 7370 }, { - "epoch": 0.08, - "learning_rate": 0.00028803269118505545, - "loss": 0.0513, + "epoch": 0.04, + "learning_rate": 0.00029441504255566035, + "loss": 0.0443, "step": 7380 }, { - "epoch": 0.08, - "learning_rate": 0.0002880164753194525, - "loss": 0.0311, + "epoch": 0.04, + "learning_rate": 0.00029440747486264633, + "loss": 0.0407, "step": 7390 }, { - "epoch": 0.08, - "learning_rate": 0.00028800025945384963, - "loss": 0.0439, + "epoch": 0.04, + "learning_rate": 0.0002943999071696323, + "loss": 0.0506, "step": 7400 }, { - "epoch": 0.08, - "learning_rate": 0.0002879840435882467, - "loss": 0.046, + "epoch": 0.04, + "learning_rate": 0.00029439233947661835, + "loss": 0.0434, "step": 7410 }, { - "epoch": 0.08, - "learning_rate": 0.0002879678277226438, - "loss": 0.0427, + "epoch": 0.04, + "learning_rate": 0.00029438477178360433, + "loss": 0.0501, "step": 7420 }, { - "epoch": 0.08, - "learning_rate": 0.0002879516118570409, - "loss": 0.0415, + "epoch": 0.04, + "learning_rate": 0.0002943772040905903, + "loss": 0.05, "step": 7430 }, { - "epoch": 0.08, - "learning_rate": 0.000287935395991438, - "loss": 0.0494, + "epoch": 0.04, + "learning_rate": 0.0002943696363975763, + "loss": 0.0444, "step": 7440 }, { - "epoch": 0.08, - "learning_rate": 0.00028791918012583507, - "loss": 0.0359, + "epoch": 0.04, + "learning_rate": 0.0002943620687045623, + "loss": 0.0354, "step": 7450 }, { - "epoch": 0.08, - "learning_rate": 0.0002879029642602322, - "loss": 0.0415, + "epoch": 0.04, + "learning_rate": 0.00029435450101154826, + "loss": 0.0387, "step": 7460 }, { - "epoch": 0.08, - "learning_rate": 0.0002878867483946293, - "loss": 0.0451, + "epoch": 0.04, + "learning_rate": 0.00029434693331853424, + "loss": 0.0454, "step": 7470 }, { - "epoch": 0.08, - "learning_rate": 0.0002878705325290264, - "loss": 0.0517, + "epoch": 0.04, + "learning_rate": 0.00029433936562552027, + "loss": 0.0397, "step": 7480 }, { - "epoch": 0.08, - "learning_rate": 0.00028785431666342344, - "loss": 0.0418, + "epoch": 0.04, + "learning_rate": 0.00029433179793250625, + "loss": 0.0448, "step": 7490 }, { - "epoch": 0.08, - "learning_rate": 0.00028783810079782056, - "loss": 0.0431, + "epoch": 0.04, + "learning_rate": 0.00029432423023949224, + "loss": 0.0408, "step": 7500 }, { - "epoch": 0.08, - "learning_rate": 0.0002878218849322177, - "loss": 0.0654, + "epoch": 0.04, + "learning_rate": 0.0002943166625464782, + "loss": 0.046, "step": 7510 }, { - "epoch": 0.08, - "learning_rate": 0.00028780566906661475, - "loss": 0.0419, + "epoch": 0.04, + "learning_rate": 0.0002943090948534642, + "loss": 0.0449, "step": 7520 }, { - "epoch": 0.08, - "learning_rate": 0.0002877894532010118, + "epoch": 0.04, + "learning_rate": 0.0002943015271604502, "loss": 0.0428, "step": 7530 }, { - "epoch": 0.08, - "learning_rate": 0.00028777323733540893, - "loss": 0.0423, + "epoch": 0.04, + "learning_rate": 0.0002942939594674362, + "loss": 0.04, "step": 7540 }, { - "epoch": 0.08, - "learning_rate": 0.00028775702146980605, - "loss": 0.0395, + "epoch": 0.04, + "learning_rate": 0.0002942863917744222, + "loss": 0.0422, "step": 7550 }, { - "epoch": 0.08, - "learning_rate": 0.0002877408056042031, - "loss": 0.0416, + "epoch": 0.04, + "learning_rate": 0.0002942788240814082, + "loss": 0.0374, "step": 7560 }, { - "epoch": 0.08, - "learning_rate": 0.0002877245897386002, - "loss": 0.0433, + "epoch": 0.04, + "learning_rate": 0.00029427125638839416, + "loss": 0.0432, "step": 7570 }, { - "epoch": 0.08, - "learning_rate": 0.0002877083738729973, - "loss": 0.0476, + "epoch": 0.04, + "learning_rate": 0.00029426368869538014, + "loss": 0.0425, "step": 7580 }, { - "epoch": 0.08, - "learning_rate": 0.0002876921580073944, - "loss": 0.0383, + "epoch": 0.04, + "learning_rate": 0.0002942561210023661, + "loss": 0.0372, "step": 7590 }, { - "epoch": 0.08, - "learning_rate": 0.0002876759421417915, - "loss": 0.0446, + "epoch": 0.04, + "learning_rate": 0.0002942485533093521, + "loss": 0.0396, "step": 7600 }, { - "epoch": 0.08, - "learning_rate": 0.0002876597262761886, - "loss": 0.0447, + "epoch": 0.04, + "learning_rate": 0.00029424098561633814, + "loss": 0.0368, "step": 7610 }, { - "epoch": 0.08, - "learning_rate": 0.0002876435104105857, - "loss": 0.0401, + "epoch": 0.04, + "learning_rate": 0.0002942334179233241, + "loss": 0.0451, "step": 7620 }, { - "epoch": 0.08, - "learning_rate": 0.0002876272945449828, - "loss": 0.0409, + "epoch": 0.04, + "learning_rate": 0.0002942258502303101, + "loss": 0.0437, "step": 7630 }, { - "epoch": 0.08, - "learning_rate": 0.0002876110786793799, - "loss": 0.0411, + "epoch": 0.04, + "learning_rate": 0.0002942182825372961, + "loss": 0.0516, "step": 7640 }, { - "epoch": 0.08, - "learning_rate": 0.000287594862813777, - "loss": 0.0378, + "epoch": 0.04, + "learning_rate": 0.00029421071484428207, + "loss": 0.0346, "step": 7650 }, { - "epoch": 0.08, - "learning_rate": 0.00028757864694817405, - "loss": 0.0465, + "epoch": 0.04, + "learning_rate": 0.00029420314715126805, + "loss": 0.0381, "step": 7660 }, { - "epoch": 0.08, - "learning_rate": 0.00028756243108257117, - "loss": 0.0413, + "epoch": 0.04, + "learning_rate": 0.0002941955794582541, + "loss": 0.0469, "step": 7670 }, { - "epoch": 0.08, - "learning_rate": 0.0002875462152169683, - "loss": 0.0387, + "epoch": 0.04, + "learning_rate": 0.00029418801176524006, + "loss": 0.0404, "step": 7680 }, { - "epoch": 0.08, - "learning_rate": 0.00028752999935136535, - "loss": 0.049, + "epoch": 0.04, + "learning_rate": 0.00029418044407222605, + "loss": 0.0437, "step": 7690 }, { - "epoch": 0.08, - "learning_rate": 0.0002875137834857624, - "loss": 0.0463, + "epoch": 0.04, + "learning_rate": 0.000294172876379212, + "loss": 0.0414, "step": 7700 }, { - "epoch": 0.08, - "learning_rate": 0.00028749756762015954, - "loss": 0.0371, + "epoch": 0.04, + "learning_rate": 0.000294165308686198, + "loss": 0.0486, "step": 7710 }, { - "epoch": 0.08, - "learning_rate": 0.00028748135175455666, - "loss": 0.0403, + "epoch": 0.04, + "learning_rate": 0.000294157740993184, + "loss": 0.0429, "step": 7720 }, { - "epoch": 0.08, - "learning_rate": 0.0002874651358889537, - "loss": 0.0415, + "epoch": 0.04, + "learning_rate": 0.00029415017330017, + "loss": 0.0445, "step": 7730 }, { - "epoch": 0.08, - "learning_rate": 0.00028744892002335084, - "loss": 0.0452, + "epoch": 0.04, + "learning_rate": 0.000294142605607156, + "loss": 0.0423, "step": 7740 }, { - "epoch": 0.08, - "learning_rate": 0.0002874327041577479, - "loss": 0.0383, + "epoch": 0.04, + "learning_rate": 0.000294135037914142, + "loss": 0.0376, "step": 7750 }, { - "epoch": 0.08, - "learning_rate": 0.000287416488292145, - "loss": 0.0394, + "epoch": 0.04, + "learning_rate": 0.00029412747022112797, + "loss": 0.0449, "step": 7760 }, { - "epoch": 0.08, - "learning_rate": 0.0002874002724265421, - "loss": 0.0362, + "epoch": 0.04, + "learning_rate": 0.00029411990252811395, + "loss": 0.0464, "step": 7770 }, { - "epoch": 0.08, - "learning_rate": 0.0002873840565609392, - "loss": 0.043, + "epoch": 0.04, + "learning_rate": 0.00029411233483509993, + "loss": 0.0354, "step": 7780 }, { - "epoch": 0.08, - "learning_rate": 0.0002873678406953363, - "loss": 0.0395, + "epoch": 0.04, + "learning_rate": 0.0002941047671420859, + "loss": 0.0362, "step": 7790 }, { - "epoch": 0.08, - "learning_rate": 0.0002873516248297334, - "loss": 0.0391, + "epoch": 0.04, + "learning_rate": 0.00029409719944907195, + "loss": 0.0384, "step": 7800 }, { - "epoch": 0.08, - "learning_rate": 0.00028733540896413046, - "loss": 0.0403, + "epoch": 0.04, + "learning_rate": 0.00029408963175605793, + "loss": 0.036, "step": 7810 }, { - "epoch": 0.08, - "learning_rate": 0.0002873191930985276, - "loss": 0.0384, + "epoch": 0.04, + "learning_rate": 0.0002940820640630439, + "loss": 0.0413, "step": 7820 }, { - "epoch": 0.08, - "learning_rate": 0.00028730297723292465, - "loss": 0.0396, + "epoch": 0.04, + "learning_rate": 0.0002940744963700299, + "loss": 0.0345, "step": 7830 }, { - "epoch": 0.08, - "learning_rate": 0.00028728676136732177, - "loss": 0.0361, + "epoch": 0.04, + "learning_rate": 0.0002940669286770159, + "loss": 0.0379, "step": 7840 }, { - "epoch": 0.08, - "learning_rate": 0.00028727054550171883, - "loss": 0.0409, + "epoch": 0.04, + "learning_rate": 0.00029405936098400186, + "loss": 0.0438, "step": 7850 }, { - "epoch": 0.08, - "learning_rate": 0.00028725432963611595, - "loss": 0.0379, + "epoch": 0.04, + "learning_rate": 0.0002940517932909879, + "loss": 0.0433, "step": 7860 }, { - "epoch": 0.09, - "learning_rate": 0.000287238113770513, - "loss": 0.0418, + "epoch": 0.04, + "learning_rate": 0.0002940442255979739, + "loss": 0.0404, "step": 7870 }, { - "epoch": 0.09, - "learning_rate": 0.00028722189790491014, - "loss": 0.0424, + "epoch": 0.04, + "learning_rate": 0.00029403665790495986, + "loss": 0.0398, "step": 7880 }, { - "epoch": 0.09, - "learning_rate": 0.0002872056820393072, - "loss": 0.0422, + "epoch": 0.04, + "learning_rate": 0.00029402909021194584, + "loss": 0.0438, "step": 7890 }, { - "epoch": 0.09, - "learning_rate": 0.0002871894661737043, - "loss": 0.0484, + "epoch": 0.04, + "learning_rate": 0.0002940215225189318, + "loss": 0.0405, "step": 7900 }, { - "epoch": 0.09, - "learning_rate": 0.00028717325030810145, - "loss": 0.0437, + "epoch": 0.04, + "learning_rate": 0.0002940139548259178, + "loss": 0.0459, "step": 7910 }, { - "epoch": 0.09, - "learning_rate": 0.0002871570344424985, - "loss": 0.0362, + "epoch": 0.04, + "learning_rate": 0.00029400638713290384, + "loss": 0.049, "step": 7920 }, { - "epoch": 0.09, - "learning_rate": 0.00028714081857689563, - "loss": 0.0387, + "epoch": 0.04, + "learning_rate": 0.0002939988194398898, + "loss": 0.0392, "step": 7930 }, { - "epoch": 0.09, - "learning_rate": 0.0002871246027112927, - "loss": 0.0394, + "epoch": 0.04, + "learning_rate": 0.0002939912517468758, + "loss": 0.0387, "step": 7940 }, { - "epoch": 0.09, - "learning_rate": 0.0002871083868456898, - "loss": 0.0425, + "epoch": 0.04, + "learning_rate": 0.0002939836840538618, + "loss": 0.0401, "step": 7950 }, { - "epoch": 0.09, - "learning_rate": 0.0002870921709800869, - "loss": 0.0481, + "epoch": 0.04, + "learning_rate": 0.00029397611636084776, + "loss": 0.0488, "step": 7960 }, { - "epoch": 0.09, - "learning_rate": 0.000287075955114484, - "loss": 0.0438, + "epoch": 0.04, + "learning_rate": 0.00029396854866783374, + "loss": 0.0453, "step": 7970 }, { - "epoch": 0.09, - "learning_rate": 0.00028705973924888107, - "loss": 0.0413, + "epoch": 0.04, + "learning_rate": 0.0002939609809748197, + "loss": 0.0404, "step": 7980 }, { - "epoch": 0.09, - "learning_rate": 0.0002870435233832782, - "loss": 0.0447, + "epoch": 0.04, + "learning_rate": 0.00029395341328180576, + "loss": 0.0408, "step": 7990 }, { - "epoch": 0.09, - "learning_rate": 0.00028702730751767525, - "loss": 0.0452, + "epoch": 0.04, + "learning_rate": 0.00029394584558879174, + "loss": 0.0365, "step": 8000 }, { - "epoch": 0.09, - "eval_cer": 0.9215668902450677, - "eval_loss": 0.03050500527024269, - "eval_runtime": 119.8198, - "eval_samples_per_second": 16.692, - "eval_steps_per_second": 4.173, + "epoch": 0.04, + "eval_cer": 0.9145313908590625, + "eval_loss": 0.03206906095147133, + "eval_runtime": 117.4386, + "eval_samples_per_second": 17.03, + "eval_steps_per_second": 4.258, "step": 8000 }, { - "epoch": 0.09, - "learning_rate": 0.00028701109165207237, - "loss": 0.0518, + "epoch": 0.04, + "learning_rate": 0.0002939382778957777, + "loss": 0.0413, "step": 8010 }, { - "epoch": 0.09, - "learning_rate": 0.00028699487578646944, - "loss": 0.0419, + "epoch": 0.04, + "learning_rate": 0.0002939307102027637, + "loss": 0.0405, "step": 8020 }, { - "epoch": 0.09, - "learning_rate": 0.00028697865992086656, - "loss": 0.0416, + "epoch": 0.04, + "learning_rate": 0.0002939231425097497, + "loss": 0.0403, "step": 8030 }, { - "epoch": 0.09, - "learning_rate": 0.0002869624440552637, - "loss": 0.0452, + "epoch": 0.04, + "learning_rate": 0.00029391557481673567, + "loss": 0.0382, "step": 8040 }, { - "epoch": 0.09, - "learning_rate": 0.00028694622818966074, - "loss": 0.0394, + "epoch": 0.04, + "learning_rate": 0.0002939080071237217, + "loss": 0.0399, "step": 8050 }, { - "epoch": 0.09, - "learning_rate": 0.0002869300123240578, - "loss": 0.0382, + "epoch": 0.04, + "learning_rate": 0.0002939004394307077, + "loss": 0.0431, "step": 8060 }, { - "epoch": 0.09, - "learning_rate": 0.00028691379645845493, - "loss": 0.0397, + "epoch": 0.04, + "learning_rate": 0.00029389287173769367, + "loss": 0.0478, "step": 8070 }, { - "epoch": 0.09, - "learning_rate": 0.00028689758059285205, - "loss": 0.0354, + "epoch": 0.04, + "learning_rate": 0.00029388530404467965, + "loss": 0.0366, "step": 8080 }, { - "epoch": 0.09, - "learning_rate": 0.0002868813647272491, - "loss": 0.0351, + "epoch": 0.04, + "learning_rate": 0.00029387773635166563, + "loss": 0.037, "step": 8090 }, { - "epoch": 0.09, - "learning_rate": 0.0002868651488616462, - "loss": 0.0386, + "epoch": 0.04, + "learning_rate": 0.0002938701686586516, + "loss": 0.0357, "step": 8100 }, { - "epoch": 0.09, - "learning_rate": 0.0002868489329960433, - "loss": 0.0413, + "epoch": 0.04, + "learning_rate": 0.0002938626009656376, + "loss": 0.0408, "step": 8110 }, { - "epoch": 0.09, - "learning_rate": 0.0002868327171304404, - "loss": 0.0391, + "epoch": 0.04, + "learning_rate": 0.0002938550332726236, + "loss": 0.0392, "step": 8120 }, { - "epoch": 0.09, - "learning_rate": 0.0002868165012648375, - "loss": 0.041, + "epoch": 0.04, + "learning_rate": 0.0002938474655796096, + "loss": 0.0465, "step": 8130 }, { - "epoch": 0.09, - "learning_rate": 0.00028680028539923455, - "loss": 0.0412, + "epoch": 0.04, + "learning_rate": 0.0002938398978865956, + "loss": 0.0369, "step": 8140 }, { - "epoch": 0.09, - "learning_rate": 0.00028678406953363167, - "loss": 0.0409, + "epoch": 0.04, + "learning_rate": 0.00029383233019358157, + "loss": 0.0439, "step": 8150 }, { - "epoch": 0.09, - "learning_rate": 0.0002867678536680288, - "loss": 0.0415, + "epoch": 0.04, + "learning_rate": 0.00029382476250056755, + "loss": 0.0455, "step": 8160 }, { - "epoch": 0.09, - "learning_rate": 0.00028675163780242586, - "loss": 0.0429, + "epoch": 0.04, + "learning_rate": 0.00029381719480755353, + "loss": 0.0379, "step": 8170 }, { - "epoch": 0.09, - "learning_rate": 0.000286735421936823, - "loss": 0.0384, + "epoch": 0.04, + "learning_rate": 0.0002938096271145395, + "loss": 0.0352, "step": 8180 }, { - "epoch": 0.09, - "learning_rate": 0.00028671920607122004, - "loss": 0.0387, + "epoch": 0.04, + "learning_rate": 0.0002938020594215255, + "loss": 0.0366, "step": 8190 }, { - "epoch": 0.09, - "learning_rate": 0.00028670299020561716, - "loss": 0.0399, + "epoch": 0.04, + "learning_rate": 0.0002937944917285115, + "loss": 0.04, "step": 8200 }, { - "epoch": 0.09, - "learning_rate": 0.0002866867743400143, - "loss": 0.0387, + "epoch": 0.04, + "learning_rate": 0.00029378692403549746, + "loss": 0.0367, "step": 8210 }, { - "epoch": 0.09, - "learning_rate": 0.00028667055847441135, - "loss": 0.0371, + "epoch": 0.04, + "learning_rate": 0.0002937793563424835, + "loss": 0.0417, "step": 8220 }, { - "epoch": 0.09, - "learning_rate": 0.0002866543426088084, - "loss": 0.0357, + "epoch": 0.04, + "learning_rate": 0.0002937717886494695, + "loss": 0.0412, "step": 8230 }, { - "epoch": 0.09, - "learning_rate": 0.00028663812674320553, - "loss": 0.0426, + "epoch": 0.04, + "learning_rate": 0.00029376422095645546, + "loss": 0.0383, "step": 8240 }, { - "epoch": 0.09, - "learning_rate": 0.00028662191087760265, - "loss": 0.0356, + "epoch": 0.04, + "learning_rate": 0.00029375665326344144, + "loss": 0.0383, "step": 8250 }, { - "epoch": 0.09, - "learning_rate": 0.0002866056950119997, - "loss": 0.0348, + "epoch": 0.04, + "learning_rate": 0.0002937490855704274, + "loss": 0.0386, "step": 8260 }, { - "epoch": 0.09, - "learning_rate": 0.0002865894791463968, - "loss": 0.0402, + "epoch": 0.04, + "learning_rate": 0.0002937415178774134, + "loss": 0.041, "step": 8270 }, { - "epoch": 0.09, - "learning_rate": 0.0002865732632807939, - "loss": 0.0398, + "epoch": 0.04, + "learning_rate": 0.00029373395018439944, + "loss": 0.0444, "step": 8280 }, { - "epoch": 0.09, - "learning_rate": 0.000286557047415191, - "loss": 0.0357, + "epoch": 0.04, + "learning_rate": 0.0002937263824913854, + "loss": 0.0399, "step": 8290 }, { - "epoch": 0.09, - "learning_rate": 0.0002865408315495881, - "loss": 0.0335, + "epoch": 0.04, + "learning_rate": 0.0002937188147983714, + "loss": 0.0458, "step": 8300 }, { - "epoch": 0.09, - "learning_rate": 0.00028652461568398515, - "loss": 0.0421, + "epoch": 0.04, + "learning_rate": 0.0002937112471053574, + "loss": 0.036, "step": 8310 }, { - "epoch": 0.09, - "learning_rate": 0.0002865083998183823, - "loss": 0.0378, + "epoch": 0.04, + "learning_rate": 0.00029370367941234336, + "loss": 0.0409, "step": 8320 }, { - "epoch": 0.09, - "learning_rate": 0.0002864921839527794, - "loss": 0.0373, + "epoch": 0.04, + "learning_rate": 0.00029369611171932935, + "loss": 0.0406, "step": 8330 }, { - "epoch": 0.09, - "learning_rate": 0.00028647596808717646, - "loss": 0.0373, + "epoch": 0.04, + "learning_rate": 0.00029368854402631533, + "loss": 0.0401, "step": 8340 }, { - "epoch": 0.09, - "learning_rate": 0.0002864597522215736, - "loss": 0.0401, + "epoch": 0.04, + "learning_rate": 0.00029368097633330136, + "loss": 0.0408, "step": 8350 }, { - "epoch": 0.09, - "learning_rate": 0.00028644353635597065, - "loss": 0.0374, + "epoch": 0.04, + "learning_rate": 0.00029367340864028734, + "loss": 0.035, "step": 8360 }, { - "epoch": 0.09, - "learning_rate": 0.00028642732049036777, - "loss": 0.0376, + "epoch": 0.04, + "learning_rate": 0.0002936658409472733, + "loss": 0.0411, "step": 8370 }, { - "epoch": 0.09, - "learning_rate": 0.00028641110462476483, - "loss": 0.042, + "epoch": 0.04, + "learning_rate": 0.0002936582732542593, + "loss": 0.0472, "step": 8380 }, { - "epoch": 0.09, - "learning_rate": 0.00028639488875916195, - "loss": 0.0381, + "epoch": 0.04, + "learning_rate": 0.0002936507055612453, + "loss": 0.0372, "step": 8390 }, { - "epoch": 0.09, - "learning_rate": 0.000286378672893559, - "loss": 0.0379, + "epoch": 0.04, + "learning_rate": 0.00029364313786823127, + "loss": 0.0366, "step": 8400 }, { - "epoch": 0.09, - "learning_rate": 0.00028636245702795614, - "loss": 0.0375, + "epoch": 0.04, + "learning_rate": 0.0002936355701752173, + "loss": 0.0368, "step": 8410 }, { - "epoch": 0.09, - "learning_rate": 0.0002863462411623532, - "loss": 0.0402, + "epoch": 0.04, + "learning_rate": 0.0002936280024822033, + "loss": 0.0372, "step": 8420 }, { - "epoch": 0.09, - "learning_rate": 0.0002863300252967503, - "loss": 0.0355, + "epoch": 0.04, + "learning_rate": 0.00029362043478918927, + "loss": 0.0373, "step": 8430 }, { - "epoch": 0.09, - "learning_rate": 0.0002863138094311474, - "loss": 0.0405, + "epoch": 0.04, + "learning_rate": 0.00029361286709617525, + "loss": 0.0376, "step": 8440 }, { - "epoch": 0.09, - "learning_rate": 0.0002862975935655445, - "loss": 0.0385, + "epoch": 0.04, + "learning_rate": 0.00029360529940316123, + "loss": 0.0405, "step": 8450 }, { - "epoch": 0.09, - "learning_rate": 0.0002862813776999416, - "loss": 0.0409, + "epoch": 0.04, + "learning_rate": 0.0002935977317101472, + "loss": 0.0445, "step": 8460 }, { - "epoch": 0.09, - "learning_rate": 0.0002862651618343387, - "loss": 0.0316, + "epoch": 0.04, + "learning_rate": 0.00029359016401713325, + "loss": 0.1198, "step": 8470 }, { - "epoch": 0.09, - "learning_rate": 0.0002862489459687358, - "loss": 0.0402, + "epoch": 0.04, + "learning_rate": 0.00029358259632411923, + "loss": 0.0436, "step": 8480 }, { - "epoch": 0.09, - "learning_rate": 0.0002862327301031329, - "loss": 0.0355, + "epoch": 0.04, + "learning_rate": 0.0002935750286311052, + "loss": 0.0414, "step": 8490 }, { - "epoch": 0.09, - "learning_rate": 0.00028621651423752994, - "loss": 0.0357, + "epoch": 0.04, + "learning_rate": 0.0002935674609380912, + "loss": 0.0396, "step": 8500 }, { - "epoch": 0.09, - "learning_rate": 0.00028620029837192706, - "loss": 0.0396, + "epoch": 0.04, + "learning_rate": 0.0002935598932450772, + "loss": 0.0366, "step": 8510 }, { - "epoch": 0.09, - "learning_rate": 0.0002861840825063242, - "loss": 0.0371, + "epoch": 0.04, + "learning_rate": 0.00029355232555206316, + "loss": 0.0383, "step": 8520 }, { - "epoch": 0.09, - "learning_rate": 0.00028616786664072125, - "loss": 0.0418, + "epoch": 0.04, + "learning_rate": 0.00029354475785904914, + "loss": 0.0715, "step": 8530 }, { - "epoch": 0.09, - "learning_rate": 0.0002861516507751183, - "loss": 0.0414, + "epoch": 0.04, + "learning_rate": 0.0002935371901660352, + "loss": 0.067, "step": 8540 }, { - "epoch": 0.09, - "learning_rate": 0.00028613543490951543, - "loss": 0.0383, + "epoch": 0.04, + "learning_rate": 0.00029352962247302115, + "loss": 0.0371, "step": 8550 }, { - "epoch": 0.09, - "learning_rate": 0.00028611921904391255, - "loss": 0.0455, + "epoch": 0.04, + "learning_rate": 0.00029352205478000714, + "loss": 0.0326, "step": 8560 }, { - "epoch": 0.09, - "learning_rate": 0.0002861030031783096, - "loss": 0.0417, + "epoch": 0.04, + "learning_rate": 0.0002935144870869931, + "loss": 0.0439, "step": 8570 }, { - "epoch": 0.09, - "learning_rate": 0.0002860867873127067, - "loss": 0.0404, + "epoch": 0.04, + "learning_rate": 0.0002935069193939791, + "loss": 0.0387, "step": 8580 }, { - "epoch": 0.09, - "learning_rate": 0.0002860705714471038, - "loss": 0.0327, + "epoch": 0.04, + "learning_rate": 0.0002934993517009651, + "loss": 0.0407, "step": 8590 }, { - "epoch": 0.09, - "learning_rate": 0.0002860543555815009, - "loss": 0.0338, + "epoch": 0.04, + "learning_rate": 0.0002934917840079511, + "loss": 0.0378, "step": 8600 }, { - "epoch": 0.09, - "learning_rate": 0.000286038139715898, - "loss": 0.0373, + "epoch": 0.04, + "learning_rate": 0.0002934842163149371, + "loss": 0.0389, "step": 8610 }, { - "epoch": 0.09, - "learning_rate": 0.0002860219238502951, - "loss": 0.0407, + "epoch": 0.04, + "learning_rate": 0.0002934766486219231, + "loss": 0.0462, "step": 8620 }, { - "epoch": 0.09, - "learning_rate": 0.0002860057079846922, + "epoch": 0.04, + "learning_rate": 0.00029346908092890906, "loss": 0.0362, "step": 8630 }, { - "epoch": 0.09, - "learning_rate": 0.0002859894921190893, - "loss": 0.0377, + "epoch": 0.04, + "learning_rate": 0.00029346151323589504, + "loss": 0.0355, "step": 8640 }, { - "epoch": 0.09, - "learning_rate": 0.0002859732762534864, - "loss": 0.0388, + "epoch": 0.04, + "learning_rate": 0.000293453945542881, + "loss": 0.0501, "step": 8650 }, { - "epoch": 0.09, - "learning_rate": 0.0002859570603878835, - "loss": 0.0397, + "epoch": 0.04, + "learning_rate": 0.000293446377849867, + "loss": 0.0372, "step": 8660 }, { - "epoch": 0.09, - "learning_rate": 0.00028594084452228055, - "loss": 0.0367, + "epoch": 0.04, + "learning_rate": 0.00029343881015685304, + "loss": 0.047, "step": 8670 }, { - "epoch": 0.09, - "learning_rate": 0.00028592462865667767, - "loss": 0.0396, + "epoch": 0.04, + "learning_rate": 0.000293431242463839, + "loss": 0.0424, "step": 8680 }, { - "epoch": 0.09, - "learning_rate": 0.0002859084127910748, - "loss": 0.0369, + "epoch": 0.04, + "learning_rate": 0.000293423674770825, + "loss": 0.0412, "step": 8690 }, { - "epoch": 0.09, - "learning_rate": 0.00028589219692547185, - "loss": 0.0322, + "epoch": 0.04, + "learning_rate": 0.000293416107077811, + "loss": 0.0422, "step": 8700 }, { - "epoch": 0.09, - "learning_rate": 0.0002858759810598689, - "loss": 0.0357, + "epoch": 0.04, + "learning_rate": 0.00029340853938479697, + "loss": 0.0416, "step": 8710 }, { - "epoch": 0.09, - "learning_rate": 0.00028585976519426604, - "loss": 0.0427, + "epoch": 0.04, + "learning_rate": 0.00029340097169178295, + "loss": 0.0439, "step": 8720 }, { - "epoch": 0.09, - "learning_rate": 0.00028584354932866316, - "loss": 0.0442, + "epoch": 0.04, + "learning_rate": 0.000293393403998769, + "loss": 0.0432, "step": 8730 }, { - "epoch": 0.09, - "learning_rate": 0.0002858273334630602, - "loss": 0.041, + "epoch": 0.04, + "learning_rate": 0.00029338583630575496, + "loss": 0.049, "step": 8740 }, { - "epoch": 0.09, - "learning_rate": 0.00028581111759745734, - "loss": 0.0381, + "epoch": 0.04, + "learning_rate": 0.00029337826861274095, + "loss": 0.0852, "step": 8750 }, { - "epoch": 0.09, - "learning_rate": 0.0002857949017318544, - "loss": 0.0382, + "epoch": 0.04, + "learning_rate": 0.00029337070091972693, + "loss": 0.0452, "step": 8760 }, { - "epoch": 0.09, - "learning_rate": 0.00028577868586625153, - "loss": 0.038, + "epoch": 0.04, + "learning_rate": 0.0002933631332267129, + "loss": 0.0722, "step": 8770 }, { - "epoch": 0.09, - "learning_rate": 0.00028576247000064865, - "loss": 0.0381, + "epoch": 0.04, + "learning_rate": 0.0002933555655336989, + "loss": 0.0839, "step": 8780 }, { - "epoch": 0.1, - "learning_rate": 0.0002857462541350457, - "loss": 0.0401, + "epoch": 0.04, + "learning_rate": 0.0002933479978406849, + "loss": 0.0442, "step": 8790 }, { - "epoch": 0.1, - "learning_rate": 0.0002857300382694428, - "loss": 0.0389, + "epoch": 0.04, + "learning_rate": 0.0002933404301476709, + "loss": 0.044, "step": 8800 }, { - "epoch": 0.1, - "learning_rate": 0.0002857138224038399, - "loss": 0.039, + "epoch": 0.04, + "learning_rate": 0.0002933328624546569, + "loss": 0.041, "step": 8810 }, { - "epoch": 0.1, - "learning_rate": 0.000285697606538237, - "loss": 0.0367, + "epoch": 0.04, + "learning_rate": 0.00029332529476164287, + "loss": 0.0471, "step": 8820 }, { - "epoch": 0.1, - "learning_rate": 0.0002856813906726341, - "loss": 0.0406, + "epoch": 0.04, + "learning_rate": 0.00029331772706862885, + "loss": 0.037, "step": 8830 }, { - "epoch": 0.1, - "learning_rate": 0.00028566517480703115, - "loss": 0.042, + "epoch": 0.04, + "learning_rate": 0.00029331015937561483, + "loss": 0.0418, "step": 8840 }, { - "epoch": 0.1, - "learning_rate": 0.00028564895894142827, - "loss": 0.0371, + "epoch": 0.04, + "learning_rate": 0.0002933025916826008, + "loss": 0.0411, "step": 8850 }, { - "epoch": 0.1, - "learning_rate": 0.0002856327430758254, - "loss": 0.0373, + "epoch": 0.04, + "learning_rate": 0.00029329502398958685, + "loss": 0.0448, "step": 8860 }, { - "epoch": 0.1, - "learning_rate": 0.00028561652721022246, - "loss": 0.0328, + "epoch": 0.04, + "learning_rate": 0.00029328745629657283, + "loss": 0.0363, "step": 8870 }, { - "epoch": 0.1, - "learning_rate": 0.0002856003113446195, - "loss": 0.0324, + "epoch": 0.04, + "learning_rate": 0.0002932798886035588, + "loss": 0.0438, "step": 8880 }, { - "epoch": 0.1, - "learning_rate": 0.00028558409547901664, - "loss": 0.0344, + "epoch": 0.04, + "learning_rate": 0.0002932723209105448, + "loss": 0.0372, "step": 8890 }, { - "epoch": 0.1, - "learning_rate": 0.00028556787961341376, - "loss": 0.0392, + "epoch": 0.04, + "learning_rate": 0.0002932647532175308, + "loss": 0.0423, "step": 8900 }, { - "epoch": 0.1, - "learning_rate": 0.00028555166374781083, - "loss": 0.0405, + "epoch": 0.04, + "learning_rate": 0.00029325718552451676, + "loss": 0.0412, "step": 8910 }, { - "epoch": 0.1, - "learning_rate": 0.00028553544788220795, - "loss": 0.0334, + "epoch": 0.05, + "learning_rate": 0.0002932496178315028, + "loss": 0.0338, "step": 8920 }, { - "epoch": 0.1, - "learning_rate": 0.000285519232016605, - "loss": 0.0453, + "epoch": 0.05, + "learning_rate": 0.0002932420501384888, + "loss": 0.0347, "step": 8930 }, { - "epoch": 0.1, - "learning_rate": 0.00028550301615100213, - "loss": 0.0385, + "epoch": 0.05, + "learning_rate": 0.00029323448244547476, + "loss": 0.0444, "step": 8940 }, { - "epoch": 0.1, - "learning_rate": 0.0002854868002853992, - "loss": 0.0401, + "epoch": 0.05, + "learning_rate": 0.00029322691475246074, + "loss": 0.0343, "step": 8950 }, { - "epoch": 0.1, - "learning_rate": 0.0002854705844197963, - "loss": 0.0404, + "epoch": 0.05, + "learning_rate": 0.0002932193470594467, + "loss": 0.0437, "step": 8960 }, { - "epoch": 0.1, - "learning_rate": 0.0002854543685541934, - "loss": 0.0386, + "epoch": 0.05, + "learning_rate": 0.0002932117793664327, + "loss": 0.04, "step": 8970 }, { - "epoch": 0.1, - "learning_rate": 0.0002854381526885905, - "loss": 0.038, + "epoch": 0.05, + "learning_rate": 0.00029320421167341874, + "loss": 0.0405, "step": 8980 }, { - "epoch": 0.1, - "learning_rate": 0.00028542193682298757, - "loss": 0.0369, + "epoch": 0.05, + "learning_rate": 0.0002931966439804047, + "loss": 0.0338, "step": 8990 }, { - "epoch": 0.1, - "learning_rate": 0.0002854057209573847, - "loss": 0.04, + "epoch": 0.05, + "learning_rate": 0.0002931890762873907, + "loss": 0.043, "step": 9000 }, { - "epoch": 0.1, - "eval_cer": 0.9215668902450677, - "eval_loss": 0.028050633147358894, - "eval_runtime": 119.8689, - "eval_samples_per_second": 16.685, - "eval_steps_per_second": 4.171, + "epoch": 0.05, + "eval_cer": 0.9145352724435641, + "eval_loss": 0.03075648657977581, + "eval_runtime": 117.5474, + "eval_samples_per_second": 17.014, + "eval_steps_per_second": 4.254, "step": 9000 }, { - "epoch": 0.1, - "learning_rate": 0.00028538950509178176, - "loss": 0.0479, + "epoch": 0.05, + "learning_rate": 0.0002931815085943767, + "loss": 0.0435, "step": 9010 }, { - "epoch": 0.1, - "learning_rate": 0.0002853732892261789, - "loss": 0.0459, + "epoch": 0.05, + "learning_rate": 0.00029317394090136266, + "loss": 0.0368, "step": 9020 }, { - "epoch": 0.1, - "learning_rate": 0.00028535707336057594, - "loss": 0.0374, + "epoch": 0.05, + "learning_rate": 0.00029316637320834864, + "loss": 0.0428, "step": 9030 }, { - "epoch": 0.1, - "learning_rate": 0.00028534085749497306, - "loss": 0.0451, + "epoch": 0.05, + "learning_rate": 0.0002931588055153346, + "loss": 0.0391, "step": 9040 }, { - "epoch": 0.1, - "learning_rate": 0.0002853246416293702, - "loss": 0.0394, + "epoch": 0.05, + "learning_rate": 0.00029315123782232066, + "loss": 0.0364, "step": 9050 }, { - "epoch": 0.1, - "learning_rate": 0.00028530842576376725, - "loss": 0.0412, + "epoch": 0.05, + "learning_rate": 0.00029314367012930664, + "loss": 0.0351, "step": 9060 }, { - "epoch": 0.1, - "learning_rate": 0.0002852922098981643, - "loss": 0.0406, + "epoch": 0.05, + "learning_rate": 0.0002931361024362926, + "loss": 0.0363, "step": 9070 }, { - "epoch": 0.1, - "learning_rate": 0.00028527599403256143, + "epoch": 0.05, + "learning_rate": 0.0002931285347432786, "loss": 0.0389, "step": 9080 }, { - "epoch": 0.1, - "learning_rate": 0.00028525977816695855, - "loss": 0.0364, + "epoch": 0.05, + "learning_rate": 0.0002931209670502646, + "loss": 0.0447, "step": 9090 }, { - "epoch": 0.1, - "learning_rate": 0.0002852435623013556, - "loss": 0.0407, + "epoch": 0.05, + "learning_rate": 0.00029311339935725057, + "loss": 0.0385, "step": 9100 }, { - "epoch": 0.1, - "learning_rate": 0.0002852273464357527, - "loss": 0.0449, + "epoch": 0.05, + "learning_rate": 0.0002931058316642366, + "loss": 0.0429, "step": 9110 }, { - "epoch": 0.1, - "learning_rate": 0.0002852111305701498, - "loss": 0.045, + "epoch": 0.05, + "learning_rate": 0.0002930982639712226, + "loss": 0.0399, "step": 9120 }, { - "epoch": 0.1, - "learning_rate": 0.0002851949147045469, - "loss": 0.0459, + "epoch": 0.05, + "learning_rate": 0.00029309069627820857, + "loss": 0.0383, "step": 9130 }, { - "epoch": 0.1, - "learning_rate": 0.000285178698838944, - "loss": 0.0339, + "epoch": 0.05, + "learning_rate": 0.00029308312858519455, + "loss": 0.0303, "step": 9140 }, { - "epoch": 0.1, - "learning_rate": 0.00028516248297334105, - "loss": 0.0385, + "epoch": 0.05, + "learning_rate": 0.00029307556089218053, + "loss": 0.042, "step": 9150 }, { - "epoch": 0.1, - "learning_rate": 0.0002851462671077382, - "loss": 0.0414, + "epoch": 0.05, + "learning_rate": 0.0002930679931991665, + "loss": 0.0415, "step": 9160 }, { - "epoch": 0.1, - "learning_rate": 0.0002851300512421353, - "loss": 0.0394, + "epoch": 0.05, + "learning_rate": 0.0002930604255061525, + "loss": 0.038, "step": 9170 }, { - "epoch": 0.1, - "learning_rate": 0.00028511383537653236, - "loss": 0.0409, + "epoch": 0.05, + "learning_rate": 0.00029305285781313853, + "loss": 0.0375, "step": 9180 }, { - "epoch": 0.1, - "learning_rate": 0.0002850976195109295, - "loss": 0.0339, + "epoch": 0.05, + "learning_rate": 0.0002930452901201245, + "loss": 0.0364, "step": 9190 }, { - "epoch": 0.1, - "learning_rate": 0.00028508140364532654, - "loss": 0.0434, + "epoch": 0.05, + "learning_rate": 0.0002930377224271105, + "loss": 0.0377, "step": 9200 }, { - "epoch": 0.1, - "learning_rate": 0.00028506518777972366, - "loss": 0.0376, + "epoch": 0.05, + "learning_rate": 0.00029303015473409647, + "loss": 0.0382, "step": 9210 }, { - "epoch": 0.1, - "learning_rate": 0.0002850489719141208, - "loss": 0.0767, + "epoch": 0.05, + "learning_rate": 0.00029302258704108245, + "loss": 0.0425, "step": 9220 }, { - "epoch": 0.1, - "learning_rate": 0.00028503275604851785, - "loss": 0.0393, + "epoch": 0.05, + "learning_rate": 0.00029301501934806843, + "loss": 0.0377, "step": 9230 }, { - "epoch": 0.1, - "learning_rate": 0.0002850165401829149, - "loss": 0.0356, + "epoch": 0.05, + "learning_rate": 0.00029300745165505447, + "loss": 0.0442, "step": 9240 }, { - "epoch": 0.1, - "learning_rate": 0.00028500032431731204, - "loss": 0.037, + "epoch": 0.05, + "learning_rate": 0.00029299988396204045, + "loss": 0.0396, "step": 9250 }, { - "epoch": 0.1, - "learning_rate": 0.00028498410845170916, - "loss": 0.0411, + "epoch": 0.05, + "learning_rate": 0.00029299231626902643, + "loss": 0.0383, "step": 9260 }, { - "epoch": 0.1, - "learning_rate": 0.0002849678925861062, - "loss": 0.0377, + "epoch": 0.05, + "learning_rate": 0.0002929847485760124, + "loss": 0.0436, "step": 9270 }, { - "epoch": 0.1, - "learning_rate": 0.0002849516767205033, + "epoch": 0.05, + "learning_rate": 0.0002929771808829984, "loss": 0.0385, "step": 9280 }, { - "epoch": 0.1, - "learning_rate": 0.0002849354608549004, - "loss": 0.0434, + "epoch": 0.05, + "learning_rate": 0.0002929696131899844, + "loss": 0.0407, "step": 9290 }, { - "epoch": 0.1, - "learning_rate": 0.0002849192449892975, - "loss": 0.0373, + "epoch": 0.05, + "learning_rate": 0.0002929620454969704, + "loss": 0.0399, "step": 9300 }, { - "epoch": 0.1, - "learning_rate": 0.0002849030291236946, - "loss": 0.0348, + "epoch": 0.05, + "learning_rate": 0.0002929544778039564, + "loss": 0.0396, "step": 9310 }, { - "epoch": 0.1, - "learning_rate": 0.00028488681325809166, - "loss": 0.0355, + "epoch": 0.05, + "learning_rate": 0.0002929469101109424, + "loss": 0.0334, "step": 9320 }, { - "epoch": 0.1, - "learning_rate": 0.0002848705973924888, - "loss": 0.0367, + "epoch": 0.05, + "learning_rate": 0.00029293934241792836, + "loss": 0.0379, "step": 9330 }, { - "epoch": 0.1, - "learning_rate": 0.0002848543815268859, + "epoch": 0.05, + "learning_rate": 0.00029293177472491434, "loss": 0.034, "step": 9340 }, { - "epoch": 0.1, - "learning_rate": 0.00028483816566128296, - "loss": 0.0346, + "epoch": 0.05, + "learning_rate": 0.0002929242070319003, + "loss": 0.0384, "step": 9350 }, { - "epoch": 0.1, - "learning_rate": 0.0002848219497956801, - "loss": 0.0362, + "epoch": 0.05, + "learning_rate": 0.0002929166393388863, + "loss": 0.0372, "step": 9360 }, { - "epoch": 0.1, - "learning_rate": 0.00028480573393007715, - "loss": 0.0389, + "epoch": 0.05, + "learning_rate": 0.00029290907164587234, + "loss": 0.0371, "step": 9370 }, { - "epoch": 0.1, - "learning_rate": 0.00028478951806447427, - "loss": 0.0388, + "epoch": 0.05, + "learning_rate": 0.0002929015039528583, + "loss": 0.0378, "step": 9380 }, { - "epoch": 0.1, - "learning_rate": 0.0002847733021988714, - "loss": 0.0414, + "epoch": 0.05, + "learning_rate": 0.0002928939362598443, + "loss": 0.0362, "step": 9390 }, { - "epoch": 0.1, - "learning_rate": 0.00028475708633326845, - "loss": 0.0399, + "epoch": 0.05, + "learning_rate": 0.0002928863685668303, + "loss": 0.0385, "step": 9400 }, { - "epoch": 0.1, - "learning_rate": 0.0002847408704676655, - "loss": 0.0407, + "epoch": 0.05, + "learning_rate": 0.00029287880087381626, + "loss": 0.0355, "step": 9410 }, { - "epoch": 0.1, - "learning_rate": 0.00028472465460206264, - "loss": 0.0407, + "epoch": 0.05, + "learning_rate": 0.00029287123318080224, + "loss": 0.0418, "step": 9420 }, { - "epoch": 0.1, - "learning_rate": 0.00028470843873645976, - "loss": 0.0351, + "epoch": 0.05, + "learning_rate": 0.0002928636654877882, + "loss": 0.0369, "step": 9430 }, { - "epoch": 0.1, - "learning_rate": 0.0002846922228708568, - "loss": 0.0357, + "epoch": 0.05, + "learning_rate": 0.0002928560977947742, + "loss": 0.0423, "step": 9440 }, { - "epoch": 0.1, - "learning_rate": 0.0002846760070052539, - "loss": 0.0432, + "epoch": 0.05, + "learning_rate": 0.0002928485301017602, + "loss": 0.0349, "step": 9450 }, { - "epoch": 0.1, - "learning_rate": 0.000284659791139651, - "loss": 0.039, + "epoch": 0.05, + "learning_rate": 0.00029284096240874617, + "loss": 0.0379, "step": 9460 }, { - "epoch": 0.1, - "learning_rate": 0.00028464357527404813, - "loss": 0.0334, + "epoch": 0.05, + "learning_rate": 0.0002928333947157322, + "loss": 0.0444, "step": 9470 }, { - "epoch": 0.1, - "learning_rate": 0.0002846273594084452, - "loss": 0.044, + "epoch": 0.05, + "learning_rate": 0.0002928258270227182, + "loss": 0.0357, "step": 9480 }, { - "epoch": 0.1, - "learning_rate": 0.0002846111435428423, - "loss": 0.0516, + "epoch": 0.05, + "learning_rate": 0.00029281825932970417, + "loss": 0.0495, "step": 9490 }, { - "epoch": 0.1, - "learning_rate": 0.0002845949276772394, - "loss": 0.0345, + "epoch": 0.05, + "learning_rate": 0.00029281069163669015, + "loss": 0.0384, "step": 9500 }, { - "epoch": 0.1, - "learning_rate": 0.0002845787118116365, - "loss": 0.0382, + "epoch": 0.05, + "learning_rate": 0.00029280312394367613, + "loss": 0.0448, "step": 9510 }, { - "epoch": 0.1, - "learning_rate": 0.00028456249594603357, - "loss": 0.0419, + "epoch": 0.05, + "learning_rate": 0.0002927955562506621, + "loss": 0.0382, "step": 9520 }, { - "epoch": 0.1, - "learning_rate": 0.0002845462800804307, - "loss": 0.0423, + "epoch": 0.05, + "learning_rate": 0.00029278798855764815, + "loss": 0.0397, "step": 9530 }, { - "epoch": 0.1, - "learning_rate": 0.00028453006421482775, - "loss": 0.0382, + "epoch": 0.05, + "learning_rate": 0.00029278042086463413, + "loss": 0.0354, "step": 9540 }, { - "epoch": 0.1, - "learning_rate": 0.00028451384834922487, - "loss": 0.0382, + "epoch": 0.05, + "learning_rate": 0.0002927728531716201, + "loss": 0.042, "step": 9550 }, { - "epoch": 0.1, - "learning_rate": 0.00028449763248362194, - "loss": 0.0343, + "epoch": 0.05, + "learning_rate": 0.0002927652854786061, + "loss": 0.0458, "step": 9560 }, { - "epoch": 0.1, - "learning_rate": 0.00028448141661801906, - "loss": 0.0381, + "epoch": 0.05, + "learning_rate": 0.0002927577177855921, + "loss": 0.0349, "step": 9570 }, { - "epoch": 0.1, - "learning_rate": 0.0002844652007524161, - "loss": 0.0355, + "epoch": 0.05, + "learning_rate": 0.00029275015009257806, + "loss": 0.0386, "step": 9580 }, { - "epoch": 0.1, - "learning_rate": 0.00028444898488681324, - "loss": 0.039, + "epoch": 0.05, + "learning_rate": 0.00029274258239956404, + "loss": 0.0407, "step": 9590 }, { - "epoch": 0.1, - "learning_rate": 0.0002844327690212103, - "loss": 0.0349, + "epoch": 0.05, + "learning_rate": 0.0002927350147065501, + "loss": 0.0397, "step": 9600 }, { - "epoch": 0.1, - "learning_rate": 0.00028441655315560743, - "loss": 0.0342, + "epoch": 0.05, + "learning_rate": 0.00029272744701353605, + "loss": 0.0394, "step": 9610 }, { - "epoch": 0.1, - "learning_rate": 0.0002844003372900045, - "loss": 0.0389, + "epoch": 0.05, + "learning_rate": 0.00029271987932052204, + "loss": 0.043, "step": 9620 }, { - "epoch": 0.1, - "learning_rate": 0.0002843841214244016, - "loss": 0.0368, + "epoch": 0.05, + "learning_rate": 0.000292712311627508, + "loss": 0.0395, "step": 9630 }, { - "epoch": 0.1, - "learning_rate": 0.0002843679055587987, - "loss": 0.0385, + "epoch": 0.05, + "learning_rate": 0.000292704743934494, + "loss": 0.0401, "step": 9640 }, { - "epoch": 0.1, - "learning_rate": 0.0002843516896931958, - "loss": 0.0368, + "epoch": 0.05, + "learning_rate": 0.00029269717624148, + "loss": 0.0418, "step": 9650 }, { - "epoch": 0.1, - "learning_rate": 0.0002843354738275929, - "loss": 0.0384, + "epoch": 0.05, + "learning_rate": 0.000292689608548466, + "loss": 0.0458, "step": 9660 }, { - "epoch": 0.1, - "learning_rate": 0.00028431925796199, - "loss": 0.0406, + "epoch": 0.05, + "learning_rate": 0.000292682040855452, + "loss": 0.0492, "step": 9670 }, { - "epoch": 0.1, - "learning_rate": 0.00028430304209638705, - "loss": 0.041, + "epoch": 0.05, + "learning_rate": 0.000292674473162438, + "loss": 0.0372, "step": 9680 }, { - "epoch": 0.1, - "learning_rate": 0.00028428682623078417, - "loss": 0.036, + "epoch": 0.05, + "learning_rate": 0.00029266690546942396, + "loss": 0.0358, "step": 9690 }, { - "epoch": 0.1, - "learning_rate": 0.0002842706103651813, - "loss": 0.0384, + "epoch": 0.05, + "learning_rate": 0.00029265933777640994, + "loss": 0.0515, "step": 9700 }, { - "epoch": 0.1, - "learning_rate": 0.00028425439449957836, - "loss": 0.0349, + "epoch": 0.05, + "learning_rate": 0.0002926517700833959, + "loss": 0.0445, "step": 9710 }, { - "epoch": 0.11, - "learning_rate": 0.0002842381786339754, - "loss": 0.0364, + "epoch": 0.05, + "learning_rate": 0.00029264420239038196, + "loss": 0.0406, "step": 9720 }, { - "epoch": 0.11, - "learning_rate": 0.00028422196276837254, - "loss": 0.0372, + "epoch": 0.05, + "learning_rate": 0.00029263663469736794, + "loss": 0.0414, "step": 9730 }, { - "epoch": 0.11, - "learning_rate": 0.00028420574690276966, - "loss": 0.031, + "epoch": 0.05, + "learning_rate": 0.0002926290670043539, + "loss": 0.0355, "step": 9740 }, { - "epoch": 0.11, - "learning_rate": 0.0002841895310371667, - "loss": 0.0337, + "epoch": 0.05, + "learning_rate": 0.0002926214993113399, + "loss": 0.0383, "step": 9750 }, { - "epoch": 0.11, - "learning_rate": 0.00028417331517156385, - "loss": 0.0365, + "epoch": 0.05, + "learning_rate": 0.0002926139316183259, + "loss": 0.0398, "step": 9760 }, { - "epoch": 0.11, - "learning_rate": 0.0002841570993059609, - "loss": 0.0386, + "epoch": 0.05, + "learning_rate": 0.00029260636392531187, + "loss": 0.0456, "step": 9770 }, { - "epoch": 0.11, - "learning_rate": 0.00028414088344035803, - "loss": 0.0361, + "epoch": 0.05, + "learning_rate": 0.00029259879623229785, + "loss": 0.0414, "step": 9780 }, { - "epoch": 0.11, - "learning_rate": 0.00028412466757475515, - "loss": 0.0339, + "epoch": 0.05, + "learning_rate": 0.0002925912285392839, + "loss": 0.0428, "step": 9790 }, { - "epoch": 0.11, - "learning_rate": 0.0002841084517091522, - "loss": 0.0376, + "epoch": 0.05, + "learning_rate": 0.00029258366084626986, + "loss": 0.038, "step": 9800 }, { - "epoch": 0.11, - "learning_rate": 0.0002840922358435493, - "loss": 0.0376, + "epoch": 0.05, + "learning_rate": 0.00029257609315325585, + "loss": 0.0365, "step": 9810 }, { - "epoch": 0.11, - "learning_rate": 0.0002840760199779464, - "loss": 0.0333, + "epoch": 0.05, + "learning_rate": 0.00029256852546024183, + "loss": 0.0341, "step": 9820 }, { - "epoch": 0.11, - "learning_rate": 0.0002840598041123435, - "loss": 0.0372, + "epoch": 0.05, + "learning_rate": 0.0002925609577672278, + "loss": 0.0397, "step": 9830 }, { - "epoch": 0.11, - "learning_rate": 0.0002840435882467406, - "loss": 0.031, + "epoch": 0.05, + "learning_rate": 0.0002925533900742138, + "loss": 0.0363, "step": 9840 }, { - "epoch": 0.11, - "learning_rate": 0.00028402737238113765, - "loss": 0.0422, + "epoch": 0.05, + "learning_rate": 0.0002925458223811998, + "loss": 0.0411, "step": 9850 }, { - "epoch": 0.11, - "learning_rate": 0.0002840111565155348, - "loss": 0.0336, + "epoch": 0.05, + "learning_rate": 0.0002925382546881858, + "loss": 0.039, "step": 9860 }, { - "epoch": 0.11, - "learning_rate": 0.0002839949406499319, - "loss": 0.0402, + "epoch": 0.05, + "learning_rate": 0.0002925306869951718, + "loss": 0.0385, "step": 9870 }, { - "epoch": 0.11, - "learning_rate": 0.00028397872478432896, - "loss": 0.0339, + "epoch": 0.05, + "learning_rate": 0.00029252311930215777, + "loss": 0.0349, "step": 9880 }, { - "epoch": 0.11, - "learning_rate": 0.000283962508918726, - "loss": 0.033, + "epoch": 0.05, + "learning_rate": 0.00029251555160914375, + "loss": 0.0366, "step": 9890 }, { - "epoch": 0.11, - "learning_rate": 0.00028394629305312314, - "loss": 0.0346, + "epoch": 0.05, + "learning_rate": 0.00029250798391612973, + "loss": 0.0343, "step": 9900 }, { - "epoch": 0.11, - "learning_rate": 0.00028393007718752026, - "loss": 0.036, + "epoch": 0.05, + "learning_rate": 0.0002925004162231157, + "loss": 0.0382, "step": 9910 }, { - "epoch": 0.11, - "learning_rate": 0.00028391386132191733, - "loss": 0.0348, + "epoch": 0.05, + "learning_rate": 0.00029249284853010175, + "loss": 0.036, "step": 9920 }, { - "epoch": 0.11, - "learning_rate": 0.00028389764545631445, - "loss": 0.0318, + "epoch": 0.05, + "learning_rate": 0.00029248528083708773, + "loss": 0.0409, "step": 9930 }, { - "epoch": 0.11, - "learning_rate": 0.0002838814295907115, - "loss": 0.0327, + "epoch": 0.05, + "learning_rate": 0.0002924777131440737, + "loss": 0.0425, "step": 9940 }, { - "epoch": 0.11, - "learning_rate": 0.00028386521372510864, - "loss": 0.0365, + "epoch": 0.05, + "learning_rate": 0.0002924701454510597, + "loss": 0.0364, "step": 9950 }, { - "epoch": 0.11, - "learning_rate": 0.0002838489978595057, - "loss": 0.0383, + "epoch": 0.05, + "learning_rate": 0.0002924625777580457, + "loss": 0.0376, "step": 9960 }, { - "epoch": 0.11, - "learning_rate": 0.0002838327819939028, - "loss": 0.0357, + "epoch": 0.05, + "learning_rate": 0.00029245501006503166, + "loss": 0.038, "step": 9970 }, { - "epoch": 0.11, - "learning_rate": 0.0002838165661282999, - "loss": 0.0328, + "epoch": 0.05, + "learning_rate": 0.0002924474423720177, + "loss": 0.0385, "step": 9980 }, { - "epoch": 0.11, - "learning_rate": 0.000283800350262697, - "loss": 0.0395, + "epoch": 0.05, + "learning_rate": 0.0002924398746790037, + "loss": 0.0304, "step": 9990 }, { - "epoch": 0.11, - "learning_rate": 0.00028378413439709407, - "loss": 0.0307, + "epoch": 0.05, + "learning_rate": 0.00029243230698598966, + "loss": 0.0413, "step": 10000 }, { - "epoch": 0.11, - "eval_cer": 0.921579050686457, - "eval_loss": 0.02728099934756756, - "eval_runtime": 119.7696, - "eval_samples_per_second": 16.699, - "eval_steps_per_second": 4.175, + "epoch": 0.05, + "eval_cer": 0.9145003381830497, + "eval_loss": 0.02770831808447838, + "eval_runtime": 117.615, + "eval_samples_per_second": 17.005, + "eval_steps_per_second": 4.251, "step": 10000 }, { - "epoch": 0.11, - "learning_rate": 0.0002837679185314912, - "loss": 0.0346, + "epoch": 0.05, + "learning_rate": 0.00029242473929297564, + "loss": 0.0328, "step": 10010 }, { - "epoch": 0.11, - "learning_rate": 0.00028375170266588826, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.0002924171715999616, + "loss": 0.0358, "step": 10020 }, { - "epoch": 0.11, - "learning_rate": 0.0002837354868002854, - "loss": 0.0346, + "epoch": 0.05, + "learning_rate": 0.0002924096039069476, + "loss": 0.0386, "step": 10030 }, { - "epoch": 0.11, - "learning_rate": 0.00028371927093468244, - "loss": 0.0351, + "epoch": 0.05, + "learning_rate": 0.00029240203621393364, + "loss": 0.0341, "step": 10040 }, { - "epoch": 0.11, - "learning_rate": 0.00028370305506907956, - "loss": 0.0352, + "epoch": 0.05, + "learning_rate": 0.0002923944685209196, + "loss": 0.036, "step": 10050 }, { - "epoch": 0.11, - "learning_rate": 0.0002836868392034767, - "loss": 0.0314, + "epoch": 0.05, + "learning_rate": 0.0002923869008279056, + "loss": 0.046, "step": 10060 }, { - "epoch": 0.11, - "learning_rate": 0.00028367062333787375, - "loss": 0.0319, + "epoch": 0.05, + "learning_rate": 0.0002923793331348916, + "loss": 0.0378, "step": 10070 }, { - "epoch": 0.11, - "learning_rate": 0.00028365440747227087, - "loss": 0.0401, + "epoch": 0.05, + "learning_rate": 0.00029237176544187756, + "loss": 0.039, "step": 10080 }, { - "epoch": 0.11, - "learning_rate": 0.00028363819160666793, - "loss": 0.0316, + "epoch": 0.05, + "learning_rate": 0.00029236419774886354, + "loss": 0.0352, "step": 10090 }, { - "epoch": 0.11, - "learning_rate": 0.00028362197574106505, - "loss": 0.0381, + "epoch": 0.05, + "learning_rate": 0.0002923566300558495, + "loss": 0.0363, "step": 10100 }, { - "epoch": 0.11, - "learning_rate": 0.0002836057598754621, - "loss": 0.0333, + "epoch": 0.05, + "learning_rate": 0.00029234906236283556, + "loss": 0.039, "step": 10110 }, { - "epoch": 0.11, - "learning_rate": 0.00028358954400985924, - "loss": 0.0443, + "epoch": 0.05, + "learning_rate": 0.00029234149466982154, + "loss": 0.0353, "step": 10120 }, { - "epoch": 0.11, - "learning_rate": 0.0002835733281442563, - "loss": 0.0365, + "epoch": 0.05, + "learning_rate": 0.0002923339269768075, + "loss": 0.0336, "step": 10130 }, { - "epoch": 0.11, - "learning_rate": 0.0002835571122786534, - "loss": 0.0356, + "epoch": 0.05, + "learning_rate": 0.0002923263592837935, + "loss": 0.0427, "step": 10140 }, { - "epoch": 0.11, - "learning_rate": 0.0002835408964130505, - "loss": 0.0321, + "epoch": 0.05, + "learning_rate": 0.0002923187915907795, + "loss": 0.0359, "step": 10150 }, { - "epoch": 0.11, - "learning_rate": 0.0002835246805474476, - "loss": 0.0363, + "epoch": 0.05, + "learning_rate": 0.00029231122389776547, + "loss": 0.0366, "step": 10160 }, { - "epoch": 0.11, - "learning_rate": 0.0002835084646818447, - "loss": 0.0339, + "epoch": 0.05, + "learning_rate": 0.0002923036562047515, + "loss": 0.0341, "step": 10170 }, { - "epoch": 0.11, - "learning_rate": 0.0002834922488162418, - "loss": 0.0377, + "epoch": 0.05, + "learning_rate": 0.0002922960885117375, + "loss": 0.0412, "step": 10180 }, { - "epoch": 0.11, - "learning_rate": 0.00028347603295063886, - "loss": 0.0345, + "epoch": 0.05, + "learning_rate": 0.00029228852081872347, + "loss": 0.0317, "step": 10190 }, { - "epoch": 0.11, - "learning_rate": 0.000283459817085036, - "loss": 0.0306, + "epoch": 0.05, + "learning_rate": 0.00029228095312570945, + "loss": 0.0363, "step": 10200 }, { - "epoch": 0.11, - "learning_rate": 0.00028344360121943305, - "loss": 0.0327, + "epoch": 0.05, + "learning_rate": 0.00029227338543269543, + "loss": 0.0357, "step": 10210 }, { - "epoch": 0.11, - "learning_rate": 0.00028342738535383017, - "loss": 0.0399, + "epoch": 0.05, + "learning_rate": 0.0002922658177396814, + "loss": 0.0333, "step": 10220 }, { - "epoch": 0.11, - "learning_rate": 0.0002834111694882273, - "loss": 0.0361, + "epoch": 0.05, + "learning_rate": 0.00029225825004666745, + "loss": 0.0419, "step": 10230 }, { - "epoch": 0.11, - "learning_rate": 0.00028339495362262435, - "loss": 0.0394, + "epoch": 0.05, + "learning_rate": 0.00029225068235365343, + "loss": 0.0327, "step": 10240 }, { - "epoch": 0.11, - "learning_rate": 0.0002833787377570214, - "loss": 0.0379, + "epoch": 0.05, + "learning_rate": 0.0002922431146606394, + "loss": 0.0337, "step": 10250 }, { - "epoch": 0.11, - "learning_rate": 0.00028336252189141854, - "loss": 0.0395, + "epoch": 0.05, + "learning_rate": 0.0002922355469676254, + "loss": 0.0386, "step": 10260 }, { - "epoch": 0.11, - "learning_rate": 0.00028334630602581566, - "loss": 0.0454, + "epoch": 0.05, + "learning_rate": 0.00029222797927461137, + "loss": 0.0347, "step": 10270 }, { - "epoch": 0.11, - "learning_rate": 0.0002833300901602127, - "loss": 0.037, + "epoch": 0.05, + "learning_rate": 0.00029222041158159735, + "loss": 0.035, "step": 10280 }, { - "epoch": 0.11, - "learning_rate": 0.0002833138742946098, - "loss": 0.0398, + "epoch": 0.05, + "learning_rate": 0.00029221284388858333, + "loss": 0.0343, "step": 10290 }, { - "epoch": 0.11, - "learning_rate": 0.0002832976584290069, - "loss": 0.0401, + "epoch": 0.05, + "learning_rate": 0.00029220527619556937, + "loss": 0.0481, "step": 10300 }, { - "epoch": 0.11, - "learning_rate": 0.00028328144256340403, + "epoch": 0.05, + "learning_rate": 0.00029219770850255535, "loss": 0.0382, "step": 10310 }, { - "epoch": 0.11, - "learning_rate": 0.0002832652266978011, - "loss": 0.0342, + "epoch": 0.05, + "learning_rate": 0.00029219014080954133, + "loss": 0.0358, "step": 10320 }, { - "epoch": 0.11, - "learning_rate": 0.00028324901083219816, - "loss": 0.0365, + "epoch": 0.05, + "learning_rate": 0.0002921825731165273, + "loss": 0.0422, "step": 10330 }, { - "epoch": 0.11, - "learning_rate": 0.0002832327949665953, - "loss": 0.0383, + "epoch": 0.05, + "learning_rate": 0.0002921750054235133, + "loss": 0.0343, "step": 10340 }, { - "epoch": 0.11, - "learning_rate": 0.0002832165791009924, - "loss": 0.036, + "epoch": 0.05, + "learning_rate": 0.0002921674377304993, + "loss": 0.046, "step": 10350 }, { - "epoch": 0.11, - "learning_rate": 0.0002832003632353895, - "loss": 0.0428, + "epoch": 0.05, + "learning_rate": 0.0002921598700374853, + "loss": 0.0407, "step": 10360 }, { - "epoch": 0.11, - "learning_rate": 0.0002831841473697866, - "loss": 0.0386, + "epoch": 0.05, + "learning_rate": 0.0002921523023444713, + "loss": 0.0364, "step": 10370 }, { - "epoch": 0.11, - "learning_rate": 0.00028316793150418365, - "loss": 0.0379, + "epoch": 0.05, + "learning_rate": 0.0002921447346514573, + "loss": 0.0349, "step": 10380 }, { - "epoch": 0.11, - "learning_rate": 0.00028315171563858077, - "loss": 0.0444, + "epoch": 0.05, + "learning_rate": 0.00029213716695844326, + "loss": 0.0338, "step": 10390 }, { - "epoch": 0.11, - "learning_rate": 0.0002831354997729779, - "loss": 0.037, + "epoch": 0.05, + "learning_rate": 0.00029212959926542924, + "loss": 0.0333, "step": 10400 }, { - "epoch": 0.11, - "learning_rate": 0.00028311928390737496, - "loss": 0.0294, + "epoch": 0.05, + "learning_rate": 0.0002921220315724152, + "loss": 0.0347, "step": 10410 }, { - "epoch": 0.11, - "learning_rate": 0.000283103068041772, - "loss": 0.0387, + "epoch": 0.05, + "learning_rate": 0.0002921144638794012, + "loss": 0.0357, "step": 10420 }, { - "epoch": 0.11, - "learning_rate": 0.00028308685217616914, - "loss": 0.0341, + "epoch": 0.05, + "learning_rate": 0.00029210689618638724, + "loss": 0.0351, "step": 10430 }, { - "epoch": 0.11, - "learning_rate": 0.00028307063631056626, - "loss": 0.0369, + "epoch": 0.05, + "learning_rate": 0.0002920993284933732, + "loss": 0.0356, "step": 10440 }, { - "epoch": 0.11, - "learning_rate": 0.00028305442044496333, - "loss": 0.0326, + "epoch": 0.05, + "learning_rate": 0.0002920917608003592, + "loss": 0.0394, "step": 10450 }, { - "epoch": 0.11, - "learning_rate": 0.0002830382045793604, - "loss": 0.0367, + "epoch": 0.05, + "learning_rate": 0.0002920841931073452, + "loss": 0.0376, "step": 10460 }, { - "epoch": 0.11, - "learning_rate": 0.0002830219887137575, - "loss": 0.0321, + "epoch": 0.05, + "learning_rate": 0.00029207662541433116, + "loss": 0.0374, "step": 10470 }, { - "epoch": 0.11, - "learning_rate": 0.00028300577284815463, - "loss": 0.0335, + "epoch": 0.05, + "learning_rate": 0.00029206905772131714, + "loss": 0.0333, "step": 10480 }, { - "epoch": 0.11, - "learning_rate": 0.0002829895569825517, - "loss": 0.0392, + "epoch": 0.05, + "learning_rate": 0.0002920614900283032, + "loss": 0.0313, "step": 10490 }, { - "epoch": 0.11, - "learning_rate": 0.0002829733411169488, - "loss": 0.0382, + "epoch": 0.05, + "learning_rate": 0.00029205392233528916, + "loss": 0.0328, "step": 10500 }, { - "epoch": 0.11, - "learning_rate": 0.0002829571252513459, - "loss": 0.0367, + "epoch": 0.05, + "learning_rate": 0.00029204635464227514, + "loss": 0.0339, "step": 10510 }, { - "epoch": 0.11, - "learning_rate": 0.000282940909385743, - "loss": 0.0327, + "epoch": 0.05, + "learning_rate": 0.0002920387869492611, + "loss": 0.03, "step": 10520 }, { - "epoch": 0.11, - "learning_rate": 0.00028292469352014007, - "loss": 0.0356, + "epoch": 0.05, + "learning_rate": 0.0002920312192562471, + "loss": 0.0353, "step": 10530 }, { - "epoch": 0.11, - "learning_rate": 0.0002829084776545372, - "loss": 0.0324, + "epoch": 0.05, + "learning_rate": 0.0002920236515632331, + "loss": 0.035, "step": 10540 }, { - "epoch": 0.11, - "learning_rate": 0.00028289226178893425, - "loss": 0.0349, + "epoch": 0.05, + "learning_rate": 0.0002920160838702191, + "loss": 0.0311, "step": 10550 }, { - "epoch": 0.11, - "learning_rate": 0.0002828760459233314, - "loss": 0.0317, + "epoch": 0.05, + "learning_rate": 0.0002920085161772051, + "loss": 0.0359, "step": 10560 }, { - "epoch": 0.11, - "learning_rate": 0.00028285983005772844, - "loss": 0.0333, + "epoch": 0.05, + "learning_rate": 0.0002920009484841911, + "loss": 0.0373, "step": 10570 }, { - "epoch": 0.11, - "learning_rate": 0.00028284361419212556, - "loss": 0.04, + "epoch": 0.05, + "learning_rate": 0.00029199338079117707, + "loss": 0.0408, "step": 10580 }, { - "epoch": 0.11, - "learning_rate": 0.0002828273983265226, - "loss": 0.0338, + "epoch": 0.05, + "learning_rate": 0.00029198581309816305, + "loss": 0.0406, "step": 10590 }, { - "epoch": 0.11, - "learning_rate": 0.00028281118246091975, - "loss": 0.0384, + "epoch": 0.05, + "learning_rate": 0.00029197824540514903, + "loss": 0.039, "step": 10600 }, { - "epoch": 0.11, - "learning_rate": 0.0002827949665953168, - "loss": 0.0359, + "epoch": 0.05, + "learning_rate": 0.000291970677712135, + "loss": 0.0318, "step": 10610 }, { - "epoch": 0.11, - "learning_rate": 0.00028277875072971393, - "loss": 0.0383, + "epoch": 0.05, + "learning_rate": 0.00029196311001912105, + "loss": 0.0357, "step": 10620 }, { - "epoch": 0.11, - "learning_rate": 0.000282762534864111, - "loss": 0.0379, + "epoch": 0.05, + "learning_rate": 0.00029195554232610703, + "loss": 0.0354, "step": 10630 }, { - "epoch": 0.12, - "learning_rate": 0.0002827463189985081, - "loss": 0.0375, + "epoch": 0.05, + "learning_rate": 0.000291947974633093, + "loss": 0.0331, "step": 10640 }, { - "epoch": 0.12, - "learning_rate": 0.0002827301031329052, - "loss": 0.0315, + "epoch": 0.05, + "learning_rate": 0.000291940406940079, + "loss": 0.0322, "step": 10650 }, { - "epoch": 0.12, - "learning_rate": 0.0002827138872673023, - "loss": 0.0348, + "epoch": 0.05, + "learning_rate": 0.000291932839247065, + "loss": 0.0391, "step": 10660 }, { - "epoch": 0.12, - "learning_rate": 0.0002826976714016994, - "loss": 0.0369, + "epoch": 0.05, + "learning_rate": 0.00029192527155405095, + "loss": 0.0352, "step": 10670 }, { - "epoch": 0.12, - "learning_rate": 0.0002826814555360965, - "loss": 0.0387, + "epoch": 0.05, + "learning_rate": 0.000291917703861037, + "loss": 0.0335, "step": 10680 }, { - "epoch": 0.12, - "learning_rate": 0.00028266523967049355, - "loss": 0.0339, + "epoch": 0.05, + "learning_rate": 0.0002919101361680229, + "loss": 0.0336, "step": 10690 }, { - "epoch": 0.12, - "learning_rate": 0.00028264902380489067, - "loss": 0.0396, + "epoch": 0.05, + "learning_rate": 0.0002919025684750089, + "loss": 0.0392, "step": 10700 }, { - "epoch": 0.12, - "learning_rate": 0.0002826328079392878, - "loss": 0.0427, + "epoch": 0.05, + "learning_rate": 0.0002918950007819949, + "loss": 0.0347, "step": 10710 }, { - "epoch": 0.12, - "learning_rate": 0.00028261659207368486, - "loss": 0.0358, + "epoch": 0.05, + "learning_rate": 0.0002918874330889809, + "loss": 0.0386, "step": 10720 }, { - "epoch": 0.12, - "learning_rate": 0.0002826003762080819, - "loss": 0.0349, + "epoch": 0.05, + "learning_rate": 0.0002918798653959669, + "loss": 0.037, "step": 10730 }, { - "epoch": 0.12, - "learning_rate": 0.00028258416034247904, - "loss": 0.0361, + "epoch": 0.05, + "learning_rate": 0.0002918722977029529, + "loss": 0.042, "step": 10740 }, { - "epoch": 0.12, - "learning_rate": 0.00028256794447687616, - "loss": 0.0349, + "epoch": 0.05, + "learning_rate": 0.00029186473000993886, + "loss": 0.0359, "step": 10750 }, { - "epoch": 0.12, - "learning_rate": 0.00028255172861127323, - "loss": 0.0338, + "epoch": 0.05, + "learning_rate": 0.00029185716231692484, + "loss": 0.0392, "step": 10760 }, { - "epoch": 0.12, - "learning_rate": 0.00028253551274567035, - "loss": 0.0427, + "epoch": 0.05, + "learning_rate": 0.0002918495946239108, + "loss": 0.0366, "step": 10770 }, { - "epoch": 0.12, - "learning_rate": 0.0002825192968800674, - "loss": 0.0495, + "epoch": 0.05, + "learning_rate": 0.00029184202693089686, + "loss": 0.0351, "step": 10780 }, { - "epoch": 0.12, - "learning_rate": 0.00028250308101446453, - "loss": 0.0354, + "epoch": 0.05, + "learning_rate": 0.00029183445923788284, + "loss": 0.0386, "step": 10790 }, { - "epoch": 0.12, - "learning_rate": 0.00028248686514886165, - "loss": 0.0358, + "epoch": 0.05, + "learning_rate": 0.0002918268915448688, + "loss": 0.0321, "step": 10800 }, { - "epoch": 0.12, - "learning_rate": 0.0002824706492832587, - "loss": 0.0326, + "epoch": 0.05, + "learning_rate": 0.0002918193238518548, + "loss": 0.0346, "step": 10810 }, { - "epoch": 0.12, - "learning_rate": 0.0002824544334176558, - "loss": 0.0406, + "epoch": 0.05, + "learning_rate": 0.0002918117561588408, + "loss": 0.0375, "step": 10820 }, { - "epoch": 0.12, - "learning_rate": 0.0002824382175520529, - "loss": 0.0319, + "epoch": 0.05, + "learning_rate": 0.00029180418846582677, + "loss": 0.0344, "step": 10830 }, { - "epoch": 0.12, - "learning_rate": 0.00028242200168645, - "loss": 0.0334, + "epoch": 0.05, + "learning_rate": 0.00029179662077281275, + "loss": 0.036, "step": 10840 }, { - "epoch": 0.12, - "learning_rate": 0.0002824057858208471, - "loss": 0.0376, + "epoch": 0.05, + "learning_rate": 0.0002917890530797988, + "loss": 0.0319, "step": 10850 }, { - "epoch": 0.12, - "learning_rate": 0.00028238956995524416, - "loss": 0.0442, + "epoch": 0.05, + "learning_rate": 0.00029178148538678476, + "loss": 0.0333, "step": 10860 }, { - "epoch": 0.12, - "learning_rate": 0.0002823733540896413, - "loss": 0.0419, + "epoch": 0.05, + "learning_rate": 0.00029177391769377075, + "loss": 0.0359, "step": 10870 }, { - "epoch": 0.12, - "learning_rate": 0.0002823571382240384, - "loss": 0.0417, + "epoch": 0.05, + "learning_rate": 0.00029176635000075673, + "loss": 0.0368, "step": 10880 }, { - "epoch": 0.12, - "learning_rate": 0.00028234092235843546, - "loss": 0.0368, + "epoch": 0.05, + "learning_rate": 0.0002917587823077427, + "loss": 0.0322, "step": 10890 }, { - "epoch": 0.12, - "learning_rate": 0.00028232470649283253, - "loss": 0.0304, + "epoch": 0.05, + "learning_rate": 0.0002917512146147287, + "loss": 0.0395, "step": 10900 }, { - "epoch": 0.12, - "learning_rate": 0.00028230849062722965, - "loss": 0.0378, + "epoch": 0.06, + "learning_rate": 0.0002917436469217147, + "loss": 0.0388, "step": 10910 }, { - "epoch": 0.12, - "learning_rate": 0.00028229227476162677, - "loss": 0.0416, + "epoch": 0.06, + "learning_rate": 0.0002917360792287007, + "loss": 0.0349, "step": 10920 }, { - "epoch": 0.12, - "learning_rate": 0.00028227605889602383, - "loss": 0.0413, + "epoch": 0.06, + "learning_rate": 0.0002917285115356867, + "loss": 0.0386, "step": 10930 }, { - "epoch": 0.12, - "learning_rate": 0.00028225984303042095, - "loss": 0.0343, + "epoch": 0.06, + "learning_rate": 0.00029172094384267267, + "loss": 0.0409, "step": 10940 }, { - "epoch": 0.12, - "learning_rate": 0.000282243627164818, - "loss": 0.0389, + "epoch": 0.06, + "learning_rate": 0.00029171337614965865, + "loss": 0.0367, "step": 10950 }, { - "epoch": 0.12, - "learning_rate": 0.00028222741129921514, - "loss": 0.0385, + "epoch": 0.06, + "learning_rate": 0.00029170580845664463, + "loss": 0.0355, "step": 10960 }, { - "epoch": 0.12, - "learning_rate": 0.00028221119543361226, - "loss": 0.0358, + "epoch": 0.06, + "learning_rate": 0.0002916982407636306, + "loss": 0.0337, "step": 10970 }, { - "epoch": 0.12, - "learning_rate": 0.0002821949795680093, - "loss": 0.0339, + "epoch": 0.06, + "learning_rate": 0.00029169067307061665, + "loss": 0.0409, "step": 10980 }, { - "epoch": 0.12, - "learning_rate": 0.0002821787637024064, - "loss": 0.0344, + "epoch": 0.06, + "learning_rate": 0.00029168310537760263, + "loss": 0.0377, "step": 10990 }, { - "epoch": 0.12, - "learning_rate": 0.0002821625478368035, - "loss": 0.0382, + "epoch": 0.06, + "learning_rate": 0.0002916755376845886, + "loss": 0.0333, "step": 11000 }, { - "epoch": 0.12, - "eval_cer": 0.9215694960539368, - "eval_loss": 0.02685784548521042, - "eval_runtime": 119.8402, - "eval_samples_per_second": 16.689, - "eval_steps_per_second": 4.172, + "epoch": 0.06, + "eval_cer": 0.9145003381830497, + "eval_loss": 0.027273865416646004, + "eval_runtime": 117.4476, + "eval_samples_per_second": 17.029, + "eval_steps_per_second": 4.257, "step": 11000 }, { - "epoch": 0.12, - "learning_rate": 0.00028214633197120063, - "loss": 0.0346, + "epoch": 0.06, + "learning_rate": 0.0002916679699915746, + "loss": 0.032, "step": 11010 }, { - "epoch": 0.12, - "learning_rate": 0.0002821301161055977, - "loss": 0.0357, + "epoch": 0.06, + "learning_rate": 0.0002916604022985606, + "loss": 0.0327, "step": 11020 }, { - "epoch": 0.12, - "learning_rate": 0.00028211390023999476, - "loss": 0.0346, + "epoch": 0.06, + "learning_rate": 0.00029165283460554656, + "loss": 0.0479, "step": 11030 }, { - "epoch": 0.12, - "learning_rate": 0.0002820976843743919, - "loss": 0.0367, + "epoch": 0.06, + "learning_rate": 0.0002916452669125326, + "loss": 0.0659, "step": 11040 }, { - "epoch": 0.12, - "learning_rate": 0.000282081468508789, - "loss": 0.036, + "epoch": 0.06, + "learning_rate": 0.0002916376992195186, + "loss": 0.044, "step": 11050 }, { - "epoch": 0.12, - "learning_rate": 0.00028206525264318607, - "loss": 0.0408, + "epoch": 0.06, + "learning_rate": 0.00029163013152650456, + "loss": 0.0389, "step": 11060 }, { - "epoch": 0.12, - "learning_rate": 0.0002820490367775832, - "loss": 0.0321, + "epoch": 0.06, + "learning_rate": 0.00029162256383349054, + "loss": 0.0395, "step": 11070 }, { - "epoch": 0.12, - "learning_rate": 0.00028203282091198025, - "loss": 0.043, + "epoch": 0.06, + "learning_rate": 0.0002916149961404765, + "loss": 0.0589, "step": 11080 }, { - "epoch": 0.12, - "learning_rate": 0.00028201660504637737, - "loss": 0.0364, + "epoch": 0.06, + "learning_rate": 0.0002916074284474625, + "loss": 0.0441, "step": 11090 }, { - "epoch": 0.12, - "learning_rate": 0.00028200038918077444, - "loss": 0.0373, + "epoch": 0.06, + "learning_rate": 0.00029159986075444854, + "loss": 0.0429, "step": 11100 }, { - "epoch": 0.12, - "learning_rate": 0.00028198417331517156, - "loss": 0.0451, + "epoch": 0.06, + "learning_rate": 0.0002915922930614345, + "loss": 0.0401, "step": 11110 }, { - "epoch": 0.12, - "learning_rate": 0.0002819679574495686, - "loss": 0.0317, + "epoch": 0.06, + "learning_rate": 0.0002915847253684205, + "loss": 0.0403, "step": 11120 }, { - "epoch": 0.12, - "learning_rate": 0.00028195174158396574, - "loss": 0.0345, + "epoch": 0.06, + "learning_rate": 0.0002915771576754065, + "loss": 0.0418, "step": 11130 }, { - "epoch": 0.12, - "learning_rate": 0.0002819355257183628, - "loss": 0.0376, + "epoch": 0.06, + "learning_rate": 0.00029156958998239246, + "loss": 0.0355, "step": 11140 }, { - "epoch": 0.12, - "learning_rate": 0.00028191930985275993, - "loss": 0.038, + "epoch": 0.06, + "learning_rate": 0.00029156202228937844, + "loss": 0.0404, "step": 11150 }, { - "epoch": 0.12, - "learning_rate": 0.000281903093987157, - "loss": 0.0364, + "epoch": 0.06, + "learning_rate": 0.0002915544545963644, + "loss": 0.0396, "step": 11160 }, { - "epoch": 0.12, - "learning_rate": 0.0002818868781215541, - "loss": 0.0389, + "epoch": 0.06, + "learning_rate": 0.00029154688690335046, + "loss": 0.0428, "step": 11170 }, { - "epoch": 0.12, - "learning_rate": 0.0002818706622559512, - "loss": 0.036, + "epoch": 0.06, + "learning_rate": 0.00029153931921033644, + "loss": 0.0404, "step": 11180 }, { - "epoch": 0.12, - "learning_rate": 0.0002818544463903483, - "loss": 0.034, + "epoch": 0.06, + "learning_rate": 0.0002915317515173224, + "loss": 0.0358, "step": 11190 }, { - "epoch": 0.12, - "learning_rate": 0.00028183823052474536, - "loss": 0.0349, + "epoch": 0.06, + "learning_rate": 0.0002915241838243084, + "loss": 0.0383, "step": 11200 }, { - "epoch": 0.12, - "learning_rate": 0.0002818220146591425, - "loss": 0.0335, + "epoch": 0.06, + "learning_rate": 0.0002915166161312944, + "loss": 0.0385, "step": 11210 }, { - "epoch": 0.12, - "learning_rate": 0.00028180579879353955, - "loss": 0.0338, + "epoch": 0.06, + "learning_rate": 0.00029150904843828037, + "loss": 0.0371, "step": 11220 }, { - "epoch": 0.12, - "learning_rate": 0.00028178958292793667, - "loss": 0.035, + "epoch": 0.06, + "learning_rate": 0.0002915014807452664, + "loss": 0.0374, "step": 11230 }, { - "epoch": 0.12, - "learning_rate": 0.0002817733670623338, - "loss": 0.041, + "epoch": 0.06, + "learning_rate": 0.0002914939130522524, + "loss": 0.0389, "step": 11240 }, { - "epoch": 0.12, - "learning_rate": 0.00028175715119673086, - "loss": 0.0395, + "epoch": 0.06, + "learning_rate": 0.00029148634535923837, + "loss": 0.0397, "step": 11250 }, { - "epoch": 0.12, - "learning_rate": 0.0002817409353311279, - "loss": 0.0326, + "epoch": 0.06, + "learning_rate": 0.00029147877766622435, + "loss": 0.0373, "step": 11260 }, { - "epoch": 0.12, - "learning_rate": 0.00028172471946552504, - "loss": 0.0388, + "epoch": 0.06, + "learning_rate": 0.00029147120997321033, + "loss": 0.0372, "step": 11270 }, { - "epoch": 0.12, - "learning_rate": 0.00028170850359992216, - "loss": 0.0362, + "epoch": 0.06, + "learning_rate": 0.0002914636422801963, + "loss": 0.0383, "step": 11280 }, { - "epoch": 0.12, - "learning_rate": 0.0002816922877343192, - "loss": 0.0391, + "epoch": 0.06, + "learning_rate": 0.00029145607458718235, + "loss": 0.036, "step": 11290 }, { - "epoch": 0.12, - "learning_rate": 0.0002816760718687163, - "loss": 0.0399, + "epoch": 0.06, + "learning_rate": 0.00029144850689416833, + "loss": 0.0377, "step": 11300 }, { - "epoch": 0.12, - "learning_rate": 0.0002816598560031134, - "loss": 0.0374, + "epoch": 0.06, + "learning_rate": 0.0002914409392011543, + "loss": 0.0394, "step": 11310 }, { - "epoch": 0.12, - "learning_rate": 0.00028164364013751053, - "loss": 0.0334, + "epoch": 0.06, + "learning_rate": 0.0002914333715081403, + "loss": 0.0408, "step": 11320 }, { - "epoch": 0.12, - "learning_rate": 0.0002816274242719076, - "loss": 0.036, + "epoch": 0.06, + "learning_rate": 0.00029142580381512627, + "loss": 0.0381, "step": 11330 }, { - "epoch": 0.12, - "learning_rate": 0.00028161120840630466, - "loss": 0.0376, + "epoch": 0.06, + "learning_rate": 0.00029141823612211225, + "loss": 0.038, "step": 11340 }, { - "epoch": 0.12, - "learning_rate": 0.0002815949925407018, - "loss": 0.0368, + "epoch": 0.06, + "learning_rate": 0.00029141066842909824, + "loss": 0.0319, "step": 11350 }, { - "epoch": 0.12, - "learning_rate": 0.0002815787766750989, - "loss": 0.0401, + "epoch": 0.06, + "learning_rate": 0.00029140310073608427, + "loss": 0.0309, "step": 11360 }, { - "epoch": 0.12, - "learning_rate": 0.000281562560809496, - "loss": 0.0335, + "epoch": 0.06, + "learning_rate": 0.00029139553304307025, + "loss": 0.036, "step": 11370 }, { - "epoch": 0.12, - "learning_rate": 0.0002815463449438931, - "loss": 0.0352, + "epoch": 0.06, + "learning_rate": 0.00029138796535005623, + "loss": 0.0346, "step": 11380 }, { - "epoch": 0.12, - "learning_rate": 0.00028153012907829015, - "loss": 0.0387, + "epoch": 0.06, + "learning_rate": 0.0002913803976570422, + "loss": 0.0753, "step": 11390 }, { - "epoch": 0.12, - "learning_rate": 0.0002815139132126873, - "loss": 0.0322, + "epoch": 0.06, + "learning_rate": 0.0002913728299640282, + "loss": 0.037, "step": 11400 }, { - "epoch": 0.12, - "learning_rate": 0.0002814976973470844, - "loss": 0.0347, + "epoch": 0.06, + "learning_rate": 0.0002913652622710142, + "loss": 0.0302, "step": 11410 }, { - "epoch": 0.12, - "learning_rate": 0.00028148148148148146, - "loss": 0.0359, + "epoch": 0.06, + "learning_rate": 0.0002913576945780002, + "loss": 0.0365, "step": 11420 }, { - "epoch": 0.12, - "learning_rate": 0.0002814652656158785, - "loss": 0.0307, + "epoch": 0.06, + "learning_rate": 0.0002913501268849862, + "loss": 0.0351, "step": 11430 }, { - "epoch": 0.12, - "learning_rate": 0.00028144904975027564, - "loss": 0.0368, + "epoch": 0.06, + "learning_rate": 0.0002913425591919722, + "loss": 0.0354, "step": 11440 }, { - "epoch": 0.12, - "learning_rate": 0.00028143283388467276, - "loss": 0.0382, + "epoch": 0.06, + "learning_rate": 0.00029133499149895816, + "loss": 0.0371, "step": 11450 }, { - "epoch": 0.12, - "learning_rate": 0.00028141661801906983, - "loss": 0.031, + "epoch": 0.06, + "learning_rate": 0.00029132742380594414, + "loss": 0.0396, "step": 11460 }, { - "epoch": 0.12, - "learning_rate": 0.0002814004021534669, - "loss": 0.0331, + "epoch": 0.06, + "learning_rate": 0.0002913198561129301, + "loss": 0.0351, "step": 11470 }, { - "epoch": 0.12, - "learning_rate": 0.000281384186287864, - "loss": 0.038, + "epoch": 0.06, + "learning_rate": 0.0002913122884199161, + "loss": 0.0356, "step": 11480 }, { - "epoch": 0.12, - "learning_rate": 0.00028136797042226114, - "loss": 0.0345, + "epoch": 0.06, + "learning_rate": 0.00029130472072690214, + "loss": 0.0317, "step": 11490 }, { - "epoch": 0.12, - "learning_rate": 0.0002813517545566582, - "loss": 0.0398, + "epoch": 0.06, + "learning_rate": 0.0002912971530338881, + "loss": 0.0347, "step": 11500 }, { - "epoch": 0.12, - "learning_rate": 0.0002813355386910553, - "loss": 0.0353, + "epoch": 0.06, + "learning_rate": 0.0002912895853408741, + "loss": 0.0338, "step": 11510 }, { - "epoch": 0.12, - "learning_rate": 0.0002813193228254524, - "loss": 0.0367, + "epoch": 0.06, + "learning_rate": 0.0002912820176478601, + "loss": 0.0393, "step": 11520 }, { - "epoch": 0.12, - "learning_rate": 0.0002813031069598495, - "loss": 0.0308, + "epoch": 0.06, + "learning_rate": 0.00029127444995484606, + "loss": 0.0316, "step": 11530 }, { - "epoch": 0.12, - "learning_rate": 0.0002812868910942466, - "loss": 0.0353, + "epoch": 0.06, + "learning_rate": 0.00029126688226183205, + "loss": 0.04, "step": 11540 }, { - "epoch": 0.12, - "learning_rate": 0.0002812706752286437, - "loss": 0.0368, + "epoch": 0.06, + "learning_rate": 0.0002912593145688181, + "loss": 0.0313, "step": 11550 }, { - "epoch": 0.12, - "learning_rate": 0.00028125445936304076, - "loss": 0.0378, + "epoch": 0.06, + "learning_rate": 0.00029125174687580406, + "loss": 0.0319, "step": 11560 }, { - "epoch": 0.13, - "learning_rate": 0.0002812382434974379, - "loss": 0.0378, + "epoch": 0.06, + "learning_rate": 0.00029124417918279004, + "loss": 0.0326, "step": 11570 }, { - "epoch": 0.13, - "learning_rate": 0.000281222027631835, - "loss": 0.0357, + "epoch": 0.06, + "learning_rate": 0.000291236611489776, + "loss": 0.038, "step": 11580 }, { - "epoch": 0.13, - "learning_rate": 0.00028120581176623206, - "loss": 0.0403, + "epoch": 0.06, + "learning_rate": 0.000291229043796762, + "loss": 0.0363, "step": 11590 }, { - "epoch": 0.13, - "learning_rate": 0.00028118959590062913, - "loss": 0.0353, + "epoch": 0.06, + "learning_rate": 0.000291221476103748, + "loss": 0.0331, "step": 11600 }, { - "epoch": 0.13, - "learning_rate": 0.00028117338003502625, - "loss": 0.0373, + "epoch": 0.06, + "learning_rate": 0.000291213908410734, + "loss": 0.033, "step": 11610 }, { - "epoch": 0.13, - "learning_rate": 0.00028115716416942337, - "loss": 0.0343, + "epoch": 0.06, + "learning_rate": 0.00029120634071772, + "loss": 0.0379, "step": 11620 }, { - "epoch": 0.13, - "learning_rate": 0.00028114094830382043, - "loss": 0.0333, + "epoch": 0.06, + "learning_rate": 0.000291198773024706, + "loss": 0.037, "step": 11630 }, { - "epoch": 0.13, - "learning_rate": 0.0002811247324382175, - "loss": 0.035, + "epoch": 0.06, + "learning_rate": 0.00029119120533169197, + "loss": 0.038, "step": 11640 }, { - "epoch": 0.13, - "learning_rate": 0.0002811085165726146, - "loss": 0.0281, + "epoch": 0.06, + "learning_rate": 0.00029118363763867795, + "loss": 0.0337, "step": 11650 }, { - "epoch": 0.13, - "learning_rate": 0.00028109230070701174, - "loss": 0.0279, + "epoch": 0.06, + "learning_rate": 0.00029117606994566393, + "loss": 0.034, "step": 11660 }, { - "epoch": 0.13, - "learning_rate": 0.0002810760848414088, - "loss": 0.0326, + "epoch": 0.06, + "learning_rate": 0.0002911685022526499, + "loss": 0.0362, "step": 11670 }, { - "epoch": 0.13, - "learning_rate": 0.0002810598689758059, - "loss": 0.0391, + "epoch": 0.06, + "learning_rate": 0.00029116093455963595, + "loss": 0.0363, "step": 11680 }, { - "epoch": 0.13, - "learning_rate": 0.000281043653110203, - "loss": 0.0394, + "epoch": 0.06, + "learning_rate": 0.00029115336686662193, + "loss": 0.0393, "step": 11690 }, { - "epoch": 0.13, - "learning_rate": 0.0002810274372446001, - "loss": 0.0433, + "epoch": 0.06, + "learning_rate": 0.0002911457991736079, + "loss": 0.0366, "step": 11700 }, { - "epoch": 0.13, - "learning_rate": 0.0002810112213789972, - "loss": 0.0362, + "epoch": 0.06, + "learning_rate": 0.0002911382314805939, + "loss": 0.0364, "step": 11710 }, { - "epoch": 0.13, - "learning_rate": 0.0002809950055133943, - "loss": 0.0335, + "epoch": 0.06, + "learning_rate": 0.0002911306637875799, + "loss": 0.0375, "step": 11720 }, { - "epoch": 0.13, - "learning_rate": 0.00028097878964779136, - "loss": 0.0378, + "epoch": 0.06, + "learning_rate": 0.00029112309609456586, + "loss": 0.0362, "step": 11730 }, { - "epoch": 0.13, - "learning_rate": 0.0002809625737821885, - "loss": 0.0295, + "epoch": 0.06, + "learning_rate": 0.0002911155284015519, + "loss": 0.0365, "step": 11740 }, { - "epoch": 0.13, - "learning_rate": 0.00028094635791658555, - "loss": 0.0383, + "epoch": 0.06, + "learning_rate": 0.00029110796070853787, + "loss": 0.0312, "step": 11750 }, { - "epoch": 0.13, - "learning_rate": 0.00028093014205098267, - "loss": 0.0334, + "epoch": 0.06, + "learning_rate": 0.00029110039301552385, + "loss": 0.0329, "step": 11760 }, { - "epoch": 0.13, - "learning_rate": 0.00028091392618537973, + "epoch": 0.06, + "learning_rate": 0.00029109282532250984, "loss": 0.0376, "step": 11770 }, { - "epoch": 0.13, - "learning_rate": 0.00028089771031977685, - "loss": 0.0351, + "epoch": 0.06, + "learning_rate": 0.0002910852576294958, + "loss": 0.0363, "step": 11780 }, { - "epoch": 0.13, - "learning_rate": 0.0002808814944541739, - "loss": 0.0368, + "epoch": 0.06, + "learning_rate": 0.0002910776899364818, + "loss": 0.0418, "step": 11790 }, { - "epoch": 0.13, - "learning_rate": 0.00028086527858857104, - "loss": 0.0351, + "epoch": 0.06, + "learning_rate": 0.00029107012224346783, + "loss": 0.0339, "step": 11800 }, { - "epoch": 0.13, - "learning_rate": 0.00028084906272296816, - "loss": 0.0327, + "epoch": 0.06, + "learning_rate": 0.0002910625545504538, + "loss": 0.0385, "step": 11810 }, { - "epoch": 0.13, - "learning_rate": 0.0002808328468573652, - "loss": 0.0356, + "epoch": 0.06, + "learning_rate": 0.0002910549868574398, + "loss": 0.0373, "step": 11820 }, { - "epoch": 0.13, - "learning_rate": 0.0002808166309917623, - "loss": 0.0331, + "epoch": 0.06, + "learning_rate": 0.0002910474191644258, + "loss": 0.0311, "step": 11830 }, { - "epoch": 0.13, - "learning_rate": 0.0002808004151261594, - "loss": 0.0345, + "epoch": 0.06, + "learning_rate": 0.00029103985147141176, + "loss": 0.0353, "step": 11840 }, { - "epoch": 0.13, - "learning_rate": 0.00028078419926055653, - "loss": 0.0393, + "epoch": 0.06, + "learning_rate": 0.00029103228377839774, + "loss": 0.0359, "step": 11850 }, { - "epoch": 0.13, - "learning_rate": 0.0002807679833949536, - "loss": 0.0329, + "epoch": 0.06, + "learning_rate": 0.0002910247160853837, + "loss": 0.0353, "step": 11860 }, { - "epoch": 0.13, - "learning_rate": 0.00028075176752935066, - "loss": 0.0365, + "epoch": 0.06, + "learning_rate": 0.00029101714839236976, + "loss": 0.0389, "step": 11870 }, { - "epoch": 0.13, - "learning_rate": 0.0002807355516637478, - "loss": 0.038, + "epoch": 0.06, + "learning_rate": 0.00029100958069935574, + "loss": 0.0358, "step": 11880 }, { - "epoch": 0.13, - "learning_rate": 0.0002807193357981449, - "loss": 0.0315, + "epoch": 0.06, + "learning_rate": 0.0002910020130063417, + "loss": 0.0369, "step": 11890 }, { - "epoch": 0.13, - "learning_rate": 0.00028070311993254196, - "loss": 0.036, + "epoch": 0.06, + "learning_rate": 0.0002909944453133277, + "loss": 0.0368, "step": 11900 }, { - "epoch": 0.13, - "learning_rate": 0.00028068690406693903, - "loss": 0.0353, + "epoch": 0.06, + "learning_rate": 0.0002909868776203137, + "loss": 0.0347, "step": 11910 }, { - "epoch": 0.13, - "learning_rate": 0.00028067068820133615, - "loss": 0.0365, + "epoch": 0.06, + "learning_rate": 0.00029097930992729967, + "loss": 0.0351, "step": 11920 }, { - "epoch": 0.13, - "learning_rate": 0.00028065447233573327, - "loss": 0.0402, + "epoch": 0.06, + "learning_rate": 0.0002909717422342857, + "loss": 0.0364, "step": 11930 }, { - "epoch": 0.13, - "learning_rate": 0.00028063825647013034, - "loss": 0.0368, + "epoch": 0.06, + "learning_rate": 0.0002909641745412717, + "loss": 0.0358, "step": 11940 }, { - "epoch": 0.13, - "learning_rate": 0.00028062204060452746, - "loss": 0.0351, + "epoch": 0.06, + "learning_rate": 0.0002909566068482576, + "loss": 0.0367, "step": 11950 }, { - "epoch": 0.13, - "learning_rate": 0.0002806058247389245, - "loss": 0.0343, + "epoch": 0.06, + "learning_rate": 0.0002909490391552436, + "loss": 0.0375, "step": 11960 }, { - "epoch": 0.13, - "learning_rate": 0.00028058960887332164, - "loss": 0.0318, + "epoch": 0.06, + "learning_rate": 0.0002909414714622296, + "loss": 0.0364, "step": 11970 }, { - "epoch": 0.13, - "learning_rate": 0.00028057339300771876, - "loss": 0.0402, + "epoch": 0.06, + "learning_rate": 0.0002909339037692156, + "loss": 0.0374, "step": 11980 }, { - "epoch": 0.13, - "learning_rate": 0.0002805571771421158, - "loss": 0.0445, + "epoch": 0.06, + "learning_rate": 0.0002909263360762016, + "loss": 0.0334, "step": 11990 }, { - "epoch": 0.13, - "learning_rate": 0.0002805409612765129, - "loss": 0.036, + "epoch": 0.06, + "learning_rate": 0.00029091876838318757, + "loss": 0.0286, "step": 12000 }, { - "epoch": 0.13, - "eval_cer": 0.9215616786273294, - "eval_loss": 0.025386789813637733, - "eval_runtime": 119.9223, - "eval_samples_per_second": 16.677, - "eval_steps_per_second": 4.169, + "epoch": 0.06, + "eval_cer": 0.9145042197675514, + "eval_loss": 0.026305437088012695, + "eval_runtime": 117.4972, + "eval_samples_per_second": 17.022, + "eval_steps_per_second": 4.255, "step": 12000 }, { - "epoch": 0.13, - "learning_rate": 0.00028052474541091, - "loss": 0.0339, + "epoch": 0.06, + "learning_rate": 0.00029091120069017355, + "loss": 0.0336, "step": 12010 }, { - "epoch": 0.13, - "learning_rate": 0.00028050852954530713, - "loss": 0.0388, + "epoch": 0.06, + "learning_rate": 0.00029090363299715953, + "loss": 0.0372, "step": 12020 }, { - "epoch": 0.13, - "learning_rate": 0.0002804923136797042, - "loss": 0.0365, + "epoch": 0.06, + "learning_rate": 0.00029089606530414557, + "loss": 0.0361, "step": 12030 }, { - "epoch": 0.13, - "learning_rate": 0.00028047609781410126, - "loss": 0.0401, + "epoch": 0.06, + "learning_rate": 0.00029088849761113155, + "loss": 0.0325, "step": 12040 }, { - "epoch": 0.13, - "learning_rate": 0.0002804598819484984, - "loss": 0.031, + "epoch": 0.06, + "learning_rate": 0.00029088092991811753, + "loss": 0.0327, "step": 12050 }, { - "epoch": 0.13, - "learning_rate": 0.0002804436660828955, - "loss": 0.0402, + "epoch": 0.06, + "learning_rate": 0.0002908733622251035, + "loss": 0.0293, "step": 12060 }, { - "epoch": 0.13, - "learning_rate": 0.00028042745021729257, - "loss": 0.0339, + "epoch": 0.06, + "learning_rate": 0.0002908657945320895, + "loss": 0.033, "step": 12070 }, { - "epoch": 0.13, - "learning_rate": 0.0002804112343516897, - "loss": 0.0331, + "epoch": 0.06, + "learning_rate": 0.0002908582268390755, + "loss": 0.0414, "step": 12080 }, { - "epoch": 0.13, - "learning_rate": 0.00028039501848608675, - "loss": 0.0348, + "epoch": 0.06, + "learning_rate": 0.00029085065914606146, + "loss": 0.0345, "step": 12090 }, { - "epoch": 0.13, - "learning_rate": 0.0002803788026204839, - "loss": 0.0341, + "epoch": 0.06, + "learning_rate": 0.0002908430914530475, + "loss": 0.0344, "step": 12100 }, { - "epoch": 0.13, - "learning_rate": 0.00028036258675488094, - "loss": 0.0339, + "epoch": 0.06, + "learning_rate": 0.0002908355237600335, + "loss": 0.0329, "step": 12110 }, { - "epoch": 0.13, - "learning_rate": 0.00028034637088927806, - "loss": 0.0316, + "epoch": 0.06, + "learning_rate": 0.00029082795606701946, + "loss": 0.0307, "step": 12120 }, { - "epoch": 0.13, - "learning_rate": 0.0002803301550236751, - "loss": 0.0399, + "epoch": 0.06, + "learning_rate": 0.00029082038837400544, + "loss": 0.0321, "step": 12130 }, { - "epoch": 0.13, - "learning_rate": 0.00028031393915807224, - "loss": 0.0306, + "epoch": 0.06, + "learning_rate": 0.0002908128206809914, + "loss": 0.0359, "step": 12140 }, { - "epoch": 0.13, - "learning_rate": 0.0002802977232924693, - "loss": 0.0281, + "epoch": 0.06, + "learning_rate": 0.0002908052529879774, + "loss": 0.0324, "step": 12150 }, { - "epoch": 0.13, - "learning_rate": 0.00028028150742686643, - "loss": 0.0263, + "epoch": 0.06, + "learning_rate": 0.00029079768529496344, + "loss": 0.0349, "step": 12160 }, { - "epoch": 0.13, - "learning_rate": 0.0002802652915612635, - "loss": 0.0331, + "epoch": 0.06, + "learning_rate": 0.0002907901176019494, + "loss": 0.0323, "step": 12170 }, { - "epoch": 0.13, - "learning_rate": 0.0002802490756956606, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.0002907825499089354, + "loss": 0.0378, "step": 12180 }, { - "epoch": 0.13, - "learning_rate": 0.0002802328598300577, - "loss": 0.0315, + "epoch": 0.06, + "learning_rate": 0.0002907749822159214, + "loss": 0.0332, "step": 12190 }, { - "epoch": 0.13, - "learning_rate": 0.0002802166439644548, - "loss": 0.0376, + "epoch": 0.06, + "learning_rate": 0.00029076741452290736, + "loss": 0.0339, "step": 12200 }, { - "epoch": 0.13, - "learning_rate": 0.00028020042809885187, - "loss": 0.0355, + "epoch": 0.06, + "learning_rate": 0.00029075984682989334, + "loss": 0.0361, "step": 12210 }, { - "epoch": 0.13, - "learning_rate": 0.000280184212233249, - "loss": 0.0309, + "epoch": 0.06, + "learning_rate": 0.0002907522791368793, + "loss": 0.0336, "step": 12220 }, { - "epoch": 0.13, - "learning_rate": 0.0002801679963676461, - "loss": 0.0356, + "epoch": 0.06, + "learning_rate": 0.00029074471144386536, + "loss": 0.0313, "step": 12230 }, { - "epoch": 0.13, - "learning_rate": 0.00028015178050204317, - "loss": 0.0319, + "epoch": 0.06, + "learning_rate": 0.00029073714375085134, + "loss": 0.0326, "step": 12240 }, { - "epoch": 0.13, - "learning_rate": 0.0002801355646364403, - "loss": 0.0351, + "epoch": 0.06, + "learning_rate": 0.0002907295760578373, + "loss": 0.0321, "step": 12250 }, { - "epoch": 0.13, - "learning_rate": 0.00028011934877083736, - "loss": 0.0313, + "epoch": 0.06, + "learning_rate": 0.0002907220083648233, + "loss": 0.0311, "step": 12260 }, { - "epoch": 0.13, - "learning_rate": 0.0002801031329052345, - "loss": 0.0359, + "epoch": 0.06, + "learning_rate": 0.0002907144406718093, + "loss": 0.0396, "step": 12270 }, { - "epoch": 0.13, - "learning_rate": 0.00028008691703963154, - "loss": 0.0397, + "epoch": 0.06, + "learning_rate": 0.00029070687297879527, + "loss": 0.0312, "step": 12280 }, { - "epoch": 0.13, - "learning_rate": 0.00028007070117402866, - "loss": 0.0356, + "epoch": 0.06, + "learning_rate": 0.0002906993052857813, + "loss": 0.0345, "step": 12290 }, { - "epoch": 0.13, - "learning_rate": 0.00028005448530842573, - "loss": 0.0361, + "epoch": 0.06, + "learning_rate": 0.0002906917375927673, + "loss": 0.0336, "step": 12300 }, { - "epoch": 0.13, - "learning_rate": 0.00028003826944282285, - "loss": 0.0334, + "epoch": 0.06, + "learning_rate": 0.00029068416989975327, + "loss": 0.0433, "step": 12310 }, { - "epoch": 0.13, - "learning_rate": 0.0002800220535772199, - "loss": 0.0355, + "epoch": 0.06, + "learning_rate": 0.00029067660220673925, + "loss": 0.0356, "step": 12320 }, { - "epoch": 0.13, - "learning_rate": 0.00028000583771161703, - "loss": 0.0317, + "epoch": 0.06, + "learning_rate": 0.00029066903451372523, + "loss": 0.0329, "step": 12330 }, { - "epoch": 0.13, - "learning_rate": 0.0002799896218460141, - "loss": 0.0292, + "epoch": 0.06, + "learning_rate": 0.0002906614668207112, + "loss": 0.0341, "step": 12340 }, { - "epoch": 0.13, - "learning_rate": 0.0002799734059804112, - "loss": 0.0335, + "epoch": 0.06, + "learning_rate": 0.00029065389912769725, + "loss": 0.033, "step": 12350 }, { - "epoch": 0.13, - "learning_rate": 0.0002799571901148083, - "loss": 0.0342, + "epoch": 0.06, + "learning_rate": 0.00029064633143468323, + "loss": 0.0393, "step": 12360 }, { - "epoch": 0.13, - "learning_rate": 0.0002799409742492054, - "loss": 0.0343, + "epoch": 0.06, + "learning_rate": 0.0002906387637416692, + "loss": 0.0398, "step": 12370 }, { - "epoch": 0.13, - "learning_rate": 0.0002799247583836025, - "loss": 0.0332, + "epoch": 0.06, + "learning_rate": 0.0002906311960486552, + "loss": 0.0456, "step": 12380 }, { - "epoch": 0.13, - "learning_rate": 0.0002799085425179996, - "loss": 0.0341, + "epoch": 0.06, + "learning_rate": 0.00029062362835564117, + "loss": 0.0452, "step": 12390 }, { - "epoch": 0.13, - "learning_rate": 0.00027989232665239666, - "loss": 0.0351, + "epoch": 0.06, + "learning_rate": 0.00029061606066262715, + "loss": 0.0408, "step": 12400 }, { - "epoch": 0.13, - "learning_rate": 0.0002798761107867938, - "loss": 0.0345, + "epoch": 0.06, + "learning_rate": 0.00029060849296961314, + "loss": 0.0333, "step": 12410 }, { - "epoch": 0.13, - "learning_rate": 0.0002798598949211909, - "loss": 0.0326, + "epoch": 0.06, + "learning_rate": 0.00029060092527659917, + "loss": 0.0363, "step": 12420 }, { - "epoch": 0.13, - "learning_rate": 0.00027984367905558796, - "loss": 0.032, + "epoch": 0.06, + "learning_rate": 0.00029059335758358515, + "loss": 0.036, "step": 12430 }, { - "epoch": 0.13, - "learning_rate": 0.000279827463189985, - "loss": 0.0405, + "epoch": 0.06, + "learning_rate": 0.00029058578989057113, + "loss": 0.0361, "step": 12440 }, { - "epoch": 0.13, - "learning_rate": 0.00027981124732438215, + "epoch": 0.06, + "learning_rate": 0.0002905782221975571, "loss": 0.0384, "step": 12450 }, { - "epoch": 0.13, - "learning_rate": 0.00027979503145877927, - "loss": 0.039, + "epoch": 0.06, + "learning_rate": 0.0002905706545045431, + "loss": 0.0354, "step": 12460 }, { - "epoch": 0.13, - "learning_rate": 0.00027977881559317633, - "loss": 0.0309, + "epoch": 0.06, + "learning_rate": 0.0002905630868115291, + "loss": 0.0404, "step": 12470 }, { - "epoch": 0.13, - "learning_rate": 0.0002797625997275734, - "loss": 0.0313, + "epoch": 0.06, + "learning_rate": 0.0002905555191185151, + "loss": 0.0301, "step": 12480 }, { - "epoch": 0.14, - "learning_rate": 0.0002797463838619705, - "loss": 0.0408, + "epoch": 0.06, + "learning_rate": 0.0002905479514255011, + "loss": 0.0325, "step": 12490 }, { - "epoch": 0.14, - "learning_rate": 0.00027973016799636764, - "loss": 0.0338, + "epoch": 0.06, + "learning_rate": 0.0002905403837324871, + "loss": 0.0303, "step": 12500 }, { - "epoch": 0.14, - "learning_rate": 0.0002797139521307647, - "loss": 0.0326, + "epoch": 0.06, + "learning_rate": 0.00029053281603947306, + "loss": 0.0342, "step": 12510 }, { - "epoch": 0.14, - "learning_rate": 0.0002796977362651618, - "loss": 0.0331, + "epoch": 0.06, + "learning_rate": 0.00029052524834645904, + "loss": 0.0303, "step": 12520 }, { - "epoch": 0.14, - "learning_rate": 0.0002796815203995589, - "loss": 0.0292, + "epoch": 0.06, + "learning_rate": 0.000290517680653445, + "loss": 0.0327, "step": 12530 }, { - "epoch": 0.14, - "learning_rate": 0.000279665304533956, - "loss": 0.0299, + "epoch": 0.06, + "learning_rate": 0.000290510112960431, + "loss": 0.036, "step": 12540 }, { - "epoch": 0.14, - "learning_rate": 0.00027964908866835313, - "loss": 0.0324, + "epoch": 0.06, + "learning_rate": 0.00029050254526741704, + "loss": 0.0303, "step": 12550 }, { - "epoch": 0.14, - "learning_rate": 0.0002796328728027502, - "loss": 0.0287, + "epoch": 0.06, + "learning_rate": 0.000290494977574403, + "loss": 0.0349, "step": 12560 }, { - "epoch": 0.14, - "learning_rate": 0.00027961665693714726, - "loss": 0.0395, + "epoch": 0.06, + "learning_rate": 0.000290487409881389, + "loss": 0.0347, "step": 12570 }, { - "epoch": 0.14, - "learning_rate": 0.0002796004410715444, - "loss": 0.0369, + "epoch": 0.06, + "learning_rate": 0.000290479842188375, + "loss": 0.035, "step": 12580 }, { - "epoch": 0.14, - "learning_rate": 0.0002795842252059415, - "loss": 0.0318, + "epoch": 0.06, + "learning_rate": 0.00029047227449536096, + "loss": 0.0285, "step": 12590 }, { - "epoch": 0.14, - "learning_rate": 0.00027956800934033857, - "loss": 0.0341, + "epoch": 0.06, + "learning_rate": 0.00029046470680234695, + "loss": 0.032, "step": 12600 }, { - "epoch": 0.14, - "learning_rate": 0.00027955179347473563, - "loss": 0.0351, + "epoch": 0.06, + "learning_rate": 0.000290457139109333, + "loss": 0.0345, "step": 12610 }, { - "epoch": 0.14, - "learning_rate": 0.00027953557760913275, - "loss": 0.0343, + "epoch": 0.06, + "learning_rate": 0.00029044957141631896, + "loss": 0.0381, "step": 12620 }, { - "epoch": 0.14, - "learning_rate": 0.00027951936174352987, - "loss": 0.028, + "epoch": 0.06, + "learning_rate": 0.00029044200372330494, + "loss": 0.04, "step": 12630 }, { - "epoch": 0.14, - "learning_rate": 0.00027950314587792694, - "loss": 0.0339, + "epoch": 0.06, + "learning_rate": 0.0002904344360302909, + "loss": 0.0362, "step": 12640 }, { - "epoch": 0.14, - "learning_rate": 0.000279486930012324, - "loss": 0.0329, + "epoch": 0.06, + "learning_rate": 0.0002904268683372769, + "loss": 0.032, "step": 12650 }, { - "epoch": 0.14, - "learning_rate": 0.0002794707141467211, - "loss": 0.0363, + "epoch": 0.06, + "learning_rate": 0.0002904193006442629, + "loss": 0.0366, "step": 12660 }, { - "epoch": 0.14, - "learning_rate": 0.00027945449828111824, - "loss": 0.0466, + "epoch": 0.06, + "learning_rate": 0.0002904117329512489, + "loss": 0.0349, "step": 12670 }, { - "epoch": 0.14, - "learning_rate": 0.0002794382824155153, - "loss": 0.0397, + "epoch": 0.06, + "learning_rate": 0.0002904041652582349, + "loss": 0.0369, "step": 12680 }, { - "epoch": 0.14, - "learning_rate": 0.0002794220665499124, - "loss": 0.0314, + "epoch": 0.06, + "learning_rate": 0.0002903965975652209, + "loss": 0.0337, "step": 12690 }, { - "epoch": 0.14, - "learning_rate": 0.0002794058506843095, - "loss": 0.0332, + "epoch": 0.06, + "learning_rate": 0.00029038902987220687, + "loss": 0.0308, "step": 12700 }, { - "epoch": 0.14, - "learning_rate": 0.0002793896348187066, - "loss": 0.0311, + "epoch": 0.06, + "learning_rate": 0.00029038146217919285, + "loss": 0.0523, "step": 12710 }, { - "epoch": 0.14, - "learning_rate": 0.0002793734189531037, - "loss": 0.0363, + "epoch": 0.06, + "learning_rate": 0.00029037389448617883, + "loss": 0.0437, "step": 12720 }, { - "epoch": 0.14, - "learning_rate": 0.0002793572030875008, - "loss": 0.032, + "epoch": 0.06, + "learning_rate": 0.0002903663267931648, + "loss": 0.0365, "step": 12730 }, { - "epoch": 0.14, - "learning_rate": 0.00027934098722189786, - "loss": 0.0325, + "epoch": 0.06, + "learning_rate": 0.00029035875910015085, + "loss": 0.0349, "step": 12740 }, { - "epoch": 0.14, - "learning_rate": 0.000279324771356295, - "loss": 0.0335, + "epoch": 0.06, + "learning_rate": 0.00029035119140713683, + "loss": 0.0321, "step": 12750 }, { - "epoch": 0.14, - "learning_rate": 0.00027930855549069205, - "loss": 0.032, + "epoch": 0.06, + "learning_rate": 0.0002903436237141228, + "loss": 0.0318, "step": 12760 }, { - "epoch": 0.14, - "learning_rate": 0.00027929233962508917, - "loss": 0.0328, + "epoch": 0.06, + "learning_rate": 0.0002903360560211088, + "loss": 0.0335, "step": 12770 }, { - "epoch": 0.14, - "learning_rate": 0.00027927612375948623, - "loss": 0.0303, + "epoch": 0.06, + "learning_rate": 0.0002903284883280948, + "loss": 0.0305, "step": 12780 }, { - "epoch": 0.14, - "learning_rate": 0.00027925990789388335, - "loss": 0.0337, + "epoch": 0.06, + "learning_rate": 0.00029032092063508076, + "loss": 0.0381, "step": 12790 }, { - "epoch": 0.14, - "learning_rate": 0.0002792436920282804, - "loss": 0.035, + "epoch": 0.06, + "learning_rate": 0.0002903133529420668, + "loss": 0.0327, "step": 12800 }, { - "epoch": 0.14, - "learning_rate": 0.00027922747616267754, - "loss": 0.0322, + "epoch": 0.06, + "learning_rate": 0.00029030578524905277, + "loss": 0.0432, "step": 12810 }, { - "epoch": 0.14, - "learning_rate": 0.00027921126029707466, - "loss": 0.0353, + "epoch": 0.06, + "learning_rate": 0.00029029821755603875, + "loss": 0.0372, "step": 12820 }, { - "epoch": 0.14, - "learning_rate": 0.0002791950444314717, - "loss": 0.0376, + "epoch": 0.06, + "learning_rate": 0.00029029064986302474, + "loss": 0.0574, "step": 12830 }, { - "epoch": 0.14, - "learning_rate": 0.0002791788285658688, - "loss": 0.0376, + "epoch": 0.06, + "learning_rate": 0.0002902830821700107, + "loss": 0.045, "step": 12840 }, { - "epoch": 0.14, - "learning_rate": 0.0002791626127002659, - "loss": 0.0364, + "epoch": 0.06, + "learning_rate": 0.0002902755144769967, + "loss": 0.0303, "step": 12850 }, { - "epoch": 0.14, - "learning_rate": 0.00027914639683466303, - "loss": 0.0348, + "epoch": 0.06, + "learning_rate": 0.00029026794678398273, + "loss": 0.0365, "step": 12860 }, { - "epoch": 0.14, - "learning_rate": 0.0002791301809690601, - "loss": 0.0354, + "epoch": 0.06, + "learning_rate": 0.0002902603790909687, + "loss": 0.0443, "step": 12870 }, { - "epoch": 0.14, - "learning_rate": 0.00027911396510345716, - "loss": 0.0455, + "epoch": 0.06, + "learning_rate": 0.0002902528113979547, + "loss": 0.0384, "step": 12880 }, { - "epoch": 0.14, - "learning_rate": 0.0002790977492378543, - "loss": 0.0382, + "epoch": 0.07, + "learning_rate": 0.0002902452437049407, + "loss": 0.035, "step": 12890 }, { - "epoch": 0.14, - "learning_rate": 0.0002790815333722514, - "loss": 0.0423, + "epoch": 0.07, + "learning_rate": 0.00029023767601192666, + "loss": 0.0431, "step": 12900 }, { - "epoch": 0.14, - "learning_rate": 0.00027906531750664847, - "loss": 0.0341, + "epoch": 0.07, + "learning_rate": 0.00029023010831891264, + "loss": 0.0393, "step": 12910 }, { - "epoch": 0.14, - "learning_rate": 0.00027904910164104553, - "loss": 0.0424, + "epoch": 0.07, + "learning_rate": 0.0002902225406258986, + "loss": 0.0324, "step": 12920 }, { - "epoch": 0.14, - "learning_rate": 0.00027903288577544265, - "loss": 0.0346, + "epoch": 0.07, + "learning_rate": 0.00029021497293288466, + "loss": 0.0353, "step": 12930 }, { - "epoch": 0.14, - "learning_rate": 0.00027901666990983977, - "loss": 0.0318, + "epoch": 0.07, + "learning_rate": 0.00029020740523987064, + "loss": 0.0457, "step": 12940 }, { - "epoch": 0.14, - "learning_rate": 0.00027900045404423684, - "loss": 0.0331, + "epoch": 0.07, + "learning_rate": 0.0002901998375468566, + "loss": 0.0338, "step": 12950 }, { - "epoch": 0.14, - "learning_rate": 0.00027898423817863396, - "loss": 0.033, + "epoch": 0.07, + "learning_rate": 0.0002901922698538426, + "loss": 0.0305, "step": 12960 }, { - "epoch": 0.14, - "learning_rate": 0.000278968022313031, - "loss": 0.0324, + "epoch": 0.07, + "learning_rate": 0.0002901847021608286, + "loss": 0.0322, "step": 12970 }, { - "epoch": 0.14, - "learning_rate": 0.00027895180644742814, - "loss": 0.0325, + "epoch": 0.07, + "learning_rate": 0.00029017713446781457, + "loss": 0.0351, "step": 12980 }, { - "epoch": 0.14, - "learning_rate": 0.00027893559058182526, - "loss": 0.0325, + "epoch": 0.07, + "learning_rate": 0.0002901695667748006, + "loss": 0.0309, "step": 12990 }, { - "epoch": 0.14, - "learning_rate": 0.00027891937471622233, - "loss": 0.0412, + "epoch": 0.07, + "learning_rate": 0.0002901619990817866, + "loss": 0.0373, "step": 13000 }, { - "epoch": 0.14, - "eval_cer": 0.9216059773781046, - "eval_loss": 0.025849705561995506, - "eval_runtime": 120.1846, - "eval_samples_per_second": 16.641, - "eval_steps_per_second": 4.16, + "epoch": 0.07, + "eval_cer": 0.9145245980861848, + "eval_loss": 0.026163555681705475, + "eval_runtime": 116.7644, + "eval_samples_per_second": 17.129, + "eval_steps_per_second": 4.282, "step": 13000 }, { - "epoch": 0.14, - "learning_rate": 0.0002789031588506194, - "loss": 0.0486, + "epoch": 0.07, + "learning_rate": 0.00029015443138877256, + "loss": 0.0371, "step": 13010 }, { - "epoch": 0.14, - "learning_rate": 0.0002788869429850165, - "loss": 0.0407, + "epoch": 0.07, + "learning_rate": 0.00029014686369575855, + "loss": 0.0344, "step": 13020 }, { - "epoch": 0.14, - "learning_rate": 0.00027887072711941363, - "loss": 0.0337, + "epoch": 0.07, + "learning_rate": 0.0002901392960027445, + "loss": 0.0352, "step": 13030 }, { - "epoch": 0.14, - "learning_rate": 0.0002788545112538107, - "loss": 0.0411, + "epoch": 0.07, + "learning_rate": 0.0002901317283097305, + "loss": 0.0361, "step": 13040 }, { - "epoch": 0.14, - "learning_rate": 0.00027883829538820777, - "loss": 0.0356, + "epoch": 0.07, + "learning_rate": 0.0002901241606167165, + "loss": 0.0444, "step": 13050 }, { - "epoch": 0.14, - "learning_rate": 0.0002788220795226049, - "loss": 0.0417, + "epoch": 0.07, + "learning_rate": 0.0002901165929237025, + "loss": 0.0307, "step": 13060 }, { - "epoch": 0.14, - "learning_rate": 0.000278805863657002, - "loss": 0.0295, + "epoch": 0.07, + "learning_rate": 0.0002901090252306885, + "loss": 0.034, "step": 13070 }, { - "epoch": 0.14, - "learning_rate": 0.00027878964779139907, - "loss": 0.0361, + "epoch": 0.07, + "learning_rate": 0.0002901014575376745, + "loss": 0.0451, "step": 13080 }, { - "epoch": 0.14, - "learning_rate": 0.0002787734319257962, - "loss": 0.033, + "epoch": 0.07, + "learning_rate": 0.00029009388984466047, + "loss": 0.0379, "step": 13090 }, { - "epoch": 0.14, - "learning_rate": 0.00027875721606019326, + "epoch": 0.07, + "learning_rate": 0.00029008632215164645, "loss": 0.0347, "step": 13100 }, { - "epoch": 0.14, - "learning_rate": 0.0002787410001945904, - "loss": 0.0313, + "epoch": 0.07, + "learning_rate": 0.00029007875445863243, + "loss": 0.0288, "step": 13110 }, { - "epoch": 0.14, - "learning_rate": 0.0002787247843289875, - "loss": 0.0395, + "epoch": 0.07, + "learning_rate": 0.00029007118676561847, + "loss": 0.038, "step": 13120 }, { - "epoch": 0.14, - "learning_rate": 0.00027870856846338456, - "loss": 0.0346, + "epoch": 0.07, + "learning_rate": 0.00029006361907260445, + "loss": 0.032, "step": 13130 }, { - "epoch": 0.14, - "learning_rate": 0.00027869235259778163, - "loss": 0.0309, + "epoch": 0.07, + "learning_rate": 0.00029005605137959043, + "loss": 0.0372, "step": 13140 }, { - "epoch": 0.14, - "learning_rate": 0.00027867613673217875, - "loss": 0.045, + "epoch": 0.07, + "learning_rate": 0.0002900484836865764, + "loss": 0.0325, "step": 13150 }, { - "epoch": 0.14, - "learning_rate": 0.00027865992086657587, - "loss": 0.0347, + "epoch": 0.07, + "learning_rate": 0.0002900409159935624, + "loss": 0.0342, "step": 13160 }, { - "epoch": 0.14, - "learning_rate": 0.00027864370500097293, - "loss": 0.0355, + "epoch": 0.07, + "learning_rate": 0.0002900333483005484, + "loss": 0.0377, "step": 13170 }, { - "epoch": 0.14, - "learning_rate": 0.00027862748913537, - "loss": 0.0426, + "epoch": 0.07, + "learning_rate": 0.0002900257806075344, + "loss": 0.0408, "step": 13180 }, { - "epoch": 0.14, - "learning_rate": 0.0002786112732697671, - "loss": 0.045, + "epoch": 0.07, + "learning_rate": 0.0002900182129145204, + "loss": 0.0353, "step": 13190 }, { - "epoch": 0.14, - "learning_rate": 0.00027859505740416424, - "loss": 0.0338, + "epoch": 0.07, + "learning_rate": 0.0002900106452215063, + "loss": 0.0307, "step": 13200 }, { - "epoch": 0.14, - "learning_rate": 0.0002785788415385613, - "loss": 0.0324, + "epoch": 0.07, + "learning_rate": 0.0002900030775284923, + "loss": 0.0331, "step": 13210 }, { - "epoch": 0.14, - "learning_rate": 0.00027856262567295837, - "loss": 0.0338, + "epoch": 0.07, + "learning_rate": 0.00028999550983547834, + "loss": 0.0322, "step": 13220 }, { - "epoch": 0.14, - "learning_rate": 0.0002785464098073555, - "loss": 0.0333, + "epoch": 0.07, + "learning_rate": 0.0002899879421424643, + "loss": 0.0342, "step": 13230 }, { - "epoch": 0.14, - "learning_rate": 0.0002785301939417526, - "loss": 0.0844, + "epoch": 0.07, + "learning_rate": 0.0002899803744494503, + "loss": 0.0312, "step": 13240 }, { - "epoch": 0.14, - "learning_rate": 0.0002785139780761497, - "loss": 0.0348, + "epoch": 0.07, + "learning_rate": 0.0002899728067564363, + "loss": 0.0645, "step": 13250 }, { - "epoch": 0.14, - "learning_rate": 0.0002784977622105468, - "loss": 0.0342, + "epoch": 0.07, + "learning_rate": 0.00028996523906342226, + "loss": 0.0352, "step": 13260 }, { - "epoch": 0.14, - "learning_rate": 0.00027848154634494386, - "loss": 0.0345, + "epoch": 0.07, + "learning_rate": 0.00028995767137040824, + "loss": 0.0671, "step": 13270 }, { - "epoch": 0.14, - "learning_rate": 0.000278465330479341, - "loss": 0.0353, + "epoch": 0.07, + "learning_rate": 0.0002899501036773942, + "loss": 0.0338, "step": 13280 }, { - "epoch": 0.14, - "learning_rate": 0.00027844911461373805, - "loss": 0.0313, + "epoch": 0.07, + "learning_rate": 0.00028994253598438026, + "loss": 0.0341, "step": 13290 }, { - "epoch": 0.14, - "learning_rate": 0.00027843289874813517, - "loss": 0.0368, + "epoch": 0.07, + "learning_rate": 0.00028993496829136624, + "loss": 0.036, "step": 13300 }, { - "epoch": 0.14, - "learning_rate": 0.00027841668288253223, - "loss": 0.0314, + "epoch": 0.07, + "learning_rate": 0.0002899274005983522, + "loss": 0.0352, "step": 13310 }, { - "epoch": 0.14, - "learning_rate": 0.00027840046701692935, - "loss": 0.0349, + "epoch": 0.07, + "learning_rate": 0.0002899198329053382, + "loss": 0.0352, "step": 13320 }, { - "epoch": 0.14, - "learning_rate": 0.0002783842511513264, - "loss": 0.0358, + "epoch": 0.07, + "learning_rate": 0.0002899122652123242, + "loss": 0.0402, "step": 13330 }, { - "epoch": 0.14, - "learning_rate": 0.00027836803528572354, - "loss": 0.034, + "epoch": 0.07, + "learning_rate": 0.00028990469751931017, + "loss": 0.0315, "step": 13340 }, { - "epoch": 0.14, - "learning_rate": 0.0002783518194201206, - "loss": 0.0474, + "epoch": 0.07, + "learning_rate": 0.0002898971298262962, + "loss": 0.0331, "step": 13350 }, { - "epoch": 0.14, - "learning_rate": 0.0002783356035545177, - "loss": 0.0346, + "epoch": 0.07, + "learning_rate": 0.0002898895621332822, + "loss": 0.0371, "step": 13360 }, { - "epoch": 0.14, - "learning_rate": 0.0002783193876889148, - "loss": 0.036, + "epoch": 0.07, + "learning_rate": 0.00028988199444026817, + "loss": 0.0314, "step": 13370 }, { - "epoch": 0.14, - "learning_rate": 0.0002783031718233119, - "loss": 0.041, + "epoch": 0.07, + "learning_rate": 0.00028987442674725415, + "loss": 0.0473, "step": 13380 }, { - "epoch": 0.14, - "learning_rate": 0.00027828695595770903, - "loss": 0.0397, + "epoch": 0.07, + "learning_rate": 0.00028986685905424013, + "loss": 0.0328, "step": 13390 }, { - "epoch": 0.14, - "learning_rate": 0.0002782707400921061, - "loss": 0.0341, + "epoch": 0.07, + "learning_rate": 0.0002898592913612261, + "loss": 0.0332, "step": 13400 }, { - "epoch": 0.14, - "learning_rate": 0.00027825452422650316, - "loss": 0.0313, + "epoch": 0.07, + "learning_rate": 0.00028985172366821215, + "loss": 0.0323, "step": 13410 }, { - "epoch": 0.15, - "learning_rate": 0.0002782383083609003, - "loss": 0.0329, + "epoch": 0.07, + "learning_rate": 0.00028984415597519813, + "loss": 0.0412, "step": 13420 }, { - "epoch": 0.15, - "learning_rate": 0.0002782220924952974, - "loss": 0.0845, + "epoch": 0.07, + "learning_rate": 0.0002898365882821841, + "loss": 0.037, "step": 13430 }, { - "epoch": 0.15, - "learning_rate": 0.00027820587662969446, - "loss": 0.0418, + "epoch": 0.07, + "learning_rate": 0.0002898290205891701, + "loss": 0.0363, "step": 13440 }, { - "epoch": 0.15, - "learning_rate": 0.00027818966076409153, - "loss": 0.0442, + "epoch": 0.07, + "learning_rate": 0.00028982145289615607, + "loss": 0.0358, "step": 13450 }, { - "epoch": 0.15, - "learning_rate": 0.00027817344489848865, - "loss": 0.0336, + "epoch": 0.07, + "learning_rate": 0.00028981388520314205, + "loss": 0.026, "step": 13460 }, { - "epoch": 0.15, - "learning_rate": 0.00027815722903288577, - "loss": 0.0342, + "epoch": 0.07, + "learning_rate": 0.00028980631751012804, + "loss": 0.04, "step": 13470 }, { - "epoch": 0.15, - "learning_rate": 0.00027814101316728284, - "loss": 0.0341, + "epoch": 0.07, + "learning_rate": 0.00028979874981711407, + "loss": 0.0377, "step": 13480 }, { - "epoch": 0.15, - "learning_rate": 0.0002781247973016799, - "loss": 0.0334, + "epoch": 0.07, + "learning_rate": 0.00028979118212410005, + "loss": 0.0385, "step": 13490 }, { - "epoch": 0.15, - "learning_rate": 0.000278108581436077, - "loss": 0.0308, + "epoch": 0.07, + "learning_rate": 0.00028978361443108603, + "loss": 0.0294, "step": 13500 }, { - "epoch": 0.15, - "learning_rate": 0.00027809236557047414, - "loss": 0.03, + "epoch": 0.07, + "learning_rate": 0.000289776046738072, + "loss": 0.0346, "step": 13510 }, { - "epoch": 0.15, - "learning_rate": 0.0002780761497048712, - "loss": 0.0457, + "epoch": 0.07, + "learning_rate": 0.000289768479045058, + "loss": 0.0333, "step": 13520 }, { - "epoch": 0.15, - "learning_rate": 0.0002780599338392683, - "loss": 0.0372, + "epoch": 0.07, + "learning_rate": 0.000289760911352044, + "loss": 0.0357, "step": 13530 }, { - "epoch": 0.15, - "learning_rate": 0.0002780437179736654, - "loss": 0.0297, + "epoch": 0.07, + "learning_rate": 0.00028975334365903, + "loss": 0.0348, "step": 13540 }, { - "epoch": 0.15, - "learning_rate": 0.0002780275021080625, - "loss": 0.0325, + "epoch": 0.07, + "learning_rate": 0.000289745775966016, + "loss": 0.0355, "step": 13550 }, { - "epoch": 0.15, - "learning_rate": 0.00027801128624245963, - "loss": 0.0341, + "epoch": 0.07, + "learning_rate": 0.000289738208273002, + "loss": 0.0329, "step": 13560 }, { - "epoch": 0.15, - "learning_rate": 0.0002779950703768567, - "loss": 0.0329, + "epoch": 0.07, + "learning_rate": 0.00028973064057998796, + "loss": 0.0385, "step": 13570 }, { - "epoch": 0.15, - "learning_rate": 0.00027797885451125376, - "loss": 0.0324, + "epoch": 0.07, + "learning_rate": 0.00028972307288697394, + "loss": 0.0433, "step": 13580 }, { - "epoch": 0.15, - "learning_rate": 0.0002779626386456509, - "loss": 0.029, + "epoch": 0.07, + "learning_rate": 0.0002897155051939599, + "loss": 0.0325, "step": 13590 }, { - "epoch": 0.15, - "learning_rate": 0.000277946422780048, - "loss": 0.0345, + "epoch": 0.07, + "learning_rate": 0.00028970793750094596, + "loss": 0.0367, "step": 13600 }, { - "epoch": 0.15, - "learning_rate": 0.00027793020691444507, - "loss": 0.0314, + "epoch": 0.07, + "learning_rate": 0.00028970036980793194, + "loss": 0.0551, "step": 13610 }, { - "epoch": 0.15, - "learning_rate": 0.00027791399104884213, - "loss": 0.0311, + "epoch": 0.07, + "learning_rate": 0.0002896928021149179, + "loss": 0.0347, "step": 13620 }, { - "epoch": 0.15, - "learning_rate": 0.00027789777518323925, - "loss": 0.0396, + "epoch": 0.07, + "learning_rate": 0.0002896852344219039, + "loss": 0.0574, "step": 13630 }, { - "epoch": 0.15, - "learning_rate": 0.0002778815593176364, - "loss": 0.0309, + "epoch": 0.07, + "learning_rate": 0.0002896776667288899, + "loss": 0.0331, "step": 13640 }, { - "epoch": 0.15, - "learning_rate": 0.00027786534345203344, - "loss": 0.0285, + "epoch": 0.07, + "learning_rate": 0.00028967009903587586, + "loss": 0.0646, "step": 13650 }, { - "epoch": 0.15, - "learning_rate": 0.0002778491275864305, - "loss": 0.0278, + "epoch": 0.07, + "learning_rate": 0.00028966253134286185, + "loss": 0.0507, "step": 13660 }, { - "epoch": 0.15, - "learning_rate": 0.0002778329117208276, - "loss": 0.0331, + "epoch": 0.07, + "learning_rate": 0.0002896549636498479, + "loss": 0.0312, "step": 13670 }, { - "epoch": 0.15, - "learning_rate": 0.00027781669585522474, - "loss": 0.0318, + "epoch": 0.07, + "learning_rate": 0.00028964739595683386, + "loss": 0.0364, "step": 13680 }, { - "epoch": 0.15, - "learning_rate": 0.00027780047998962186, - "loss": 0.0313, + "epoch": 0.07, + "learning_rate": 0.00028963982826381984, + "loss": 0.0587, "step": 13690 }, { - "epoch": 0.15, - "learning_rate": 0.00027778426412401893, - "loss": 0.0283, + "epoch": 0.07, + "learning_rate": 0.0002896322605708058, + "loss": 0.0328, "step": 13700 }, { - "epoch": 0.15, - "learning_rate": 0.000277768048258416, - "loss": 0.035, + "epoch": 0.07, + "learning_rate": 0.0002896246928777918, + "loss": 0.04, "step": 13710 }, { - "epoch": 0.15, - "learning_rate": 0.0002777518323928131, - "loss": 0.0304, + "epoch": 0.07, + "learning_rate": 0.0002896171251847778, + "loss": 0.0367, "step": 13720 }, { - "epoch": 0.15, - "learning_rate": 0.00027773561652721023, - "loss": 0.0354, + "epoch": 0.07, + "learning_rate": 0.0002896095574917638, + "loss": 0.0464, "step": 13730 }, { - "epoch": 0.15, - "learning_rate": 0.0002777194006616073, - "loss": 0.0344, + "epoch": 0.07, + "learning_rate": 0.0002896019897987498, + "loss": 0.0357, "step": 13740 }, { - "epoch": 0.15, - "learning_rate": 0.00027770318479600437, - "loss": 0.0348, + "epoch": 0.07, + "learning_rate": 0.0002895944221057358, + "loss": 0.0395, "step": 13750 }, { - "epoch": 0.15, - "learning_rate": 0.0002776869689304015, - "loss": 0.0328, + "epoch": 0.07, + "learning_rate": 0.00028958685441272177, + "loss": 0.0346, "step": 13760 }, { - "epoch": 0.15, - "learning_rate": 0.0002776707530647986, - "loss": 0.0368, + "epoch": 0.07, + "learning_rate": 0.00028957928671970775, + "loss": 0.0306, "step": 13770 }, { - "epoch": 0.15, - "learning_rate": 0.00027765453719919567, - "loss": 0.0342, + "epoch": 0.07, + "learning_rate": 0.00028957171902669373, + "loss": 0.0604, "step": 13780 }, { - "epoch": 0.15, - "learning_rate": 0.00027763832133359274, - "loss": 0.0268, + "epoch": 0.07, + "learning_rate": 0.0002895641513336797, + "loss": 0.0405, "step": 13790 }, { - "epoch": 0.15, - "learning_rate": 0.00027762210546798986, - "loss": 0.0298, + "epoch": 0.07, + "learning_rate": 0.00028955658364066575, + "loss": 0.0467, "step": 13800 }, { - "epoch": 0.15, - "learning_rate": 0.000277605889602387, - "loss": 0.0652, + "epoch": 0.07, + "learning_rate": 0.00028954901594765173, + "loss": 0.0378, "step": 13810 }, { - "epoch": 0.15, - "learning_rate": 0.00027758967373678404, - "loss": 0.0309, + "epoch": 0.07, + "learning_rate": 0.0002895414482546377, + "loss": 0.0559, "step": 13820 }, { - "epoch": 0.15, - "learning_rate": 0.00027757345787118116, - "loss": 0.03, + "epoch": 0.07, + "learning_rate": 0.0002895338805616237, + "loss": 0.0322, "step": 13830 }, { - "epoch": 0.15, - "learning_rate": 0.00027755724200557823, - "loss": 0.0903, + "epoch": 0.07, + "learning_rate": 0.0002895263128686097, + "loss": 0.0332, "step": 13840 }, { - "epoch": 0.15, - "learning_rate": 0.00027754102613997535, - "loss": 0.0487, + "epoch": 0.07, + "learning_rate": 0.00028951874517559566, + "loss": 0.0363, "step": 13850 }, { - "epoch": 0.15, - "learning_rate": 0.0002775248102743724, - "loss": 0.0474, + "epoch": 0.07, + "learning_rate": 0.0002895111774825817, + "loss": 0.0429, "step": 13860 }, { - "epoch": 0.15, - "learning_rate": 0.00027750859440876953, - "loss": 0.0322, + "epoch": 0.07, + "learning_rate": 0.00028950360978956767, + "loss": 0.0317, "step": 13870 }, { - "epoch": 0.15, - "learning_rate": 0.0002774923785431666, - "loss": 0.0306, + "epoch": 0.07, + "learning_rate": 0.00028949604209655365, + "loss": 0.0326, "step": 13880 }, { - "epoch": 0.15, - "learning_rate": 0.0002774761626775637, - "loss": 0.1102, + "epoch": 0.07, + "learning_rate": 0.00028948847440353964, + "loss": 0.0333, "step": 13890 }, { - "epoch": 0.15, - "learning_rate": 0.0002774599468119608, - "loss": 0.0365, + "epoch": 0.07, + "learning_rate": 0.0002894809067105256, + "loss": 0.0299, "step": 13900 }, { - "epoch": 0.15, - "learning_rate": 0.0002774437309463579, + "epoch": 0.07, + "learning_rate": 0.0002894733390175116, "loss": 0.0324, "step": 13910 }, { - "epoch": 0.15, - "learning_rate": 0.00027742751508075497, - "loss": 0.0335, + "epoch": 0.07, + "learning_rate": 0.00028946577132449763, + "loss": 0.0354, "step": 13920 }, { - "epoch": 0.15, - "learning_rate": 0.0002774112992151521, - "loss": 0.033, + "epoch": 0.07, + "learning_rate": 0.0002894582036314836, + "loss": 0.0404, "step": 13930 }, { - "epoch": 0.15, - "learning_rate": 0.00027739508334954916, - "loss": 0.0327, + "epoch": 0.07, + "learning_rate": 0.0002894506359384696, + "loss": 0.0354, "step": 13940 }, { - "epoch": 0.15, - "learning_rate": 0.0002773788674839463, - "loss": 0.0316, + "epoch": 0.07, + "learning_rate": 0.0002894430682454556, + "loss": 0.0367, "step": 13950 }, { - "epoch": 0.15, - "learning_rate": 0.00027736265161834334, - "loss": 0.0322, + "epoch": 0.07, + "learning_rate": 0.00028943550055244156, + "loss": 0.031, "step": 13960 }, { - "epoch": 0.15, - "learning_rate": 0.00027734643575274046, - "loss": 0.0365, + "epoch": 0.07, + "learning_rate": 0.00028942793285942754, + "loss": 0.0277, "step": 13970 }, { - "epoch": 0.15, - "learning_rate": 0.0002773302198871375, - "loss": 0.038, + "epoch": 0.07, + "learning_rate": 0.0002894203651664135, + "loss": 0.0345, "step": 13980 }, { - "epoch": 0.15, - "learning_rate": 0.00027731400402153465, - "loss": 0.0291, + "epoch": 0.07, + "learning_rate": 0.00028941279747339956, + "loss": 0.0318, "step": 13990 }, { - "epoch": 0.15, - "learning_rate": 0.00027729778815593177, - "loss": 0.0404, + "epoch": 0.07, + "learning_rate": 0.00028940522978038554, + "loss": 0.0418, "step": 14000 }, { - "epoch": 0.15, - "eval_cer": 0.9215990285544536, - "eval_loss": 0.023803718388080597, - "eval_runtime": 119.9898, - "eval_samples_per_second": 16.668, - "eval_steps_per_second": 4.167, + "epoch": 0.07, + "eval_cer": 0.9144731670915385, + "eval_loss": 0.02422579564154148, + "eval_runtime": 116.5786, + "eval_samples_per_second": 17.156, + "eval_steps_per_second": 4.289, "step": 14000 }, { - "epoch": 0.15, - "learning_rate": 0.00027728157229032883, - "loss": 0.0351, + "epoch": 0.07, + "learning_rate": 0.0002893976620873715, + "loss": 0.0302, "step": 14010 }, { - "epoch": 0.15, - "learning_rate": 0.0002772653564247259, - "loss": 0.0353, + "epoch": 0.07, + "learning_rate": 0.0002893900943943575, + "loss": 0.0365, "step": 14020 }, { - "epoch": 0.15, - "learning_rate": 0.000277249140559123, - "loss": 0.0449, + "epoch": 0.07, + "learning_rate": 0.0002893825267013435, + "loss": 0.0346, "step": 14030 }, { - "epoch": 0.15, - "learning_rate": 0.00027723292469352014, - "loss": 0.0301, + "epoch": 0.07, + "learning_rate": 0.00028937495900832947, + "loss": 0.0365, "step": 14040 }, { - "epoch": 0.15, - "learning_rate": 0.0002772167088279172, - "loss": 0.0349, + "epoch": 0.07, + "learning_rate": 0.0002893673913153155, + "loss": 0.0297, "step": 14050 }, { - "epoch": 0.15, - "learning_rate": 0.00027720049296231427, - "loss": 0.0326, + "epoch": 0.07, + "learning_rate": 0.0002893598236223015, + "loss": 0.0367, "step": 14060 }, { - "epoch": 0.15, - "learning_rate": 0.0002771842770967114, - "loss": 0.038, + "epoch": 0.07, + "learning_rate": 0.00028935225592928746, + "loss": 0.0343, "step": 14070 }, { - "epoch": 0.15, - "learning_rate": 0.0002771680612311085, - "loss": 0.0362, + "epoch": 0.07, + "learning_rate": 0.00028934468823627345, + "loss": 0.0285, "step": 14080 }, { - "epoch": 0.15, - "learning_rate": 0.0002771518453655056, - "loss": 0.0422, + "epoch": 0.07, + "learning_rate": 0.00028933712054325943, + "loss": 0.0311, "step": 14090 }, { - "epoch": 0.15, - "learning_rate": 0.0002771356294999027, - "loss": 0.0372, + "epoch": 0.07, + "learning_rate": 0.0002893295528502454, + "loss": 0.0287, "step": 14100 }, { - "epoch": 0.15, - "learning_rate": 0.00027711941363429976, - "loss": 0.0312, + "epoch": 0.07, + "learning_rate": 0.00028932198515723144, + "loss": 0.034, "step": 14110 }, { - "epoch": 0.15, - "learning_rate": 0.0002771031977686969, - "loss": 0.0353, + "epoch": 0.07, + "learning_rate": 0.0002893144174642174, + "loss": 0.0345, "step": 14120 }, { - "epoch": 0.15, - "learning_rate": 0.000277086981903094, - "loss": 0.0319, + "epoch": 0.07, + "learning_rate": 0.0002893068497712034, + "loss": 0.0444, "step": 14130 }, { - "epoch": 0.15, - "learning_rate": 0.00027707076603749106, - "loss": 0.0296, + "epoch": 0.07, + "learning_rate": 0.0002892992820781894, + "loss": 0.0327, "step": 14140 }, { - "epoch": 0.15, - "learning_rate": 0.00027705455017188813, - "loss": 0.0347, + "epoch": 0.07, + "learning_rate": 0.00028929171438517537, + "loss": 0.0286, "step": 14150 }, { - "epoch": 0.15, - "learning_rate": 0.00027703833430628525, - "loss": 0.0341, + "epoch": 0.07, + "learning_rate": 0.00028928414669216135, + "loss": 0.0295, "step": 14160 }, { - "epoch": 0.15, - "learning_rate": 0.00027702211844068237, - "loss": 0.0296, + "epoch": 0.07, + "learning_rate": 0.00028927657899914733, + "loss": 0.0294, "step": 14170 }, { - "epoch": 0.15, - "learning_rate": 0.00027700590257507944, - "loss": 0.0322, + "epoch": 0.07, + "learning_rate": 0.00028926901130613337, + "loss": 0.0357, "step": 14180 }, { - "epoch": 0.15, - "learning_rate": 0.0002769896867094765, - "loss": 0.0292, + "epoch": 0.07, + "learning_rate": 0.00028926144361311935, + "loss": 0.035, "step": 14190 }, { - "epoch": 0.15, - "learning_rate": 0.0002769734708438736, - "loss": 0.0294, + "epoch": 0.07, + "learning_rate": 0.00028925387592010533, + "loss": 0.0372, "step": 14200 }, { - "epoch": 0.15, - "learning_rate": 0.00027695725497827074, - "loss": 0.0348, + "epoch": 0.07, + "learning_rate": 0.0002892463082270913, + "loss": 0.036, "step": 14210 }, { - "epoch": 0.15, - "learning_rate": 0.0002769410391126678, - "loss": 0.032, + "epoch": 0.07, + "learning_rate": 0.0002892387405340773, + "loss": 0.0359, "step": 14220 }, { - "epoch": 0.15, - "learning_rate": 0.00027692482324706487, - "loss": 0.0336, + "epoch": 0.07, + "learning_rate": 0.0002892311728410633, + "loss": 0.0477, "step": 14230 }, { - "epoch": 0.15, - "learning_rate": 0.000276908607381462, - "loss": 0.0353, + "epoch": 0.07, + "learning_rate": 0.0002892236051480493, + "loss": 0.0356, "step": 14240 }, { - "epoch": 0.15, - "learning_rate": 0.0002768923915158591, - "loss": 0.0341, + "epoch": 0.07, + "learning_rate": 0.0002892160374550353, + "loss": 0.0357, "step": 14250 }, { - "epoch": 0.15, - "learning_rate": 0.0002768761756502562, - "loss": 0.0464, + "epoch": 0.07, + "learning_rate": 0.0002892084697620213, + "loss": 0.0348, "step": 14260 }, { - "epoch": 0.15, - "learning_rate": 0.0002768599597846533, - "loss": 0.0359, + "epoch": 0.07, + "learning_rate": 0.00028920090206900726, + "loss": 0.0356, "step": 14270 }, { - "epoch": 0.15, - "learning_rate": 0.00027684374391905036, - "loss": 0.0613, + "epoch": 0.07, + "learning_rate": 0.00028919333437599324, + "loss": 0.0336, "step": 14280 }, { - "epoch": 0.15, - "learning_rate": 0.0002768275280534475, - "loss": 0.0445, + "epoch": 0.07, + "learning_rate": 0.0002891857666829792, + "loss": 0.053, "step": 14290 }, { - "epoch": 0.15, - "learning_rate": 0.00027681131218784455, - "loss": 0.0389, + "epoch": 0.07, + "learning_rate": 0.0002891781989899652, + "loss": 0.0315, "step": 14300 }, { - "epoch": 0.15, - "learning_rate": 0.00027679509632224167, - "loss": 0.0336, + "epoch": 0.07, + "learning_rate": 0.00028917063129695124, + "loss": 0.0358, "step": 14310 }, { - "epoch": 0.15, - "learning_rate": 0.00027677888045663873, - "loss": 0.0661, + "epoch": 0.07, + "learning_rate": 0.0002891630636039372, + "loss": 0.0324, "step": 14320 }, { - "epoch": 0.15, - "learning_rate": 0.00027676266459103585, - "loss": 0.0439, + "epoch": 0.07, + "learning_rate": 0.0002891554959109232, + "loss": 0.0473, "step": 14330 }, { - "epoch": 0.16, - "learning_rate": 0.0002767464487254329, - "loss": 0.0377, + "epoch": 0.07, + "learning_rate": 0.0002891479282179092, + "loss": 0.0392, "step": 14340 }, { - "epoch": 0.16, - "learning_rate": 0.00027673023285983004, - "loss": 0.0317, + "epoch": 0.07, + "learning_rate": 0.00028914036052489516, + "loss": 0.0394, "step": 14350 }, { - "epoch": 0.16, - "learning_rate": 0.0002767140169942271, - "loss": 0.032, + "epoch": 0.07, + "learning_rate": 0.00028913279283188114, + "loss": 0.0356, "step": 14360 }, { - "epoch": 0.16, - "learning_rate": 0.0002766978011286242, - "loss": 0.0305, + "epoch": 0.07, + "learning_rate": 0.0002891252251388672, + "loss": 0.0348, "step": 14370 }, { - "epoch": 0.16, - "learning_rate": 0.0002766815852630213, - "loss": 0.038, + "epoch": 0.07, + "learning_rate": 0.00028911765744585316, + "loss": 0.0415, "step": 14380 }, { - "epoch": 0.16, - "learning_rate": 0.0002766653693974184, - "loss": 0.0357, + "epoch": 0.07, + "learning_rate": 0.00028911008975283914, + "loss": 0.0364, "step": 14390 }, { - "epoch": 0.16, - "learning_rate": 0.00027664915353181553, - "loss": 0.0334, + "epoch": 0.07, + "learning_rate": 0.0002891025220598251, + "loss": 0.0495, "step": 14400 }, { - "epoch": 0.16, - "learning_rate": 0.0002766329376662126, - "loss": 0.0338, + "epoch": 0.07, + "learning_rate": 0.0002890949543668111, + "loss": 0.0333, "step": 14410 }, { - "epoch": 0.16, - "learning_rate": 0.0002766167218006097, - "loss": 0.0379, + "epoch": 0.07, + "learning_rate": 0.0002890873866737971, + "loss": 0.0472, "step": 14420 }, { - "epoch": 0.16, - "learning_rate": 0.0002766005059350068, - "loss": 0.035, + "epoch": 0.07, + "learning_rate": 0.0002890798189807831, + "loss": 0.0325, "step": 14430 }, { - "epoch": 0.16, - "learning_rate": 0.0002765842900694039, - "loss": 0.0392, + "epoch": 0.07, + "learning_rate": 0.0002890722512877691, + "loss": 0.0442, "step": 14440 }, { - "epoch": 0.16, - "learning_rate": 0.00027656807420380097, - "loss": 0.0302, + "epoch": 0.07, + "learning_rate": 0.0002890646835947551, + "loss": 0.0373, "step": 14450 }, { - "epoch": 0.16, - "learning_rate": 0.0002765518583381981, - "loss": 0.035, + "epoch": 0.07, + "learning_rate": 0.000289057115901741, + "loss": 0.0391, "step": 14460 }, { - "epoch": 0.16, - "learning_rate": 0.00027653564247259515, - "loss": 0.037, + "epoch": 0.07, + "learning_rate": 0.00028904954820872705, + "loss": 0.0436, "step": 14470 }, { - "epoch": 0.16, - "learning_rate": 0.00027651942660699227, - "loss": 0.0522, + "epoch": 0.07, + "learning_rate": 0.00028904198051571303, + "loss": 0.037, "step": 14480 }, { - "epoch": 0.16, - "learning_rate": 0.00027650321074138934, - "loss": 0.0406, + "epoch": 0.07, + "learning_rate": 0.000289034412822699, + "loss": 0.0348, "step": 14490 }, { - "epoch": 0.16, - "learning_rate": 0.00027648699487578646, - "loss": 0.0317, + "epoch": 0.07, + "learning_rate": 0.000289026845129685, + "loss": 0.0468, "step": 14500 }, { - "epoch": 0.16, - "learning_rate": 0.0002764707790101835, - "loss": 0.0339, + "epoch": 0.07, + "learning_rate": 0.000289019277436671, + "loss": 0.0449, "step": 14510 }, { - "epoch": 0.16, - "learning_rate": 0.00027645456314458064, - "loss": 0.0346, + "epoch": 0.07, + "learning_rate": 0.00028901170974365695, + "loss": 0.035, "step": 14520 }, { - "epoch": 0.16, - "learning_rate": 0.0002764383472789777, - "loss": 0.0313, + "epoch": 0.07, + "learning_rate": 0.00028900414205064294, + "loss": 0.0357, "step": 14530 }, { - "epoch": 0.16, - "learning_rate": 0.00027642213141337483, - "loss": 0.0263, + "epoch": 0.07, + "learning_rate": 0.00028899657435762897, + "loss": 0.0312, "step": 14540 }, { - "epoch": 0.16, - "learning_rate": 0.0002764059155477719, - "loss": 0.0335, + "epoch": 0.07, + "learning_rate": 0.00028898900666461495, + "loss": 0.038, "step": 14550 }, { - "epoch": 0.16, - "learning_rate": 0.000276389699682169, + "epoch": 0.07, + "learning_rate": 0.00028898143897160093, "loss": 0.0329, "step": 14560 }, { - "epoch": 0.16, - "learning_rate": 0.00027637348381656613, - "loss": 0.0335, + "epoch": 0.07, + "learning_rate": 0.0002889738712785869, + "loss": 0.0311, "step": 14570 }, { - "epoch": 0.16, - "learning_rate": 0.0002763572679509632, - "loss": 0.0306, + "epoch": 0.07, + "learning_rate": 0.0002889663035855729, + "loss": 0.0367, "step": 14580 }, { - "epoch": 0.16, - "learning_rate": 0.00027634105208536027, - "loss": 0.0375, + "epoch": 0.07, + "learning_rate": 0.0002889587358925589, + "loss": 0.0503, "step": 14590 }, { - "epoch": 0.16, - "learning_rate": 0.0002763248362197574, - "loss": 0.0532, + "epoch": 0.07, + "learning_rate": 0.0002889511681995449, + "loss": 0.0425, "step": 14600 }, { - "epoch": 0.16, - "learning_rate": 0.0002763086203541545, - "loss": 0.0337, + "epoch": 0.07, + "learning_rate": 0.0002889436005065309, + "loss": 0.0403, "step": 14610 }, { - "epoch": 0.16, - "learning_rate": 0.00027629240448855157, - "loss": 0.0334, + "epoch": 0.07, + "learning_rate": 0.0002889360328135169, + "loss": 0.0389, "step": 14620 }, { - "epoch": 0.16, - "learning_rate": 0.00027627618862294864, - "loss": 0.0396, + "epoch": 0.07, + "learning_rate": 0.00028892846512050286, + "loss": 0.0358, "step": 14630 }, { - "epoch": 0.16, - "learning_rate": 0.00027625997275734576, - "loss": 0.0291, + "epoch": 0.07, + "learning_rate": 0.00028892089742748884, + "loss": 0.0336, "step": 14640 }, { - "epoch": 0.16, - "learning_rate": 0.0002762437568917429, - "loss": 0.0305, + "epoch": 0.07, + "learning_rate": 0.0002889133297344748, + "loss": 0.0622, "step": 14650 }, { - "epoch": 0.16, - "learning_rate": 0.00027622754102613994, - "loss": 0.0677, + "epoch": 0.07, + "learning_rate": 0.00028890576204146086, + "loss": 0.0343, "step": 14660 }, { - "epoch": 0.16, - "learning_rate": 0.000276211325160537, - "loss": 0.0329, + "epoch": 0.07, + "learning_rate": 0.00028889819434844684, + "loss": 0.0374, "step": 14670 }, { - "epoch": 0.16, - "learning_rate": 0.0002761951092949341, - "loss": 0.0365, + "epoch": 0.07, + "learning_rate": 0.0002888906266554328, + "loss": 0.0478, "step": 14680 }, { - "epoch": 0.16, - "learning_rate": 0.00027617889342933125, - "loss": 0.0316, + "epoch": 0.07, + "learning_rate": 0.0002888830589624188, + "loss": 0.0415, "step": 14690 }, { - "epoch": 0.16, - "learning_rate": 0.00027616267756372837, - "loss": 0.0329, + "epoch": 0.07, + "learning_rate": 0.0002888754912694048, + "loss": 0.0346, "step": 14700 }, { - "epoch": 0.16, - "learning_rate": 0.00027614646169812543, - "loss": 0.0299, + "epoch": 0.07, + "learning_rate": 0.00028886792357639076, + "loss": 0.0348, "step": 14710 }, { - "epoch": 0.16, - "learning_rate": 0.0002761302458325225, - "loss": 0.0351, + "epoch": 0.07, + "learning_rate": 0.00028886035588337675, + "loss": 0.0324, "step": 14720 }, { - "epoch": 0.16, - "learning_rate": 0.0002761140299669196, - "loss": 0.0327, + "epoch": 0.07, + "learning_rate": 0.0002888527881903628, + "loss": 0.0433, "step": 14730 }, { - "epoch": 0.16, - "learning_rate": 0.00027609781410131674, - "loss": 0.0282, + "epoch": 0.07, + "learning_rate": 0.00028884522049734876, + "loss": 0.03, "step": 14740 }, { - "epoch": 0.16, - "learning_rate": 0.0002760815982357138, - "loss": 0.0343, + "epoch": 0.07, + "learning_rate": 0.00028883765280433474, + "loss": 0.0347, "step": 14750 }, { - "epoch": 0.16, - "learning_rate": 0.00027606538237011087, - "loss": 0.0454, + "epoch": 0.07, + "learning_rate": 0.0002888300851113207, + "loss": 0.0369, "step": 14760 }, { - "epoch": 0.16, - "learning_rate": 0.000276049166504508, - "loss": 0.0337, + "epoch": 0.07, + "learning_rate": 0.0002888225174183067, + "loss": 0.0439, "step": 14770 }, { - "epoch": 0.16, - "learning_rate": 0.0002760329506389051, - "loss": 0.0325, + "epoch": 0.07, + "learning_rate": 0.0002888149497252927, + "loss": 0.0368, "step": 14780 }, { - "epoch": 0.16, - "learning_rate": 0.0002760167347733022, - "loss": 0.0344, + "epoch": 0.07, + "learning_rate": 0.0002888073820322787, + "loss": 0.0311, "step": 14790 }, { - "epoch": 0.16, - "learning_rate": 0.00027600051890769924, - "loss": 0.0291, + "epoch": 0.07, + "learning_rate": 0.0002887998143392647, + "loss": 0.0356, "step": 14800 }, { - "epoch": 0.16, - "learning_rate": 0.00027598430304209636, - "loss": 0.0326, + "epoch": 0.07, + "learning_rate": 0.0002887922466462507, + "loss": 0.0304, "step": 14810 }, { - "epoch": 0.16, - "learning_rate": 0.0002759680871764935, - "loss": 0.0306, + "epoch": 0.07, + "learning_rate": 0.00028878467895323667, + "loss": 0.0304, "step": 14820 }, { - "epoch": 0.16, - "learning_rate": 0.00027595187131089055, - "loss": 0.0312, + "epoch": 0.07, + "learning_rate": 0.00028877711126022265, + "loss": 0.037, "step": 14830 }, { - "epoch": 0.16, - "learning_rate": 0.00027593565544528766, - "loss": 0.0325, + "epoch": 0.07, + "learning_rate": 0.00028876954356720863, + "loss": 0.0331, "step": 14840 }, { - "epoch": 0.16, - "learning_rate": 0.00027591943957968473, - "loss": 0.0378, + "epoch": 0.07, + "learning_rate": 0.0002887619758741946, + "loss": 0.0329, "step": 14850 }, { - "epoch": 0.16, - "learning_rate": 0.00027590322371408185, - "loss": 0.0327, + "epoch": 0.07, + "learning_rate": 0.00028875440818118065, + "loss": 0.0359, "step": 14860 }, { - "epoch": 0.16, - "learning_rate": 0.0002758870078484789, - "loss": 0.0366, + "epoch": 0.08, + "learning_rate": 0.00028874684048816663, + "loss": 0.0347, "step": 14870 }, { - "epoch": 0.16, - "learning_rate": 0.00027587079198287604, - "loss": 0.0323, + "epoch": 0.08, + "learning_rate": 0.0002887392727951526, + "loss": 0.0534, "step": 14880 }, { - "epoch": 0.16, - "learning_rate": 0.0002758545761172731, - "loss": 0.0324, + "epoch": 0.08, + "learning_rate": 0.0002887317051021386, + "loss": 0.0317, "step": 14890 }, { - "epoch": 0.16, - "learning_rate": 0.0002758383602516702, - "loss": 0.0303, + "epoch": 0.08, + "learning_rate": 0.0002887241374091246, + "loss": 0.0433, "step": 14900 }, { - "epoch": 0.16, - "learning_rate": 0.0002758221443860673, - "loss": 0.0319, + "epoch": 0.08, + "learning_rate": 0.00028871656971611056, + "loss": 0.0429, "step": 14910 }, { - "epoch": 0.16, - "learning_rate": 0.0002758059285204644, - "loss": 0.029, + "epoch": 0.08, + "learning_rate": 0.0002887090020230966, + "loss": 0.0369, "step": 14920 }, { - "epoch": 0.16, - "learning_rate": 0.00027578971265486147, - "loss": 0.0378, + "epoch": 0.08, + "learning_rate": 0.0002887014343300826, + "loss": 0.0347, "step": 14930 }, { - "epoch": 0.16, - "learning_rate": 0.0002757734967892586, - "loss": 0.0318, + "epoch": 0.08, + "learning_rate": 0.00028869386663706855, + "loss": 0.0352, "step": 14940 }, { - "epoch": 0.16, - "learning_rate": 0.00027575728092365566, - "loss": 0.0315, + "epoch": 0.08, + "learning_rate": 0.00028868629894405454, + "loss": 0.0322, "step": 14950 }, { - "epoch": 0.16, - "learning_rate": 0.0002757410650580528, - "loss": 0.0289, + "epoch": 0.08, + "learning_rate": 0.0002886787312510405, + "loss": 0.0314, "step": 14960 }, { - "epoch": 0.16, - "learning_rate": 0.00027572484919244984, - "loss": 0.028, + "epoch": 0.08, + "learning_rate": 0.0002886711635580265, + "loss": 0.0342, "step": 14970 }, { - "epoch": 0.16, - "learning_rate": 0.00027570863332684696, - "loss": 0.0338, + "epoch": 0.08, + "learning_rate": 0.00028866359586501253, + "loss": 0.0588, "step": 14980 }, { - "epoch": 0.16, - "learning_rate": 0.00027569241746124403, - "loss": 0.0344, + "epoch": 0.08, + "learning_rate": 0.0002886560281719985, + "loss": 0.0336, "step": 14990 }, { - "epoch": 0.16, - "learning_rate": 0.00027567620159564115, - "loss": 0.0265, + "epoch": 0.08, + "learning_rate": 0.0002886484604789845, + "loss": 0.0316, "step": 15000 }, { - "epoch": 0.16, - "eval_cer": 0.9216250866431449, - "eval_loss": 0.02385568805038929, - "eval_runtime": 119.8391, - "eval_samples_per_second": 16.689, - "eval_steps_per_second": 4.172, + "epoch": 0.08, + "eval_cer": 0.9145216868978086, + "eval_loss": 0.025017283856868744, + "eval_runtime": 116.429, + "eval_samples_per_second": 17.178, + "eval_steps_per_second": 4.294, "step": 15000 }, { - "epoch": 0.16, - "learning_rate": 0.00027565998573003827, - "loss": 0.0339, + "epoch": 0.08, + "learning_rate": 0.0002886408927859705, + "loss": 0.0325, "step": 15010 }, { - "epoch": 0.16, - "learning_rate": 0.00027564376986443533, - "loss": 0.033, + "epoch": 0.08, + "learning_rate": 0.00028863332509295646, + "loss": 0.0274, "step": 15020 }, { - "epoch": 0.16, - "learning_rate": 0.0002756275539988324, - "loss": 0.0324, + "epoch": 0.08, + "learning_rate": 0.00028862575739994244, + "loss": 0.0345, "step": 15030 }, { - "epoch": 0.16, - "learning_rate": 0.0002756113381332295, - "loss": 0.0325, + "epoch": 0.08, + "learning_rate": 0.0002886181897069284, + "loss": 0.0322, "step": 15040 }, { - "epoch": 0.16, - "learning_rate": 0.00027559512226762664, - "loss": 0.0323, + "epoch": 0.08, + "learning_rate": 0.00028861062201391446, + "loss": 0.0358, "step": 15050 }, { - "epoch": 0.16, - "learning_rate": 0.0002755789064020237, - "loss": 0.036, + "epoch": 0.08, + "learning_rate": 0.00028860305432090044, + "loss": 0.0312, "step": 15060 }, { - "epoch": 0.16, - "learning_rate": 0.00027556269053642077, - "loss": 0.0282, + "epoch": 0.08, + "learning_rate": 0.0002885954866278864, + "loss": 0.0317, "step": 15070 }, { - "epoch": 0.16, - "learning_rate": 0.0002755464746708179, - "loss": 0.0303, + "epoch": 0.08, + "learning_rate": 0.0002885879189348724, + "loss": 0.0374, "step": 15080 }, { - "epoch": 0.16, - "learning_rate": 0.000275530258805215, - "loss": 0.0312, + "epoch": 0.08, + "learning_rate": 0.0002885803512418584, + "loss": 0.0311, "step": 15090 }, { - "epoch": 0.16, - "learning_rate": 0.0002755140429396121, - "loss": 0.0379, + "epoch": 0.08, + "learning_rate": 0.00028857278354884437, + "loss": 0.0347, "step": 15100 }, { - "epoch": 0.16, - "learning_rate": 0.0002754978270740092, - "loss": 0.0365, + "epoch": 0.08, + "learning_rate": 0.0002885652158558304, + "loss": 0.0314, "step": 15110 }, { - "epoch": 0.16, - "learning_rate": 0.00027548161120840626, - "loss": 0.0379, + "epoch": 0.08, + "learning_rate": 0.0002885576481628164, + "loss": 0.0334, "step": 15120 }, { - "epoch": 0.16, - "learning_rate": 0.0002754653953428034, - "loss": 0.0324, + "epoch": 0.08, + "learning_rate": 0.00028855008046980236, + "loss": 0.0437, "step": 15130 }, { - "epoch": 0.16, - "learning_rate": 0.0002754491794772005, - "loss": 0.0353, + "epoch": 0.08, + "learning_rate": 0.00028854251277678835, + "loss": 0.0346, "step": 15140 }, { - "epoch": 0.16, - "learning_rate": 0.00027543296361159757, - "loss": 0.0393, + "epoch": 0.08, + "learning_rate": 0.00028853494508377433, + "loss": 0.0357, "step": 15150 }, { - "epoch": 0.16, - "learning_rate": 0.00027541674774599463, - "loss": 0.0372, + "epoch": 0.08, + "learning_rate": 0.0002885273773907603, + "loss": 0.0331, "step": 15160 }, { - "epoch": 0.16, - "learning_rate": 0.00027540053188039175, - "loss": 0.0328, + "epoch": 0.08, + "learning_rate": 0.00028851980969774634, + "loss": 0.0358, "step": 15170 }, { - "epoch": 0.16, - "learning_rate": 0.00027538431601478887, - "loss": 0.0334, + "epoch": 0.08, + "learning_rate": 0.0002885122420047323, + "loss": 0.0401, "step": 15180 }, { - "epoch": 0.16, - "learning_rate": 0.00027536810014918594, - "loss": 0.0279, + "epoch": 0.08, + "learning_rate": 0.0002885046743117183, + "loss": 0.0337, "step": 15190 }, { - "epoch": 0.16, - "learning_rate": 0.000275351884283583, - "loss": 0.0302, + "epoch": 0.08, + "learning_rate": 0.0002884971066187043, + "loss": 0.0365, "step": 15200 }, { - "epoch": 0.16, - "learning_rate": 0.0002753356684179801, - "loss": 0.0296, + "epoch": 0.08, + "learning_rate": 0.00028848953892569027, + "loss": 0.0399, "step": 15210 }, { - "epoch": 0.16, - "learning_rate": 0.00027531945255237724, - "loss": 0.0283, + "epoch": 0.08, + "learning_rate": 0.00028848197123267625, + "loss": 0.0353, "step": 15220 }, { - "epoch": 0.16, - "learning_rate": 0.0002753032366867743, - "loss": 0.0309, + "epoch": 0.08, + "learning_rate": 0.00028847440353966223, + "loss": 0.0325, "step": 15230 }, { - "epoch": 0.16, - "learning_rate": 0.0002752870208211714, - "loss": 0.0319, + "epoch": 0.08, + "learning_rate": 0.00028846683584664827, + "loss": 0.0345, "step": 15240 }, { - "epoch": 0.16, - "learning_rate": 0.0002752708049555685, - "loss": 0.0311, + "epoch": 0.08, + "learning_rate": 0.00028845926815363425, + "loss": 0.0326, "step": 15250 }, { - "epoch": 0.16, - "learning_rate": 0.0002752545890899656, - "loss": 0.032, + "epoch": 0.08, + "learning_rate": 0.00028845170046062023, + "loss": 0.0296, "step": 15260 }, { - "epoch": 0.17, - "learning_rate": 0.0002752383732243627, - "loss": 0.0331, + "epoch": 0.08, + "learning_rate": 0.0002884441327676062, + "loss": 0.033, "step": 15270 }, { - "epoch": 0.17, - "learning_rate": 0.0002752221573587598, - "loss": 0.0332, + "epoch": 0.08, + "learning_rate": 0.0002884365650745922, + "loss": 0.0354, "step": 15280 }, { - "epoch": 0.17, - "learning_rate": 0.00027520594149315687, - "loss": 0.0326, + "epoch": 0.08, + "learning_rate": 0.0002884289973815782, + "loss": 0.0502, "step": 15290 }, { - "epoch": 0.17, - "learning_rate": 0.000275189725627554, - "loss": 0.0321, + "epoch": 0.08, + "learning_rate": 0.0002884214296885642, + "loss": 0.0442, "step": 15300 }, { - "epoch": 0.17, - "learning_rate": 0.0002751735097619511, - "loss": 0.0314, + "epoch": 0.08, + "learning_rate": 0.0002884138619955502, + "loss": 0.0323, "step": 15310 }, { - "epoch": 0.17, - "learning_rate": 0.00027515729389634817, - "loss": 0.0362, + "epoch": 0.08, + "learning_rate": 0.0002884062943025362, + "loss": 0.0361, "step": 15320 }, { - "epoch": 0.17, - "learning_rate": 0.00027514107803074524, - "loss": 0.0332, + "epoch": 0.08, + "learning_rate": 0.00028839872660952216, + "loss": 0.0331, "step": 15330 }, { - "epoch": 0.17, - "learning_rate": 0.00027512486216514236, - "loss": 0.0332, + "epoch": 0.08, + "learning_rate": 0.00028839115891650814, + "loss": 0.0325, "step": 15340 }, { - "epoch": 0.17, - "learning_rate": 0.0002751086462995395, - "loss": 0.0323, + "epoch": 0.08, + "learning_rate": 0.0002883835912234941, + "loss": 0.032, "step": 15350 }, { - "epoch": 0.17, - "learning_rate": 0.00027509243043393654, - "loss": 0.0311, + "epoch": 0.08, + "learning_rate": 0.0002883760235304801, + "loss": 0.0329, "step": 15360 }, { - "epoch": 0.17, - "learning_rate": 0.0002750762145683336, - "loss": 0.0361, + "epoch": 0.08, + "learning_rate": 0.00028836845583746614, + "loss": 0.0304, "step": 15370 }, { - "epoch": 0.17, - "learning_rate": 0.00027505999870273073, - "loss": 0.0292, + "epoch": 0.08, + "learning_rate": 0.0002883608881444521, + "loss": 0.038, "step": 15380 }, { - "epoch": 0.17, - "learning_rate": 0.00027504378283712785, - "loss": 0.0363, + "epoch": 0.08, + "learning_rate": 0.0002883533204514381, + "loss": 0.0385, "step": 15390 }, { - "epoch": 0.17, - "learning_rate": 0.0002750275669715249, - "loss": 0.0298, + "epoch": 0.08, + "learning_rate": 0.0002883457527584241, + "loss": 0.0355, "step": 15400 }, { - "epoch": 0.17, - "learning_rate": 0.00027501135110592203, - "loss": 0.0325, + "epoch": 0.08, + "learning_rate": 0.00028833818506541006, + "loss": 0.0344, "step": 15410 }, { - "epoch": 0.17, - "learning_rate": 0.0002749951352403191, - "loss": 0.0326, + "epoch": 0.08, + "learning_rate": 0.00028833061737239604, + "loss": 0.0325, "step": 15420 }, { - "epoch": 0.17, - "learning_rate": 0.0002749789193747162, - "loss": 0.0287, + "epoch": 0.08, + "learning_rate": 0.0002883230496793821, + "loss": 0.0305, "step": 15430 }, { - "epoch": 0.17, - "learning_rate": 0.0002749627035091133, - "loss": 0.0327, + "epoch": 0.08, + "learning_rate": 0.00028831548198636806, + "loss": 0.0391, "step": 15440 }, { - "epoch": 0.17, - "learning_rate": 0.0002749464876435104, - "loss": 0.0345, + "epoch": 0.08, + "learning_rate": 0.00028830791429335404, + "loss": 0.0369, "step": 15450 }, { - "epoch": 0.17, - "learning_rate": 0.00027493027177790747, - "loss": 0.0315, + "epoch": 0.08, + "learning_rate": 0.00028830034660034, + "loss": 0.0324, "step": 15460 }, { - "epoch": 0.17, - "learning_rate": 0.0002749140559123046, - "loss": 0.0324, + "epoch": 0.08, + "learning_rate": 0.000288292778907326, + "loss": 0.0283, "step": 15470 }, { - "epoch": 0.17, - "learning_rate": 0.00027489784004670165, - "loss": 0.0285, + "epoch": 0.08, + "learning_rate": 0.000288285211214312, + "loss": 0.0287, "step": 15480 }, { - "epoch": 0.17, - "learning_rate": 0.0002748816241810988, - "loss": 0.0358, + "epoch": 0.08, + "learning_rate": 0.000288277643521298, + "loss": 0.0327, "step": 15490 }, { - "epoch": 0.17, - "learning_rate": 0.00027486540831549584, - "loss": 0.0278, + "epoch": 0.08, + "learning_rate": 0.000288270075828284, + "loss": 0.0333, "step": 15500 }, { - "epoch": 0.17, - "learning_rate": 0.00027484919244989296, - "loss": 0.0274, + "epoch": 0.08, + "learning_rate": 0.00028826250813527, + "loss": 0.0343, "step": 15510 }, { - "epoch": 0.17, - "learning_rate": 0.00027483297658429, - "loss": 0.0288, + "epoch": 0.08, + "learning_rate": 0.00028825494044225597, + "loss": 0.0327, "step": 15520 }, { - "epoch": 0.17, - "learning_rate": 0.00027481676071868715, - "loss": 0.0287, + "epoch": 0.08, + "learning_rate": 0.00028824737274924195, + "loss": 0.0358, "step": 15530 }, { - "epoch": 0.17, - "learning_rate": 0.0002748005448530842, - "loss": 0.0304, + "epoch": 0.08, + "learning_rate": 0.00028823980505622793, + "loss": 0.0328, "step": 15540 }, { - "epoch": 0.17, - "learning_rate": 0.00027478432898748133, - "loss": 0.0296, + "epoch": 0.08, + "learning_rate": 0.0002882322373632139, + "loss": 0.0307, "step": 15550 }, { - "epoch": 0.17, - "learning_rate": 0.0002747681131218784, - "loss": 0.0351, + "epoch": 0.08, + "learning_rate": 0.00028822466967019995, + "loss": 0.032, "step": 15560 }, { - "epoch": 0.17, - "learning_rate": 0.0002747518972562755, - "loss": 0.0388, + "epoch": 0.08, + "learning_rate": 0.00028821710197718593, + "loss": 0.0351, "step": 15570 }, { - "epoch": 0.17, - "learning_rate": 0.00027473568139067264, - "loss": 0.0285, + "epoch": 0.08, + "learning_rate": 0.0002882095342841719, + "loss": 0.036, "step": 15580 }, { - "epoch": 0.17, - "learning_rate": 0.0002747194655250697, - "loss": 0.0303, + "epoch": 0.08, + "learning_rate": 0.0002882019665911579, + "loss": 0.0309, "step": 15590 }, { - "epoch": 0.17, - "learning_rate": 0.00027470324965946677, - "loss": 0.034, + "epoch": 0.08, + "learning_rate": 0.00028819439889814387, + "loss": 0.0341, "step": 15600 }, { - "epoch": 0.17, - "learning_rate": 0.0002746870337938639, - "loss": 0.034, + "epoch": 0.08, + "learning_rate": 0.00028818683120512985, + "loss": 0.0327, "step": 15610 }, { - "epoch": 0.17, - "learning_rate": 0.000274670817928261, - "loss": 0.0346, + "epoch": 0.08, + "learning_rate": 0.0002881792635121159, + "loss": 0.0377, "step": 15620 }, { - "epoch": 0.17, - "learning_rate": 0.0002746546020626581, - "loss": 0.0328, + "epoch": 0.08, + "learning_rate": 0.00028817169581910187, + "loss": 0.0316, "step": 15630 }, { - "epoch": 0.17, - "learning_rate": 0.00027463838619705514, - "loss": 0.0349, + "epoch": 0.08, + "learning_rate": 0.00028816412812608785, + "loss": 0.0298, "step": 15640 }, { - "epoch": 0.17, - "learning_rate": 0.00027462217033145226, - "loss": 0.0416, + "epoch": 0.08, + "learning_rate": 0.00028815656043307383, + "loss": 0.0327, "step": 15650 }, { - "epoch": 0.17, - "learning_rate": 0.0002746059544658494, - "loss": 0.0331, + "epoch": 0.08, + "learning_rate": 0.0002881489927400598, + "loss": 0.0333, "step": 15660 }, { - "epoch": 0.17, - "learning_rate": 0.00027458973860024644, - "loss": 0.0298, + "epoch": 0.08, + "learning_rate": 0.0002881414250470458, + "loss": 0.0334, "step": 15670 }, { - "epoch": 0.17, - "learning_rate": 0.0002745735227346435, - "loss": 0.032, + "epoch": 0.08, + "learning_rate": 0.00028813385735403183, + "loss": 0.0327, "step": 15680 }, { - "epoch": 0.17, - "learning_rate": 0.00027455730686904063, - "loss": 0.0292, + "epoch": 0.08, + "learning_rate": 0.0002881262896610178, + "loss": 0.0317, "step": 15690 }, { - "epoch": 0.17, - "learning_rate": 0.00027454109100343775, - "loss": 0.0345, + "epoch": 0.08, + "learning_rate": 0.0002881187219680038, + "loss": 0.0317, "step": 15700 }, { - "epoch": 0.17, - "learning_rate": 0.00027452487513783487, - "loss": 0.0346, + "epoch": 0.08, + "learning_rate": 0.0002881111542749898, + "loss": 0.0326, "step": 15710 }, { - "epoch": 0.17, - "learning_rate": 0.00027450865927223193, - "loss": 0.0345, + "epoch": 0.08, + "learning_rate": 0.00028810358658197576, + "loss": 0.0316, "step": 15720 }, { - "epoch": 0.17, - "learning_rate": 0.000274492443406629, - "loss": 0.0314, + "epoch": 0.08, + "learning_rate": 0.00028809601888896174, + "loss": 0.0351, "step": 15730 }, { - "epoch": 0.17, - "learning_rate": 0.0002744762275410261, - "loss": 0.0317, + "epoch": 0.08, + "learning_rate": 0.0002880884511959477, + "loss": 0.0318, "step": 15740 }, { - "epoch": 0.17, - "learning_rate": 0.00027446001167542324, - "loss": 0.0286, + "epoch": 0.08, + "learning_rate": 0.0002880808835029337, + "loss": 0.0348, "step": 15750 }, { - "epoch": 0.17, - "learning_rate": 0.0002744437958098203, - "loss": 0.0296, + "epoch": 0.08, + "learning_rate": 0.0002880733158099197, + "loss": 0.0315, "step": 15760 }, { - "epoch": 0.17, - "learning_rate": 0.00027442757994421737, - "loss": 0.0315, + "epoch": 0.08, + "learning_rate": 0.00028806574811690566, + "loss": 0.0285, "step": 15770 }, { - "epoch": 0.17, - "learning_rate": 0.0002744113640786145, - "loss": 0.035, + "epoch": 0.08, + "learning_rate": 0.00028805818042389165, + "loss": 0.0318, "step": 15780 }, { - "epoch": 0.17, - "learning_rate": 0.0002743951482130116, - "loss": 0.0319, + "epoch": 0.08, + "learning_rate": 0.0002880506127308777, + "loss": 0.0326, "step": 15790 }, { - "epoch": 0.17, - "learning_rate": 0.0002743789323474087, - "loss": 0.0354, + "epoch": 0.08, + "learning_rate": 0.00028804304503786366, + "loss": 0.0285, "step": 15800 }, { - "epoch": 0.17, - "learning_rate": 0.00027436271648180574, - "loss": 0.0364, + "epoch": 0.08, + "learning_rate": 0.00028803547734484964, + "loss": 0.034, "step": 15810 }, { - "epoch": 0.17, - "learning_rate": 0.00027434650061620286, + "epoch": 0.08, + "learning_rate": 0.0002880279096518356, "loss": 0.0324, "step": 15820 }, { - "epoch": 0.17, - "learning_rate": 0.0002743302847506, - "loss": 0.0357, + "epoch": 0.08, + "learning_rate": 0.0002880203419588216, + "loss": 0.0292, "step": 15830 }, { - "epoch": 0.17, - "learning_rate": 0.00027431406888499705, - "loss": 0.0317, + "epoch": 0.08, + "learning_rate": 0.0002880127742658076, + "loss": 0.0298, "step": 15840 }, { - "epoch": 0.17, - "learning_rate": 0.00027429785301939417, - "loss": 0.0329, + "epoch": 0.08, + "learning_rate": 0.0002880052065727936, + "loss": 0.0283, "step": 15850 }, { - "epoch": 0.17, - "learning_rate": 0.00027428163715379123, - "loss": 0.0335, + "epoch": 0.08, + "learning_rate": 0.0002879976388797796, + "loss": 0.0338, "step": 15860 }, { - "epoch": 0.17, - "learning_rate": 0.00027426542128818835, - "loss": 0.0265, + "epoch": 0.08, + "learning_rate": 0.0002879900711867656, + "loss": 0.0364, "step": 15870 }, { - "epoch": 0.17, - "learning_rate": 0.0002742492054225855, - "loss": 0.0319, + "epoch": 0.08, + "learning_rate": 0.00028798250349375157, + "loss": 0.028, "step": 15880 }, { - "epoch": 0.17, - "learning_rate": 0.00027423298955698254, - "loss": 0.032, + "epoch": 0.08, + "learning_rate": 0.00028797493580073755, + "loss": 0.0322, "step": 15890 }, { - "epoch": 0.17, - "learning_rate": 0.0002742167736913796, - "loss": 0.0304, + "epoch": 0.08, + "learning_rate": 0.00028796736810772353, + "loss": 0.0321, "step": 15900 }, { - "epoch": 0.17, - "learning_rate": 0.0002742005578257767, - "loss": 0.0297, + "epoch": 0.08, + "learning_rate": 0.00028795980041470957, + "loss": 0.0291, "step": 15910 }, { - "epoch": 0.17, - "learning_rate": 0.00027418434196017384, - "loss": 0.031, + "epoch": 0.08, + "learning_rate": 0.00028795223272169555, + "loss": 0.032, "step": 15920 }, { - "epoch": 0.17, - "learning_rate": 0.0002741681260945709, - "loss": 0.0281, + "epoch": 0.08, + "learning_rate": 0.00028794466502868153, + "loss": 0.0289, "step": 15930 }, { - "epoch": 0.17, - "learning_rate": 0.000274151910228968, - "loss": 0.0323, + "epoch": 0.08, + "learning_rate": 0.0002879370973356675, + "loss": 0.0352, "step": 15940 }, { - "epoch": 0.17, - "learning_rate": 0.0002741356943633651, - "loss": 0.0321, + "epoch": 0.08, + "learning_rate": 0.0002879295296426535, + "loss": 0.032, "step": 15950 }, { - "epoch": 0.17, - "learning_rate": 0.0002741194784977622, - "loss": 0.0306, + "epoch": 0.08, + "learning_rate": 0.0002879219619496395, + "loss": 0.0366, "step": 15960 }, { - "epoch": 0.17, - "learning_rate": 0.0002741032626321593, - "loss": 0.0321, + "epoch": 0.08, + "learning_rate": 0.00028791439425662546, + "loss": 0.0315, "step": 15970 }, { - "epoch": 0.17, - "learning_rate": 0.00027408704676655635, - "loss": 0.0297, + "epoch": 0.08, + "learning_rate": 0.0002879068265636115, + "loss": 0.0363, "step": 15980 }, { - "epoch": 0.17, - "learning_rate": 0.00027407083090095347, - "loss": 0.0311, + "epoch": 0.08, + "learning_rate": 0.0002878992588705975, + "loss": 0.0299, "step": 15990 }, { - "epoch": 0.17, - "learning_rate": 0.0002740546150353506, - "loss": 0.029, + "epoch": 0.08, + "learning_rate": 0.00028789169117758345, + "loss": 0.0304, "step": 16000 }, { - "epoch": 0.17, - "eval_cer": 0.9216103203928865, - "eval_loss": 0.02347717247903347, - "eval_runtime": 120.1178, - "eval_samples_per_second": 16.65, - "eval_steps_per_second": 4.163, + "epoch": 0.08, + "eval_cer": 0.9144945158062973, + "eval_loss": 0.02421427145600319, + "eval_runtime": 116.6835, + "eval_samples_per_second": 17.14, + "eval_steps_per_second": 4.285, "step": 16000 }, { - "epoch": 0.17, - "learning_rate": 0.00027403839916974765, - "loss": 0.0309, + "epoch": 0.08, + "learning_rate": 0.00028788412348456944, + "loss": 0.0314, "step": 16010 }, { - "epoch": 0.17, - "learning_rate": 0.00027402218330414477, - "loss": 0.0301, + "epoch": 0.08, + "learning_rate": 0.0002878765557915554, + "loss": 0.0338, "step": 16020 }, { - "epoch": 0.17, - "learning_rate": 0.00027400596743854184, - "loss": 0.0358, + "epoch": 0.08, + "learning_rate": 0.0002878689880985414, + "loss": 0.0299, "step": 16030 }, { - "epoch": 0.17, - "learning_rate": 0.00027398975157293896, - "loss": 0.0314, + "epoch": 0.08, + "learning_rate": 0.00028786142040552743, + "loss": 0.0328, "step": 16040 }, { - "epoch": 0.17, - "learning_rate": 0.000273973535707336, - "loss": 0.03, + "epoch": 0.08, + "learning_rate": 0.0002878538527125134, + "loss": 0.0309, "step": 16050 }, { - "epoch": 0.17, - "learning_rate": 0.00027395731984173314, - "loss": 0.0341, + "epoch": 0.08, + "learning_rate": 0.0002878462850194994, + "loss": 0.0302, "step": 16060 }, { - "epoch": 0.17, - "learning_rate": 0.0002739411039761302, - "loss": 0.0302, + "epoch": 0.08, + "learning_rate": 0.0002878387173264854, + "loss": 0.0344, "step": 16070 }, { - "epoch": 0.17, - "learning_rate": 0.00027392488811052733, - "loss": 0.0337, + "epoch": 0.08, + "learning_rate": 0.00028783114963347136, + "loss": 0.0316, "step": 16080 }, { - "epoch": 0.17, - "learning_rate": 0.0002739086722449244, - "loss": 0.0294, + "epoch": 0.08, + "learning_rate": 0.00028782358194045734, + "loss": 0.034, "step": 16090 }, { - "epoch": 0.17, - "learning_rate": 0.0002738924563793215, - "loss": 0.0294, + "epoch": 0.08, + "learning_rate": 0.0002878160142474433, + "loss": 0.0352, "step": 16100 }, { - "epoch": 0.17, - "learning_rate": 0.0002738762405137186, - "loss": 0.0283, + "epoch": 0.08, + "learning_rate": 0.00028780844655442936, + "loss": 0.0281, "step": 16110 }, { - "epoch": 0.17, - "learning_rate": 0.0002738600246481157, - "loss": 0.0338, + "epoch": 0.08, + "learning_rate": 0.00028780087886141534, + "loss": 0.0263, "step": 16120 }, { - "epoch": 0.17, - "learning_rate": 0.00027384380878251276, - "loss": 0.027, + "epoch": 0.08, + "learning_rate": 0.0002877933111684013, + "loss": 0.0265, "step": 16130 }, { - "epoch": 0.17, - "learning_rate": 0.0002738275929169099, - "loss": 0.0294, + "epoch": 0.08, + "learning_rate": 0.0002877857434753873, + "loss": 0.0284, "step": 16140 }, { - "epoch": 0.17, - "learning_rate": 0.000273811377051307, - "loss": 0.0278, + "epoch": 0.08, + "learning_rate": 0.0002877781757823733, + "loss": 0.0324, "step": 16150 }, { - "epoch": 0.17, - "learning_rate": 0.00027379516118570407, - "loss": 0.0272, + "epoch": 0.08, + "learning_rate": 0.00028777060808935927, + "loss": 0.0283, "step": 16160 }, { - "epoch": 0.17, - "learning_rate": 0.00027377894532010114, - "loss": 0.0295, + "epoch": 0.08, + "learning_rate": 0.0002877630403963453, + "loss": 0.033, "step": 16170 }, { - "epoch": 0.17, - "learning_rate": 0.00027376272945449826, - "loss": 0.0292, + "epoch": 0.08, + "learning_rate": 0.0002877554727033313, + "loss": 0.0318, "step": 16180 }, { - "epoch": 0.18, - "learning_rate": 0.0002737465135888954, - "loss": 0.0307, + "epoch": 0.08, + "learning_rate": 0.00028774790501031726, + "loss": 0.0317, "step": 16190 }, { - "epoch": 0.18, - "learning_rate": 0.00027373029772329244, - "loss": 0.0276, + "epoch": 0.08, + "learning_rate": 0.00028774033731730325, + "loss": 0.0316, "step": 16200 }, { - "epoch": 0.18, - "learning_rate": 0.0002737140818576895, - "loss": 0.0327, + "epoch": 0.08, + "learning_rate": 0.00028773276962428923, + "loss": 0.0288, "step": 16210 }, { - "epoch": 0.18, - "learning_rate": 0.0002736978659920866, - "loss": 0.0308, + "epoch": 0.08, + "learning_rate": 0.0002877252019312752, + "loss": 0.0331, "step": 16220 }, { - "epoch": 0.18, - "learning_rate": 0.00027368165012648375, - "loss": 0.0306, + "epoch": 0.08, + "learning_rate": 0.00028771763423826124, + "loss": 0.03, "step": 16230 }, { - "epoch": 0.18, - "learning_rate": 0.0002736654342608808, - "loss": 0.0286, + "epoch": 0.08, + "learning_rate": 0.0002877100665452472, + "loss": 0.0282, "step": 16240 }, { - "epoch": 0.18, - "learning_rate": 0.0002736492183952779, - "loss": 0.028, + "epoch": 0.08, + "learning_rate": 0.0002877024988522332, + "loss": 0.0327, "step": 16250 }, { - "epoch": 0.18, - "learning_rate": 0.000273633002529675, - "loss": 0.0331, + "epoch": 0.08, + "learning_rate": 0.0002876949311592192, + "loss": 0.0297, "step": 16260 }, { - "epoch": 0.18, - "learning_rate": 0.0002736167866640721, - "loss": 0.0309, + "epoch": 0.08, + "learning_rate": 0.00028768736346620517, + "loss": 0.0416, "step": 16270 }, { - "epoch": 0.18, - "learning_rate": 0.0002736005707984692, - "loss": 0.0292, + "epoch": 0.08, + "learning_rate": 0.00028767979577319115, + "loss": 0.0328, "step": 16280 }, { - "epoch": 0.18, - "learning_rate": 0.0002735843549328663, - "loss": 0.0277, + "epoch": 0.08, + "learning_rate": 0.00028767222808017713, + "loss": 0.028, "step": 16290 }, { - "epoch": 0.18, - "learning_rate": 0.00027356813906726337, - "loss": 0.0296, + "epoch": 0.08, + "learning_rate": 0.00028766466038716317, + "loss": 0.0305, "step": 16300 }, { - "epoch": 0.18, - "learning_rate": 0.0002735519232016605, - "loss": 0.0283, + "epoch": 0.08, + "learning_rate": 0.00028765709269414915, + "loss": 0.0321, "step": 16310 }, { - "epoch": 0.18, - "learning_rate": 0.0002735357073360576, - "loss": 0.0332, + "epoch": 0.08, + "learning_rate": 0.00028764952500113513, + "loss": 0.0368, "step": 16320 }, { - "epoch": 0.18, - "learning_rate": 0.0002735194914704547, - "loss": 0.0277, + "epoch": 0.08, + "learning_rate": 0.0002876419573081211, + "loss": 0.0294, "step": 16330 }, { - "epoch": 0.18, - "learning_rate": 0.00027350327560485174, - "loss": 0.0307, + "epoch": 0.08, + "learning_rate": 0.0002876343896151071, + "loss": 0.028, "step": 16340 }, { - "epoch": 0.18, - "learning_rate": 0.00027348705973924886, - "loss": 0.0331, + "epoch": 0.08, + "learning_rate": 0.0002876268219220931, + "loss": 0.031, "step": 16350 }, { - "epoch": 0.18, - "learning_rate": 0.000273470843873646, - "loss": 0.0316, + "epoch": 0.08, + "learning_rate": 0.0002876192542290791, + "loss": 0.0304, "step": 16360 }, { - "epoch": 0.18, - "learning_rate": 0.00027345462800804304, - "loss": 0.0305, + "epoch": 0.08, + "learning_rate": 0.0002876116865360651, + "loss": 0.0365, "step": 16370 }, { - "epoch": 0.18, - "learning_rate": 0.0002734384121424401, - "loss": 0.0228, + "epoch": 0.08, + "learning_rate": 0.0002876041188430511, + "loss": 0.0327, "step": 16380 }, { - "epoch": 0.18, - "learning_rate": 0.00027342219627683723, - "loss": 0.0338, + "epoch": 0.08, + "learning_rate": 0.00028759655115003706, + "loss": 0.0309, "step": 16390 }, { - "epoch": 0.18, - "learning_rate": 0.00027340598041123435, - "loss": 0.0278, + "epoch": 0.08, + "learning_rate": 0.00028758898345702304, + "loss": 0.0306, "step": 16400 }, { - "epoch": 0.18, - "learning_rate": 0.0002733897645456314, - "loss": 0.0294, + "epoch": 0.08, + "learning_rate": 0.000287581415764009, + "loss": 0.0296, "step": 16410 }, { - "epoch": 0.18, - "learning_rate": 0.00027337354868002854, - "loss": 0.0287, + "epoch": 0.08, + "learning_rate": 0.000287573848070995, + "loss": 0.032, "step": 16420 }, { - "epoch": 0.18, - "learning_rate": 0.0002733573328144256, - "loss": 0.0274, + "epoch": 0.08, + "learning_rate": 0.00028756628037798104, + "loss": 0.0331, "step": 16430 }, { - "epoch": 0.18, - "learning_rate": 0.0002733411169488227, - "loss": 0.0263, + "epoch": 0.08, + "learning_rate": 0.000287558712684967, + "loss": 0.0354, "step": 16440 }, { - "epoch": 0.18, - "learning_rate": 0.0002733249010832198, - "loss": 0.0297, + "epoch": 0.08, + "learning_rate": 0.000287551144991953, + "loss": 0.0395, "step": 16450 }, { - "epoch": 0.18, - "learning_rate": 0.0002733086852176169, - "loss": 0.0244, + "epoch": 0.08, + "learning_rate": 0.000287543577298939, + "loss": 0.0339, "step": 16460 }, { - "epoch": 0.18, - "learning_rate": 0.00027329246935201397, - "loss": 0.0282, + "epoch": 0.08, + "learning_rate": 0.00028753600960592496, + "loss": 0.0355, "step": 16470 }, { - "epoch": 0.18, - "learning_rate": 0.0002732762534864111, - "loss": 0.0302, + "epoch": 0.08, + "learning_rate": 0.00028752844191291094, + "loss": 0.0343, "step": 16480 }, { - "epoch": 0.18, - "learning_rate": 0.00027326003762080816, - "loss": 0.0302, + "epoch": 0.08, + "learning_rate": 0.000287520874219897, + "loss": 0.0391, "step": 16490 }, { - "epoch": 0.18, - "learning_rate": 0.0002732438217552053, - "loss": 0.0384, + "epoch": 0.08, + "learning_rate": 0.00028751330652688296, + "loss": 0.0339, "step": 16500 }, { - "epoch": 0.18, - "learning_rate": 0.00027322760588960234, - "loss": 0.0252, + "epoch": 0.08, + "learning_rate": 0.00028750573883386894, + "loss": 0.0301, "step": 16510 }, { - "epoch": 0.18, - "learning_rate": 0.00027321139002399946, - "loss": 0.0272, + "epoch": 0.08, + "learning_rate": 0.0002874981711408549, + "loss": 0.0293, "step": 16520 }, { - "epoch": 0.18, - "learning_rate": 0.00027319517415839653, - "loss": 0.0322, + "epoch": 0.08, + "learning_rate": 0.0002874906034478409, + "loss": 0.03, "step": 16530 }, { - "epoch": 0.18, - "learning_rate": 0.00027317895829279365, - "loss": 0.0287, + "epoch": 0.08, + "learning_rate": 0.0002874830357548269, + "loss": 0.0332, "step": 16540 }, { - "epoch": 0.18, - "learning_rate": 0.0002731627424271907, - "loss": 0.0313, + "epoch": 0.08, + "learning_rate": 0.0002874754680618129, + "loss": 0.033, "step": 16550 }, { - "epoch": 0.18, - "learning_rate": 0.00027314652656158783, - "loss": 0.0275, + "epoch": 0.08, + "learning_rate": 0.0002874679003687989, + "loss": 0.0313, "step": 16560 }, { - "epoch": 0.18, - "learning_rate": 0.00027313031069598495, - "loss": 0.0295, + "epoch": 0.08, + "learning_rate": 0.0002874603326757849, + "loss": 0.0316, "step": 16570 }, { - "epoch": 0.18, - "learning_rate": 0.000273114094830382, - "loss": 0.0264, + "epoch": 0.08, + "learning_rate": 0.00028745276498277087, + "loss": 0.0291, "step": 16580 }, { - "epoch": 0.18, - "learning_rate": 0.00027309787896477914, - "loss": 0.0277, + "epoch": 0.08, + "learning_rate": 0.00028744519728975685, + "loss": 0.0332, "step": 16590 }, { - "epoch": 0.18, - "learning_rate": 0.0002730816630991762, - "loss": 0.0264, + "epoch": 0.08, + "learning_rate": 0.00028743762959674283, + "loss": 0.03, "step": 16600 }, { - "epoch": 0.18, - "learning_rate": 0.0002730654472335733, - "loss": 0.0329, + "epoch": 0.08, + "learning_rate": 0.0002874300619037288, + "loss": 0.0315, "step": 16610 }, { - "epoch": 0.18, - "learning_rate": 0.0002730492313679704, - "loss": 0.031, + "epoch": 0.08, + "learning_rate": 0.00028742249421071485, + "loss": 0.0341, "step": 16620 }, { - "epoch": 0.18, - "learning_rate": 0.0002730330155023675, - "loss": 0.0309, + "epoch": 0.08, + "learning_rate": 0.00028741492651770083, + "loss": 0.0323, "step": 16630 }, { - "epoch": 0.18, - "learning_rate": 0.0002730167996367646, - "loss": 0.0347, + "epoch": 0.08, + "learning_rate": 0.0002874073588246868, + "loss": 0.0294, "step": 16640 }, { - "epoch": 0.18, - "learning_rate": 0.0002730005837711617, - "loss": 0.0328, + "epoch": 0.08, + "learning_rate": 0.0002873997911316728, + "loss": 0.0272, "step": 16650 }, { - "epoch": 0.18, - "learning_rate": 0.00027298436790555876, - "loss": 0.0301, + "epoch": 0.08, + "learning_rate": 0.00028739222343865877, + "loss": 0.0345, "step": 16660 }, { - "epoch": 0.18, - "learning_rate": 0.0002729681520399559, - "loss": 0.0338, + "epoch": 0.08, + "learning_rate": 0.00028738465574564475, + "loss": 0.0328, "step": 16670 }, { - "epoch": 0.18, - "learning_rate": 0.00027295193617435295, - "loss": 0.0308, + "epoch": 0.08, + "learning_rate": 0.0002873770880526308, + "loss": 0.0294, "step": 16680 }, { - "epoch": 0.18, - "learning_rate": 0.00027293572030875007, - "loss": 0.0322, + "epoch": 0.08, + "learning_rate": 0.00028736952035961677, + "loss": 0.0301, "step": 16690 }, { - "epoch": 0.18, - "learning_rate": 0.00027291950444314713, - "loss": 0.0375, + "epoch": 0.08, + "learning_rate": 0.00028736195266660275, + "loss": 0.0301, "step": 16700 }, { - "epoch": 0.18, - "learning_rate": 0.00027290328857754425, - "loss": 0.0334, + "epoch": 0.08, + "learning_rate": 0.00028735438497358873, + "loss": 0.0299, "step": 16710 }, { - "epoch": 0.18, - "learning_rate": 0.00027288707271194137, - "loss": 0.0394, + "epoch": 0.08, + "learning_rate": 0.0002873468172805747, + "loss": 0.0355, "step": 16720 }, { - "epoch": 0.18, - "learning_rate": 0.00027287085684633844, - "loss": 0.0323, + "epoch": 0.08, + "learning_rate": 0.0002873392495875607, + "loss": 0.0324, "step": 16730 }, { - "epoch": 0.18, - "learning_rate": 0.0002728546409807355, - "loss": 0.0281, + "epoch": 0.08, + "learning_rate": 0.00028733168189454673, + "loss": 0.0323, "step": 16740 }, { - "epoch": 0.18, - "learning_rate": 0.0002728384251151326, - "loss": 0.036, + "epoch": 0.08, + "learning_rate": 0.0002873241142015327, + "loss": 0.0399, "step": 16750 }, { - "epoch": 0.18, - "learning_rate": 0.00027282220924952974, - "loss": 0.033, + "epoch": 0.08, + "learning_rate": 0.0002873165465085187, + "loss": 0.034, "step": 16760 }, { - "epoch": 0.18, - "learning_rate": 0.0002728059933839268, - "loss": 0.0298, + "epoch": 0.08, + "learning_rate": 0.0002873089788155047, + "loss": 0.036, "step": 16770 }, { - "epoch": 0.18, - "learning_rate": 0.0002727897775183239, - "loss": 0.0264, + "epoch": 0.08, + "learning_rate": 0.00028730141112249066, + "loss": 0.0351, "step": 16780 }, { - "epoch": 0.18, - "learning_rate": 0.000272773561652721, - "loss": 0.0288, + "epoch": 0.08, + "learning_rate": 0.00028729384342947664, + "loss": 0.033, "step": 16790 }, { - "epoch": 0.18, - "learning_rate": 0.0002727573457871181, - "loss": 0.034, + "epoch": 0.08, + "learning_rate": 0.0002872862757364626, + "loss": 0.0324, "step": 16800 }, { - "epoch": 0.18, - "learning_rate": 0.0002727411299215152, - "loss": 0.0326, + "epoch": 0.08, + "learning_rate": 0.00028727870804344866, + "loss": 0.0323, "step": 16810 }, { - "epoch": 0.18, - "learning_rate": 0.00027272491405591225, - "loss": 0.0315, + "epoch": 0.08, + "learning_rate": 0.00028727114035043464, + "loss": 0.0301, "step": 16820 }, { - "epoch": 0.18, - "learning_rate": 0.00027270869819030936, - "loss": 0.0299, + "epoch": 0.08, + "learning_rate": 0.0002872635726574206, + "loss": 0.0378, "step": 16830 }, { - "epoch": 0.18, - "learning_rate": 0.0002726924823247065, - "loss": 0.0281, + "epoch": 0.08, + "learning_rate": 0.0002872560049644066, + "loss": 0.0318, "step": 16840 }, { - "epoch": 0.18, - "learning_rate": 0.00027267626645910355, - "loss": 0.0285, + "epoch": 0.09, + "learning_rate": 0.0002872484372713926, + "loss": 0.0299, "step": 16850 }, { - "epoch": 0.18, - "learning_rate": 0.00027266005059350067, - "loss": 0.0273, + "epoch": 0.09, + "learning_rate": 0.00028724086957837856, + "loss": 0.0302, "step": 16860 }, { - "epoch": 0.18, - "learning_rate": 0.00027264383472789774, - "loss": 0.0305, + "epoch": 0.09, + "learning_rate": 0.0002872333018853646, + "loss": 0.0349, "step": 16870 }, { - "epoch": 0.18, - "learning_rate": 0.00027262761886229486, - "loss": 0.0282, + "epoch": 0.09, + "learning_rate": 0.0002872257341923506, + "loss": 0.0315, "step": 16880 }, { - "epoch": 0.18, - "learning_rate": 0.000272611402996692, - "loss": 0.0279, + "epoch": 0.09, + "learning_rate": 0.00028721816649933656, + "loss": 0.0354, "step": 16890 }, { - "epoch": 0.18, - "learning_rate": 0.00027259518713108904, - "loss": 0.0337, + "epoch": 0.09, + "learning_rate": 0.00028721059880632254, + "loss": 0.0333, "step": 16900 }, { - "epoch": 0.18, - "learning_rate": 0.0002725789712654861, - "loss": 0.0309, + "epoch": 0.09, + "learning_rate": 0.0002872030311133085, + "loss": 0.0322, "step": 16910 }, { - "epoch": 0.18, - "learning_rate": 0.0002725627553998832, - "loss": 0.0318, + "epoch": 0.09, + "learning_rate": 0.0002871954634202945, + "loss": 0.0345, "step": 16920 }, { - "epoch": 0.18, - "learning_rate": 0.00027254653953428035, - "loss": 0.0355, + "epoch": 0.09, + "learning_rate": 0.0002871878957272805, + "loss": 0.0307, "step": 16930 }, { - "epoch": 0.18, - "learning_rate": 0.0002725303236686774, - "loss": 0.0271, + "epoch": 0.09, + "learning_rate": 0.0002871803280342665, + "loss": 0.032, "step": 16940 }, { - "epoch": 0.18, - "learning_rate": 0.0002725141078030745, - "loss": 0.0278, + "epoch": 0.09, + "learning_rate": 0.0002871727603412525, + "loss": 0.0293, "step": 16950 }, { - "epoch": 0.18, - "learning_rate": 0.0002724978919374716, - "loss": 0.0326, + "epoch": 0.09, + "learning_rate": 0.0002871651926482385, + "loss": 0.0304, "step": 16960 }, { - "epoch": 0.18, - "learning_rate": 0.0002724816760718687, - "loss": 0.0257, + "epoch": 0.09, + "learning_rate": 0.00028715762495522447, + "loss": 0.0278, "step": 16970 }, { - "epoch": 0.18, - "learning_rate": 0.0002724654602062658, - "loss": 0.0303, + "epoch": 0.09, + "learning_rate": 0.00028715005726221045, + "loss": 0.0296, "step": 16980 }, { - "epoch": 0.18, - "learning_rate": 0.00027244924434066285, - "loss": 0.0271, + "epoch": 0.09, + "learning_rate": 0.00028714248956919643, + "loss": 0.0333, "step": 16990 }, { - "epoch": 0.18, - "learning_rate": 0.00027243302847505997, - "loss": 0.0295, + "epoch": 0.09, + "learning_rate": 0.0002871349218761824, + "loss": 0.0302, "step": 17000 }, { - "epoch": 0.18, - "eval_cer": 0.9216494075259235, - "eval_loss": 0.021790610626339912, - "eval_runtime": 120.0679, - "eval_samples_per_second": 16.657, - "eval_steps_per_second": 4.164, + "epoch": 0.09, + "eval_cer": 0.9145527395738214, + "eval_loss": 0.023293539881706238, + "eval_runtime": 117.3978, + "eval_samples_per_second": 17.036, + "eval_steps_per_second": 4.259, "step": 17000 }, { - "epoch": 0.18, - "learning_rate": 0.0002724168126094571, - "loss": 0.0334, + "epoch": 0.09, + "learning_rate": 0.0002871273541831684, + "loss": 0.0279, "step": 17010 }, { - "epoch": 0.18, - "learning_rate": 0.00027240059674385415, - "loss": 0.0319, + "epoch": 0.09, + "learning_rate": 0.0002871197864901544, + "loss": 0.0322, "step": 17020 }, { - "epoch": 0.18, - "learning_rate": 0.0002723843808782513, - "loss": 0.0292, + "epoch": 0.09, + "learning_rate": 0.00028711221879714036, + "loss": 0.0283, "step": 17030 }, { - "epoch": 0.18, - "learning_rate": 0.00027236816501264834, - "loss": 0.0341, + "epoch": 0.09, + "learning_rate": 0.0002871046511041264, + "loss": 0.0282, "step": 17040 }, { - "epoch": 0.18, - "learning_rate": 0.00027235194914704546, - "loss": 0.0303, + "epoch": 0.09, + "learning_rate": 0.0002870970834111124, + "loss": 0.0307, "step": 17050 }, { - "epoch": 0.18, - "learning_rate": 0.0002723357332814425, - "loss": 0.0326, + "epoch": 0.09, + "learning_rate": 0.00028708951571809836, + "loss": 0.0334, "step": 17060 }, { - "epoch": 0.18, - "learning_rate": 0.00027231951741583964, - "loss": 0.0292, + "epoch": 0.09, + "learning_rate": 0.00028708194802508434, + "loss": 0.0319, "step": 17070 }, { - "epoch": 0.18, - "learning_rate": 0.0002723033015502367, - "loss": 0.0256, + "epoch": 0.09, + "learning_rate": 0.0002870743803320703, + "loss": 0.0328, "step": 17080 }, { - "epoch": 0.18, - "learning_rate": 0.00027228708568463383, - "loss": 0.0246, + "epoch": 0.09, + "learning_rate": 0.0002870668126390563, + "loss": 0.027, "step": 17090 }, { - "epoch": 0.18, - "learning_rate": 0.0002722708698190309, - "loss": 0.0276, + "epoch": 0.09, + "learning_rate": 0.00028705924494604234, + "loss": 0.0343, "step": 17100 }, { - "epoch": 0.18, - "learning_rate": 0.000272254653953428, - "loss": 0.0272, + "epoch": 0.09, + "learning_rate": 0.0002870516772530283, + "loss": 0.0314, "step": 17110 }, { - "epoch": 0.19, - "learning_rate": 0.0002722384380878251, - "loss": 0.0291, + "epoch": 0.09, + "learning_rate": 0.0002870441095600143, + "loss": 0.0286, "step": 17120 }, { - "epoch": 0.19, - "learning_rate": 0.0002722222222222222, - "loss": 0.0249, + "epoch": 0.09, + "learning_rate": 0.0002870365418670003, + "loss": 0.0317, "step": 17130 }, { - "epoch": 0.19, - "learning_rate": 0.00027220600635661927, - "loss": 0.0268, + "epoch": 0.09, + "learning_rate": 0.00028702897417398626, + "loss": 0.0329, "step": 17140 }, { - "epoch": 0.19, - "learning_rate": 0.0002721897904910164, - "loss": 0.0273, + "epoch": 0.09, + "learning_rate": 0.00028702140648097224, + "loss": 0.0308, "step": 17150 }, { - "epoch": 0.19, - "learning_rate": 0.0002721735746254135, - "loss": 0.029, + "epoch": 0.09, + "learning_rate": 0.0002870138387879582, + "loss": 0.0304, "step": 17160 }, { - "epoch": 0.19, - "learning_rate": 0.00027215735875981057, - "loss": 0.0338, + "epoch": 0.09, + "learning_rate": 0.00028700627109494426, + "loss": 0.0315, "step": 17170 }, { - "epoch": 0.19, - "learning_rate": 0.00027214114289420764, - "loss": 0.0339, + "epoch": 0.09, + "learning_rate": 0.00028699870340193024, + "loss": 0.0325, "step": 17180 }, { - "epoch": 0.19, - "learning_rate": 0.00027212492702860476, - "loss": 0.032, + "epoch": 0.09, + "learning_rate": 0.0002869911357089162, + "loss": 0.0328, "step": 17190 }, { - "epoch": 0.19, - "learning_rate": 0.0002721087111630019, - "loss": 0.0319, + "epoch": 0.09, + "learning_rate": 0.0002869835680159022, + "loss": 0.0369, "step": 17200 }, { - "epoch": 0.19, - "learning_rate": 0.00027209249529739894, - "loss": 0.0308, + "epoch": 0.09, + "learning_rate": 0.0002869760003228882, + "loss": 0.0303, "step": 17210 }, { - "epoch": 0.19, - "learning_rate": 0.000272076279431796, - "loss": 0.0342, + "epoch": 0.09, + "learning_rate": 0.00028696843262987417, + "loss": 0.0252, "step": 17220 }, { - "epoch": 0.19, - "learning_rate": 0.00027206006356619313, - "loss": 0.0278, + "epoch": 0.09, + "learning_rate": 0.0002869608649368602, + "loss": 0.0312, "step": 17230 }, { - "epoch": 0.19, - "learning_rate": 0.00027204384770059025, - "loss": 0.031, + "epoch": 0.09, + "learning_rate": 0.0002869532972438462, + "loss": 0.0317, "step": 17240 }, { - "epoch": 0.19, - "learning_rate": 0.0002720276318349873, - "loss": 0.0281, + "epoch": 0.09, + "learning_rate": 0.00028694572955083217, + "loss": 0.0286, "step": 17250 }, { - "epoch": 0.19, - "learning_rate": 0.0002720114159693844, - "loss": 0.0314, + "epoch": 0.09, + "learning_rate": 0.00028693816185781815, + "loss": 0.0246, "step": 17260 }, { - "epoch": 0.19, - "learning_rate": 0.0002719952001037815, - "loss": 0.0278, + "epoch": 0.09, + "learning_rate": 0.00028693059416480413, + "loss": 0.0347, "step": 17270 }, { - "epoch": 0.19, - "learning_rate": 0.0002719789842381786, - "loss": 0.0343, + "epoch": 0.09, + "learning_rate": 0.0002869230264717901, + "loss": 0.0277, "step": 17280 }, { - "epoch": 0.19, - "learning_rate": 0.0002719627683725757, - "loss": 0.0292, + "epoch": 0.09, + "learning_rate": 0.00028691545877877615, + "loss": 0.0274, "step": 17290 }, { - "epoch": 0.19, - "learning_rate": 0.0002719465525069728, - "loss": 0.0296, + "epoch": 0.09, + "learning_rate": 0.0002869078910857621, + "loss": 0.0322, "step": 17300 }, { - "epoch": 0.19, - "learning_rate": 0.00027193033664136987, + "epoch": 0.09, + "learning_rate": 0.0002869003233927481, "loss": 0.0295, "step": 17310 }, { - "epoch": 0.19, - "learning_rate": 0.000271914120775767, - "loss": 0.0279, + "epoch": 0.09, + "learning_rate": 0.0002868927556997341, + "loss": 0.0297, "step": 17320 }, { - "epoch": 0.19, - "learning_rate": 0.0002718979049101641, - "loss": 0.0334, + "epoch": 0.09, + "learning_rate": 0.00028688518800672007, + "loss": 0.0277, "step": 17330 }, { - "epoch": 0.19, - "learning_rate": 0.0002718816890445612, - "loss": 0.0357, + "epoch": 0.09, + "learning_rate": 0.00028687762031370605, + "loss": 0.0328, "step": 17340 }, { - "epoch": 0.19, - "learning_rate": 0.00027186547317895824, - "loss": 0.0301, + "epoch": 0.09, + "learning_rate": 0.00028687005262069203, + "loss": 0.0314, "step": 17350 }, { - "epoch": 0.19, - "learning_rate": 0.00027184925731335536, - "loss": 0.0285, + "epoch": 0.09, + "learning_rate": 0.00028686248492767807, + "loss": 0.0325, "step": 17360 }, { - "epoch": 0.19, - "learning_rate": 0.0002718330414477525, - "loss": 0.0282, + "epoch": 0.09, + "learning_rate": 0.00028685491723466405, + "loss": 0.0294, "step": 17370 }, { - "epoch": 0.19, - "learning_rate": 0.00027181682558214955, - "loss": 0.0299, + "epoch": 0.09, + "learning_rate": 0.00028684734954165003, + "loss": 0.0308, "step": 17380 }, { - "epoch": 0.19, - "learning_rate": 0.0002718006097165466, - "loss": 0.0262, + "epoch": 0.09, + "learning_rate": 0.000286839781848636, + "loss": 0.0306, "step": 17390 }, { - "epoch": 0.19, - "learning_rate": 0.00027178439385094373, - "loss": 0.0243, + "epoch": 0.09, + "learning_rate": 0.000286832214155622, + "loss": 0.0317, "step": 17400 }, { - "epoch": 0.19, - "learning_rate": 0.00027176817798534085, - "loss": 0.0284, + "epoch": 0.09, + "learning_rate": 0.000286824646462608, + "loss": 0.0297, "step": 17410 }, { - "epoch": 0.19, - "learning_rate": 0.0002717519621197379, - "loss": 0.0294, + "epoch": 0.09, + "learning_rate": 0.000286817078769594, + "loss": 0.0334, "step": 17420 }, { - "epoch": 0.19, - "learning_rate": 0.00027173574625413504, - "loss": 0.0262, + "epoch": 0.09, + "learning_rate": 0.00028680951107658, + "loss": 0.0304, "step": 17430 }, { - "epoch": 0.19, - "learning_rate": 0.0002717195303885321, - "loss": 0.0241, + "epoch": 0.09, + "learning_rate": 0.000286801943383566, + "loss": 0.0283, "step": 17440 }, { - "epoch": 0.19, - "learning_rate": 0.0002717033145229292, - "loss": 0.0274, + "epoch": 0.09, + "learning_rate": 0.00028679437569055196, + "loss": 0.032, "step": 17450 }, { - "epoch": 0.19, - "learning_rate": 0.00027168709865732634, - "loss": 0.034, + "epoch": 0.09, + "learning_rate": 0.00028678680799753794, + "loss": 0.0244, "step": 17460 }, { - "epoch": 0.19, - "learning_rate": 0.0002716708827917234, - "loss": 0.0303, + "epoch": 0.09, + "learning_rate": 0.0002867792403045239, + "loss": 0.0285, "step": 17470 }, { - "epoch": 0.19, - "learning_rate": 0.0002716546669261205, - "loss": 0.0311, + "epoch": 0.09, + "learning_rate": 0.00028677167261150996, + "loss": 0.0329, "step": 17480 }, { - "epoch": 0.19, - "learning_rate": 0.0002716384510605176, - "loss": 0.0303, + "epoch": 0.09, + "learning_rate": 0.00028676410491849594, + "loss": 0.034, "step": 17490 }, { - "epoch": 0.19, - "learning_rate": 0.0002716222351949147, - "loss": 0.0298, + "epoch": 0.09, + "learning_rate": 0.0002867565372254819, + "loss": 0.0267, "step": 17500 }, { - "epoch": 0.19, - "learning_rate": 0.0002716060193293118, - "loss": 0.0251, + "epoch": 0.09, + "learning_rate": 0.0002867489695324679, + "loss": 0.0285, "step": 17510 }, { - "epoch": 0.19, - "learning_rate": 0.00027158980346370885, - "loss": 0.0316, + "epoch": 0.09, + "learning_rate": 0.0002867414018394539, + "loss": 0.0289, "step": 17520 }, { - "epoch": 0.19, - "learning_rate": 0.00027157358759810597, - "loss": 0.0299, + "epoch": 0.09, + "learning_rate": 0.00028673383414643986, + "loss": 0.0278, "step": 17530 }, { - "epoch": 0.19, - "learning_rate": 0.0002715573717325031, - "loss": 0.0294, + "epoch": 0.09, + "learning_rate": 0.00028672626645342584, + "loss": 0.035, "step": 17540 }, { - "epoch": 0.19, - "learning_rate": 0.00027154115586690015, - "loss": 0.0302, + "epoch": 0.09, + "learning_rate": 0.0002867186987604119, + "loss": 0.0308, "step": 17550 }, { - "epoch": 0.19, - "learning_rate": 0.0002715249400012972, - "loss": 0.0296, + "epoch": 0.09, + "learning_rate": 0.00028671113106739786, + "loss": 0.0327, "step": 17560 }, { - "epoch": 0.19, - "learning_rate": 0.00027150872413569434, - "loss": 0.0295, + "epoch": 0.09, + "learning_rate": 0.00028670356337438384, + "loss": 0.0316, "step": 17570 }, { - "epoch": 0.19, - "learning_rate": 0.00027149250827009146, - "loss": 0.0317, + "epoch": 0.09, + "learning_rate": 0.0002866959956813698, + "loss": 0.0309, "step": 17580 }, { - "epoch": 0.19, - "learning_rate": 0.0002714762924044885, - "loss": 0.0344, + "epoch": 0.09, + "learning_rate": 0.0002866884279883558, + "loss": 0.0327, "step": 17590 }, { - "epoch": 0.19, - "learning_rate": 0.00027146007653888564, - "loss": 0.0359, + "epoch": 0.09, + "learning_rate": 0.0002866808602953418, + "loss": 0.0384, "step": 17600 }, { - "epoch": 0.19, - "learning_rate": 0.0002714438606732827, - "loss": 0.0316, + "epoch": 0.09, + "learning_rate": 0.0002866732926023278, + "loss": 0.0315, "step": 17610 }, { - "epoch": 0.19, - "learning_rate": 0.00027142764480767983, - "loss": 0.0295, + "epoch": 0.09, + "learning_rate": 0.0002866657249093138, + "loss": 0.0297, "step": 17620 }, { - "epoch": 0.19, - "learning_rate": 0.0002714114289420769, - "loss": 0.0304, + "epoch": 0.09, + "learning_rate": 0.0002866581572162998, + "loss": 0.0297, "step": 17630 }, { - "epoch": 0.19, - "learning_rate": 0.000271395213076474, - "loss": 0.0268, + "epoch": 0.09, + "learning_rate": 0.00028665058952328577, + "loss": 0.0306, "step": 17640 }, { - "epoch": 0.19, - "learning_rate": 0.0002713789972108711, - "loss": 0.0254, + "epoch": 0.09, + "learning_rate": 0.00028664302183027175, + "loss": 0.0346, "step": 17650 }, { - "epoch": 0.19, - "learning_rate": 0.0002713627813452682, - "loss": 0.0326, + "epoch": 0.09, + "learning_rate": 0.00028663545413725773, + "loss": 0.0285, "step": 17660 }, { - "epoch": 0.19, - "learning_rate": 0.00027134656547966526, - "loss": 0.0259, + "epoch": 0.09, + "learning_rate": 0.0002866278864442437, + "loss": 0.0316, "step": 17670 }, { - "epoch": 0.19, - "learning_rate": 0.0002713303496140624, - "loss": 0.025, + "epoch": 0.09, + "learning_rate": 0.00028662031875122975, + "loss": 0.0325, "step": 17680 }, { - "epoch": 0.19, - "learning_rate": 0.00027131413374845945, - "loss": 0.0314, + "epoch": 0.09, + "learning_rate": 0.00028661275105821573, + "loss": 0.0299, "step": 17690 }, { - "epoch": 0.19, - "learning_rate": 0.00027129791788285657, - "loss": 0.0261, + "epoch": 0.09, + "learning_rate": 0.0002866051833652017, + "loss": 0.0311, "step": 17700 }, { - "epoch": 0.19, - "learning_rate": 0.00027128170201725363, - "loss": 0.0258, + "epoch": 0.09, + "learning_rate": 0.0002865976156721877, + "loss": 0.0324, "step": 17710 }, { - "epoch": 0.19, - "learning_rate": 0.00027126548615165075, - "loss": 0.0327, + "epoch": 0.09, + "learning_rate": 0.00028659004797917367, + "loss": 0.0285, "step": 17720 }, { - "epoch": 0.19, - "learning_rate": 0.0002712492702860479, - "loss": 0.033, + "epoch": 0.09, + "learning_rate": 0.00028658248028615965, + "loss": 0.0352, "step": 17730 }, { - "epoch": 0.19, - "learning_rate": 0.00027123305442044494, - "loss": 0.0284, + "epoch": 0.09, + "learning_rate": 0.0002865749125931457, + "loss": 0.0326, "step": 17740 }, { - "epoch": 0.19, - "learning_rate": 0.000271216838554842, - "loss": 0.0336, + "epoch": 0.09, + "learning_rate": 0.00028656734490013167, + "loss": 0.0296, "step": 17750 }, { - "epoch": 0.19, - "learning_rate": 0.0002712006226892391, - "loss": 0.0324, + "epoch": 0.09, + "learning_rate": 0.00028655977720711765, + "loss": 0.0295, "step": 17760 }, { - "epoch": 0.19, - "learning_rate": 0.00027118440682363625, - "loss": 0.0343, + "epoch": 0.09, + "learning_rate": 0.00028655220951410363, + "loss": 0.0297, "step": 17770 }, { - "epoch": 0.19, - "learning_rate": 0.0002711681909580333, - "loss": 0.0284, + "epoch": 0.09, + "learning_rate": 0.0002865446418210896, + "loss": 0.0272, "step": 17780 }, { - "epoch": 0.19, - "learning_rate": 0.0002711519750924304, - "loss": 0.0307, + "epoch": 0.09, + "learning_rate": 0.0002865370741280756, + "loss": 0.0346, "step": 17790 }, { - "epoch": 0.19, - "learning_rate": 0.0002711357592268275, - "loss": 0.0303, + "epoch": 0.09, + "learning_rate": 0.00028652950643506163, + "loss": 0.0318, "step": 17800 }, { - "epoch": 0.19, - "learning_rate": 0.0002711195433612246, - "loss": 0.0314, + "epoch": 0.09, + "learning_rate": 0.0002865219387420476, + "loss": 0.0374, "step": 17810 }, { - "epoch": 0.19, - "learning_rate": 0.0002711033274956217, - "loss": 0.0289, + "epoch": 0.09, + "learning_rate": 0.0002865143710490336, + "loss": 0.0299, "step": 17820 }, { - "epoch": 0.19, - "learning_rate": 0.00027108711163001875, - "loss": 0.031, + "epoch": 0.09, + "learning_rate": 0.0002865068033560196, + "loss": 0.0341, "step": 17830 }, { - "epoch": 0.19, - "learning_rate": 0.00027107089576441587, - "loss": 0.0281, + "epoch": 0.09, + "learning_rate": 0.00028649923566300556, + "loss": 0.0345, "step": 17840 }, { - "epoch": 0.19, - "learning_rate": 0.000271054679898813, - "loss": 0.0289, + "epoch": 0.09, + "learning_rate": 0.00028649166796999154, + "loss": 0.0286, "step": 17850 }, { - "epoch": 0.19, - "learning_rate": 0.00027103846403321005, - "loss": 0.0322, + "epoch": 0.09, + "learning_rate": 0.0002864841002769775, + "loss": 0.0388, "step": 17860 }, { - "epoch": 0.19, - "learning_rate": 0.00027102224816760717, - "loss": 0.0311, + "epoch": 0.09, + "learning_rate": 0.00028647653258396356, + "loss": 0.0298, "step": 17870 }, { - "epoch": 0.19, - "learning_rate": 0.00027100603230200424, - "loss": 0.0267, + "epoch": 0.09, + "learning_rate": 0.00028646896489094954, + "loss": 0.0301, "step": 17880 }, { - "epoch": 0.19, - "learning_rate": 0.00027098981643640136, - "loss": 0.0296, + "epoch": 0.09, + "learning_rate": 0.0002864613971979355, + "loss": 0.0287, "step": 17890 }, { - "epoch": 0.19, - "learning_rate": 0.0002709736005707985, - "loss": 0.0268, + "epoch": 0.09, + "learning_rate": 0.0002864538295049215, + "loss": 0.0287, "step": 17900 }, { - "epoch": 0.19, - "learning_rate": 0.00027095738470519554, - "loss": 0.0301, + "epoch": 0.09, + "learning_rate": 0.0002864462618119075, + "loss": 0.0306, "step": 17910 }, { - "epoch": 0.19, - "learning_rate": 0.0002709411688395926, - "loss": 0.0321, + "epoch": 0.09, + "learning_rate": 0.00028643869411889346, + "loss": 0.035, "step": 17920 }, { - "epoch": 0.19, - "learning_rate": 0.00027092495297398973, - "loss": 0.0308, + "epoch": 0.09, + "learning_rate": 0.0002864311264258795, + "loss": 0.033, "step": 17930 }, { - "epoch": 0.19, - "learning_rate": 0.00027090873710838685, - "loss": 0.0323, + "epoch": 0.09, + "learning_rate": 0.0002864235587328655, + "loss": 0.0329, "step": 17940 }, { - "epoch": 0.19, - "learning_rate": 0.0002708925212427839, - "loss": 0.0281, + "epoch": 0.09, + "learning_rate": 0.00028641599103985146, + "loss": 0.0307, "step": 17950 }, { - "epoch": 0.19, - "learning_rate": 0.000270876305377181, - "loss": 0.0328, + "epoch": 0.09, + "learning_rate": 0.00028640842334683744, + "loss": 0.0367, "step": 17960 }, { - "epoch": 0.19, - "learning_rate": 0.0002708600895115781, - "loss": 0.0306, + "epoch": 0.09, + "learning_rate": 0.0002864008556538234, + "loss": 0.0327, "step": 17970 }, { - "epoch": 0.19, - "learning_rate": 0.0002708438736459752, - "loss": 0.0327, + "epoch": 0.09, + "learning_rate": 0.0002863932879608094, + "loss": 0.032, "step": 17980 }, { - "epoch": 0.19, - "learning_rate": 0.0002708276577803723, - "loss": 0.0224, + "epoch": 0.09, + "learning_rate": 0.00028638572026779544, + "loss": 0.0309, "step": 17990 }, { - "epoch": 0.19, - "learning_rate": 0.00027081144191476935, - "loss": 0.0262, + "epoch": 0.09, + "learning_rate": 0.0002863781525747814, + "loss": 0.03, "step": 18000 }, { - "epoch": 0.19, - "eval_cer": 0.921588605318977, - "eval_loss": 0.021395886316895485, - "eval_runtime": 120.389, - "eval_samples_per_second": 16.613, - "eval_steps_per_second": 4.153, + "epoch": 0.09, + "eval_cer": 0.9144838414489178, + "eval_loss": 0.022705839946866035, + "eval_runtime": 117.5421, + "eval_samples_per_second": 17.015, + "eval_steps_per_second": 4.254, "step": 18000 }, { - "epoch": 0.19, - "learning_rate": 0.00027079522604916647, - "loss": 0.0273, + "epoch": 0.09, + "learning_rate": 0.0002863705848817674, + "loss": 0.0372, "step": 18010 }, { - "epoch": 0.19, - "learning_rate": 0.0002707790101835636, - "loss": 0.0335, + "epoch": 0.09, + "learning_rate": 0.0002863630171887534, + "loss": 0.0282, "step": 18020 }, { - "epoch": 0.19, - "learning_rate": 0.0002707627943179607, - "loss": 0.0313, + "epoch": 0.09, + "learning_rate": 0.00028635544949573937, + "loss": 0.0285, "step": 18030 }, { - "epoch": 0.2, - "learning_rate": 0.0002707465784523578, - "loss": 0.0303, + "epoch": 0.09, + "learning_rate": 0.00028634788180272535, + "loss": 0.0286, "step": 18040 }, { - "epoch": 0.2, - "learning_rate": 0.00027073036258675484, - "loss": 0.0289, + "epoch": 0.09, + "learning_rate": 0.00028634031410971133, + "loss": 0.0281, "step": 18050 }, { - "epoch": 0.2, - "learning_rate": 0.00027071414672115196, - "loss": 0.0297, + "epoch": 0.09, + "learning_rate": 0.00028633274641669737, + "loss": 0.0328, "step": 18060 }, { - "epoch": 0.2, - "learning_rate": 0.0002706979308555491, - "loss": 0.0343, + "epoch": 0.09, + "learning_rate": 0.00028632517872368335, + "loss": 0.0322, "step": 18070 }, { - "epoch": 0.2, - "learning_rate": 0.00027068171498994615, - "loss": 0.0283, + "epoch": 0.09, + "learning_rate": 0.00028631761103066933, + "loss": 0.0291, "step": 18080 }, { - "epoch": 0.2, - "learning_rate": 0.0002706654991243432, - "loss": 0.0266, + "epoch": 0.09, + "learning_rate": 0.0002863100433376553, + "loss": 0.0304, "step": 18090 }, { - "epoch": 0.2, - "learning_rate": 0.00027064928325874033, - "loss": 0.0344, + "epoch": 0.09, + "learning_rate": 0.0002863024756446413, + "loss": 0.0311, "step": 18100 }, { - "epoch": 0.2, - "learning_rate": 0.00027063306739313745, - "loss": 0.0289, + "epoch": 0.09, + "learning_rate": 0.0002862949079516273, + "loss": 0.0275, "step": 18110 }, { - "epoch": 0.2, - "learning_rate": 0.0002706168515275345, - "loss": 0.0265, + "epoch": 0.09, + "learning_rate": 0.0002862873402586133, + "loss": 0.0325, "step": 18120 }, { - "epoch": 0.2, - "learning_rate": 0.0002706006356619316, - "loss": 0.0344, + "epoch": 0.09, + "learning_rate": 0.0002862797725655993, + "loss": 0.0323, "step": 18130 }, { - "epoch": 0.2, - "learning_rate": 0.0002705844197963287, - "loss": 0.029, + "epoch": 0.09, + "learning_rate": 0.00028627220487258527, + "loss": 0.0348, "step": 18140 }, { - "epoch": 0.2, - "learning_rate": 0.0002705682039307258, - "loss": 0.0281, + "epoch": 0.09, + "learning_rate": 0.00028626463717957125, + "loss": 0.0337, "step": 18150 }, { - "epoch": 0.2, - "learning_rate": 0.0002705519880651229, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.00028625706948655724, + "loss": 0.0313, "step": 18160 }, { - "epoch": 0.2, - "learning_rate": 0.00027053577219952, - "loss": 0.0273, + "epoch": 0.09, + "learning_rate": 0.0002862495017935432, + "loss": 0.039, "step": 18170 }, { - "epoch": 0.2, - "learning_rate": 0.0002705195563339171, - "loss": 0.0317, + "epoch": 0.09, + "learning_rate": 0.0002862419341005292, + "loss": 0.0294, "step": 18180 }, { - "epoch": 0.2, - "learning_rate": 0.0002705033404683142, - "loss": 0.0317, + "epoch": 0.09, + "learning_rate": 0.00028623436640751523, + "loss": 0.0348, "step": 18190 }, { - "epoch": 0.2, - "learning_rate": 0.00027048712460271126, - "loss": 0.0288, + "epoch": 0.09, + "learning_rate": 0.0002862267987145012, + "loss": 0.0318, "step": 18200 }, { - "epoch": 0.2, - "learning_rate": 0.0002704709087371084, - "loss": 0.0235, + "epoch": 0.09, + "learning_rate": 0.0002862192310214872, + "loss": 0.0327, "step": 18210 }, { - "epoch": 0.2, - "learning_rate": 0.00027045469287150545, - "loss": 0.0317, + "epoch": 0.09, + "learning_rate": 0.0002862116633284732, + "loss": 0.0282, "step": 18220 }, { - "epoch": 0.2, - "learning_rate": 0.00027043847700590257, - "loss": 0.0301, + "epoch": 0.09, + "learning_rate": 0.00028620409563545916, + "loss": 0.025, "step": 18230 }, { - "epoch": 0.2, - "learning_rate": 0.00027042226114029963, - "loss": 0.0313, + "epoch": 0.09, + "learning_rate": 0.00028619652794244514, + "loss": 0.0287, "step": 18240 }, { - "epoch": 0.2, - "learning_rate": 0.00027040604527469675, - "loss": 0.0273, + "epoch": 0.09, + "learning_rate": 0.0002861889602494311, + "loss": 0.0319, "step": 18250 }, { - "epoch": 0.2, - "learning_rate": 0.0002703898294090938, - "loss": 0.0238, + "epoch": 0.09, + "learning_rate": 0.0002861813925564171, + "loss": 0.0291, "step": 18260 }, { - "epoch": 0.2, - "learning_rate": 0.00027037361354349094, - "loss": 0.0262, + "epoch": 0.09, + "learning_rate": 0.0002861738248634031, + "loss": 0.0253, "step": 18270 }, { - "epoch": 0.2, - "learning_rate": 0.000270357397677888, - "loss": 0.0282, + "epoch": 0.09, + "learning_rate": 0.00028616625717038907, + "loss": 0.0311, "step": 18280 }, { - "epoch": 0.2, - "learning_rate": 0.0002703411818122851, - "loss": 0.0286, + "epoch": 0.09, + "learning_rate": 0.0002861586894773751, + "loss": 0.0287, "step": 18290 }, { - "epoch": 0.2, - "learning_rate": 0.0002703249659466822, - "loss": 0.0243, + "epoch": 0.09, + "learning_rate": 0.0002861511217843611, + "loss": 0.0257, "step": 18300 }, { - "epoch": 0.2, - "learning_rate": 0.0002703087500810793, - "loss": 0.0243, + "epoch": 0.09, + "learning_rate": 0.00028614355409134707, + "loss": 0.0315, "step": 18310 }, { - "epoch": 0.2, - "learning_rate": 0.0002702925342154764, - "loss": 0.0248, + "epoch": 0.09, + "learning_rate": 0.00028613598639833305, + "loss": 0.0318, "step": 18320 }, { - "epoch": 0.2, - "learning_rate": 0.0002702763183498735, - "loss": 0.0292, + "epoch": 0.09, + "learning_rate": 0.00028612841870531903, + "loss": 0.0262, "step": 18330 }, { - "epoch": 0.2, - "learning_rate": 0.0002702601024842706, - "loss": 0.0247, + "epoch": 0.09, + "learning_rate": 0.000286120851012305, + "loss": 0.0273, "step": 18340 }, { - "epoch": 0.2, - "learning_rate": 0.0002702438866186677, - "loss": 0.0278, + "epoch": 0.09, + "learning_rate": 0.00028611328331929105, + "loss": 0.0336, "step": 18350 }, { - "epoch": 0.2, - "learning_rate": 0.00027022767075306474, - "loss": 0.0287, + "epoch": 0.09, + "learning_rate": 0.000286105715626277, + "loss": 0.0279, "step": 18360 }, { - "epoch": 0.2, - "learning_rate": 0.00027021145488746186, - "loss": 0.03, + "epoch": 0.09, + "learning_rate": 0.000286098147933263, + "loss": 0.0287, "step": 18370 }, { - "epoch": 0.2, - "learning_rate": 0.000270195239021859, - "loss": 0.0285, + "epoch": 0.09, + "learning_rate": 0.000286090580240249, + "loss": 0.036, "step": 18380 }, { - "epoch": 0.2, - "learning_rate": 0.00027017902315625605, - "loss": 0.0234, + "epoch": 0.09, + "learning_rate": 0.00028608301254723497, + "loss": 0.0276, "step": 18390 }, { - "epoch": 0.2, - "learning_rate": 0.0002701628072906531, - "loss": 0.0266, + "epoch": 0.09, + "learning_rate": 0.00028607544485422095, + "loss": 0.0329, "step": 18400 }, { - "epoch": 0.2, - "learning_rate": 0.00027014659142505024, - "loss": 0.0294, + "epoch": 0.09, + "learning_rate": 0.00028606787716120693, + "loss": 0.0358, "step": 18410 }, { - "epoch": 0.2, - "learning_rate": 0.00027013037555944736, - "loss": 0.0313, + "epoch": 0.09, + "learning_rate": 0.00028606030946819297, + "loss": 0.0325, "step": 18420 }, { - "epoch": 0.2, - "learning_rate": 0.0002701141596938444, - "loss": 0.0285, + "epoch": 0.09, + "learning_rate": 0.00028605274177517895, + "loss": 0.0329, "step": 18430 }, { - "epoch": 0.2, - "learning_rate": 0.00027009794382824154, - "loss": 0.0252, + "epoch": 0.09, + "learning_rate": 0.00028604517408216493, + "loss": 0.0289, "step": 18440 }, { - "epoch": 0.2, - "learning_rate": 0.0002700817279626386, - "loss": 0.0297, + "epoch": 0.09, + "learning_rate": 0.0002860376063891509, + "loss": 0.0284, "step": 18450 }, { - "epoch": 0.2, - "learning_rate": 0.0002700655120970357, - "loss": 0.028, + "epoch": 0.09, + "learning_rate": 0.0002860300386961369, + "loss": 0.0318, "step": 18460 }, { - "epoch": 0.2, - "learning_rate": 0.00027004929623143285, - "loss": 0.0297, + "epoch": 0.09, + "learning_rate": 0.0002860224710031229, + "loss": 0.0249, "step": 18470 }, { - "epoch": 0.2, - "learning_rate": 0.0002700330803658299, - "loss": 0.0306, + "epoch": 0.09, + "learning_rate": 0.0002860149033101089, + "loss": 0.0263, "step": 18480 }, { - "epoch": 0.2, - "learning_rate": 0.000270016864500227, - "loss": 0.0242, + "epoch": 0.09, + "learning_rate": 0.0002860073356170949, + "loss": 0.0298, "step": 18490 }, { - "epoch": 0.2, - "learning_rate": 0.0002700006486346241, - "loss": 0.0296, + "epoch": 0.09, + "learning_rate": 0.0002859997679240809, + "loss": 0.0277, "step": 18500 }, { - "epoch": 0.2, - "learning_rate": 0.0002699844327690212, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.00028599220023106686, + "loss": 0.0284, "step": 18510 }, { - "epoch": 0.2, - "learning_rate": 0.0002699682169034183, - "loss": 0.0288, + "epoch": 0.09, + "learning_rate": 0.00028598463253805284, + "loss": 0.0301, "step": 18520 }, { - "epoch": 0.2, - "learning_rate": 0.00026995200103781535, - "loss": 0.0288, + "epoch": 0.09, + "learning_rate": 0.0002859770648450388, + "loss": 0.0301, "step": 18530 }, { - "epoch": 0.2, - "learning_rate": 0.00026993578517221247, - "loss": 0.0295, + "epoch": 0.09, + "learning_rate": 0.00028596949715202486, + "loss": 0.0339, "step": 18540 }, { - "epoch": 0.2, - "learning_rate": 0.0002699195693066096, - "loss": 0.0321, + "epoch": 0.09, + "learning_rate": 0.00028596192945901084, + "loss": 0.0324, "step": 18550 }, { - "epoch": 0.2, - "learning_rate": 0.00026990335344100665, - "loss": 0.0283, + "epoch": 0.09, + "learning_rate": 0.0002859543617659968, + "loss": 0.0304, "step": 18560 }, { - "epoch": 0.2, - "learning_rate": 0.0002698871375754037, - "loss": 0.0298, + "epoch": 0.09, + "learning_rate": 0.0002859467940729828, + "loss": 0.031, "step": 18570 }, { - "epoch": 0.2, - "learning_rate": 0.00026987092170980084, - "loss": 0.0317, + "epoch": 0.09, + "learning_rate": 0.0002859392263799688, + "loss": 0.0351, "step": 18580 }, { - "epoch": 0.2, - "learning_rate": 0.00026985470584419796, - "loss": 0.0253, + "epoch": 0.09, + "learning_rate": 0.00028593165868695476, + "loss": 0.0335, "step": 18590 }, { - "epoch": 0.2, - "learning_rate": 0.000269838489978595, - "loss": 0.0339, + "epoch": 0.09, + "learning_rate": 0.00028592409099394074, + "loss": 0.0335, "step": 18600 }, { - "epoch": 0.2, - "learning_rate": 0.00026982227411299214, - "loss": 0.0248, + "epoch": 0.09, + "learning_rate": 0.0002859165233009268, + "loss": 0.0265, "step": 18610 }, { - "epoch": 0.2, - "learning_rate": 0.0002698060582473892, - "loss": 0.0303, + "epoch": 0.09, + "learning_rate": 0.00028590895560791276, + "loss": 0.0344, "step": 18620 }, { - "epoch": 0.2, - "learning_rate": 0.00026978984238178633, - "loss": 0.0263, + "epoch": 0.09, + "learning_rate": 0.00028590138791489874, + "loss": 0.0333, "step": 18630 }, { - "epoch": 0.2, - "learning_rate": 0.0002697736265161834, - "loss": 0.0587, + "epoch": 0.09, + "learning_rate": 0.0002858938202218847, + "loss": 0.0277, "step": 18640 }, { - "epoch": 0.2, - "learning_rate": 0.0002697574106505805, - "loss": 0.0643, + "epoch": 0.09, + "learning_rate": 0.0002858862525288707, + "loss": 0.0324, "step": 18650 }, { - "epoch": 0.2, - "learning_rate": 0.0002697411947849776, - "loss": 0.0374, + "epoch": 0.09, + "learning_rate": 0.0002858786848358567, + "loss": 0.0307, "step": 18660 }, { - "epoch": 0.2, - "learning_rate": 0.0002697249789193747, - "loss": 0.0332, + "epoch": 0.09, + "learning_rate": 0.0002858711171428427, + "loss": 0.0319, "step": 18670 }, { - "epoch": 0.2, - "learning_rate": 0.00026970876305377177, - "loss": 0.0342, + "epoch": 0.09, + "learning_rate": 0.0002858635494498287, + "loss": 0.0381, "step": 18680 }, { - "epoch": 0.2, - "learning_rate": 0.0002696925471881689, - "loss": 0.0264, + "epoch": 0.09, + "learning_rate": 0.0002858559817568147, + "loss": 0.0307, "step": 18690 }, { - "epoch": 0.2, - "learning_rate": 0.00026967633132256595, - "loss": 0.0283, + "epoch": 0.09, + "learning_rate": 0.00028584841406380067, + "loss": 0.0364, "step": 18700 }, { - "epoch": 0.2, - "learning_rate": 0.00026966011545696307, - "loss": 0.0265, + "epoch": 0.09, + "learning_rate": 0.00028584084637078665, + "loss": 0.034, "step": 18710 }, { - "epoch": 0.2, - "learning_rate": 0.0002696438995913602, - "loss": 0.0361, + "epoch": 0.09, + "learning_rate": 0.00028583327867777263, + "loss": 0.0288, "step": 18720 }, { - "epoch": 0.2, - "learning_rate": 0.00026962768372575726, - "loss": 0.036, + "epoch": 0.09, + "learning_rate": 0.0002858257109847586, + "loss": 0.0339, "step": 18730 }, { - "epoch": 0.2, - "learning_rate": 0.0002696114678601544, - "loss": 0.0301, + "epoch": 0.09, + "learning_rate": 0.00028581814329174465, + "loss": 0.0319, "step": 18740 }, { - "epoch": 0.2, - "learning_rate": 0.00026959525199455144, - "loss": 0.0298, + "epoch": 0.09, + "learning_rate": 0.00028581057559873063, + "loss": 0.0273, "step": 18750 }, { - "epoch": 0.2, - "learning_rate": 0.00026957903612894856, - "loss": 0.0279, + "epoch": 0.09, + "learning_rate": 0.0002858030079057166, + "loss": 0.0301, "step": 18760 }, { - "epoch": 0.2, - "learning_rate": 0.00026956282026334563, - "loss": 0.0389, + "epoch": 0.09, + "learning_rate": 0.0002857954402127026, + "loss": 0.0277, "step": 18770 }, { - "epoch": 0.2, - "learning_rate": 0.00026954660439774275, - "loss": 0.0305, + "epoch": 0.09, + "learning_rate": 0.00028578787251968857, + "loss": 0.0278, "step": 18780 }, { - "epoch": 0.2, - "learning_rate": 0.0002695303885321398, - "loss": 0.0445, + "epoch": 0.09, + "learning_rate": 0.00028578030482667455, + "loss": 0.0277, "step": 18790 }, { - "epoch": 0.2, - "learning_rate": 0.00026951417266653693, - "loss": 0.0261, + "epoch": 0.09, + "learning_rate": 0.0002857727371336606, + "loss": 0.0293, "step": 18800 }, { - "epoch": 0.2, - "learning_rate": 0.000269497956800934, - "loss": 0.0324, + "epoch": 0.09, + "learning_rate": 0.00028576516944064657, + "loss": 0.029, "step": 18810 }, { - "epoch": 0.2, - "learning_rate": 0.0002694817409353311, - "loss": 0.0281, + "epoch": 0.09, + "learning_rate": 0.00028575760174763255, + "loss": 0.0273, "step": 18820 }, { - "epoch": 0.2, - "learning_rate": 0.0002694655250697282, - "loss": 0.0305, + "epoch": 0.09, + "learning_rate": 0.00028575003405461853, + "loss": 0.0286, "step": 18830 }, { - "epoch": 0.2, - "learning_rate": 0.0002694493092041253, - "loss": 0.0272, + "epoch": 0.1, + "learning_rate": 0.0002857424663616045, + "loss": 0.0345, "step": 18840 }, { - "epoch": 0.2, - "learning_rate": 0.00026943309333852237, - "loss": 0.0339, + "epoch": 0.1, + "learning_rate": 0.0002857348986685905, + "loss": 0.0305, "step": 18850 }, { - "epoch": 0.2, - "learning_rate": 0.0002694168774729195, - "loss": 0.0312, + "epoch": 0.1, + "learning_rate": 0.00028572733097557653, + "loss": 0.0274, "step": 18860 }, { - "epoch": 0.2, - "learning_rate": 0.00026940066160731656, - "loss": 0.0403, + "epoch": 0.1, + "learning_rate": 0.0002857197632825625, + "loss": 0.0319, "step": 18870 }, { - "epoch": 0.2, - "learning_rate": 0.0002693844457417137, - "loss": 0.0301, + "epoch": 0.1, + "learning_rate": 0.0002857121955895485, + "loss": 0.0284, "step": 18880 }, { - "epoch": 0.2, - "learning_rate": 0.00026936822987611074, - "loss": 0.0408, + "epoch": 0.1, + "learning_rate": 0.0002857046278965345, + "loss": 0.0303, "step": 18890 }, { - "epoch": 0.2, - "learning_rate": 0.00026935201401050786, - "loss": 0.0542, + "epoch": 0.1, + "learning_rate": 0.00028569706020352046, + "loss": 0.0354, "step": 18900 }, { - "epoch": 0.2, - "learning_rate": 0.000269335798144905, - "loss": 0.0271, + "epoch": 0.1, + "learning_rate": 0.00028568949251050644, + "loss": 0.0368, "step": 18910 }, { - "epoch": 0.2, - "learning_rate": 0.00026931958227930205, - "loss": 0.033, + "epoch": 0.1, + "learning_rate": 0.0002856819248174924, + "loss": 0.0355, "step": 18920 }, { - "epoch": 0.2, - "learning_rate": 0.0002693033664136991, - "loss": 0.0299, + "epoch": 0.1, + "learning_rate": 0.00028567435712447846, + "loss": 0.0382, "step": 18930 }, { - "epoch": 0.2, - "learning_rate": 0.00026928715054809623, - "loss": 0.0296, + "epoch": 0.1, + "learning_rate": 0.00028566678943146444, + "loss": 0.0309, "step": 18940 }, { - "epoch": 0.2, - "learning_rate": 0.00026927093468249335, - "loss": 0.027, + "epoch": 0.1, + "learning_rate": 0.0002856592217384504, + "loss": 0.0295, "step": 18950 }, { - "epoch": 0.2, - "learning_rate": 0.0002692547188168904, - "loss": 0.0291, + "epoch": 0.1, + "learning_rate": 0.0002856516540454364, + "loss": 0.0314, "step": 18960 }, { - "epoch": 0.21, - "learning_rate": 0.0002692385029512875, - "loss": 0.0305, + "epoch": 0.1, + "learning_rate": 0.0002856440863524224, + "loss": 0.033, "step": 18970 }, { - "epoch": 0.21, - "learning_rate": 0.0002692222870856846, - "loss": 0.0283, + "epoch": 0.1, + "learning_rate": 0.00028563651865940836, + "loss": 0.0307, "step": 18980 }, { - "epoch": 0.21, - "learning_rate": 0.0002692060712200817, - "loss": 0.0291, + "epoch": 0.1, + "learning_rate": 0.0002856289509663944, + "loss": 0.0315, "step": 18990 }, { - "epoch": 0.21, - "learning_rate": 0.0002691898553544788, - "loss": 0.0274, + "epoch": 0.1, + "learning_rate": 0.0002856213832733804, + "loss": 0.0316, "step": 19000 }, { - "epoch": 0.21, - "eval_cer": 0.9216233494372321, - "eval_loss": 0.022243507206439972, - "eval_runtime": 120.016, - "eval_samples_per_second": 16.664, - "eval_steps_per_second": 4.166, + "epoch": 0.1, + "eval_cer": 0.9144974269946735, + "eval_loss": 0.022285686805844307, + "eval_runtime": 117.4593, + "eval_samples_per_second": 17.027, + "eval_steps_per_second": 4.257, "step": 19000 }, { - "epoch": 0.21, - "learning_rate": 0.00026917363948887585, - "loss": 0.0291, + "epoch": 0.1, + "learning_rate": 0.00028561381558036636, + "loss": 0.0299, "step": 19010 }, { - "epoch": 0.21, - "learning_rate": 0.000269157423623273, - "loss": 0.0257, + "epoch": 0.1, + "learning_rate": 0.00028560624788735234, + "loss": 0.0285, "step": 19020 }, { - "epoch": 0.21, - "learning_rate": 0.0002691412077576701, - "loss": 0.0274, + "epoch": 0.1, + "learning_rate": 0.0002855986801943383, + "loss": 0.0294, "step": 19030 }, { - "epoch": 0.21, - "learning_rate": 0.0002691249918920672, - "loss": 0.0343, + "epoch": 0.1, + "learning_rate": 0.0002855911125013243, + "loss": 0.0314, "step": 19040 }, { - "epoch": 0.21, - "learning_rate": 0.0002691087760264643, - "loss": 0.03, + "epoch": 0.1, + "learning_rate": 0.00028558354480831034, + "loss": 0.0298, "step": 19050 }, { - "epoch": 0.21, - "learning_rate": 0.00026909256016086134, - "loss": 0.0305, + "epoch": 0.1, + "learning_rate": 0.0002855759771152963, + "loss": 0.0323, "step": 19060 }, { - "epoch": 0.21, - "learning_rate": 0.00026907634429525846, - "loss": 0.0292, + "epoch": 0.1, + "learning_rate": 0.0002855684094222823, + "loss": 0.031, "step": 19070 }, { - "epoch": 0.21, - "learning_rate": 0.0002690601284296556, - "loss": 0.0297, + "epoch": 0.1, + "learning_rate": 0.0002855608417292683, + "loss": 0.0292, "step": 19080 }, { - "epoch": 0.21, - "learning_rate": 0.00026904391256405265, - "loss": 0.031, + "epoch": 0.1, + "learning_rate": 0.00028555327403625427, + "loss": 0.0276, "step": 19090 }, { - "epoch": 0.21, - "learning_rate": 0.0002690276966984497, - "loss": 0.0278, + "epoch": 0.1, + "learning_rate": 0.00028554570634324025, + "loss": 0.0284, "step": 19100 }, { - "epoch": 0.21, - "learning_rate": 0.00026901148083284684, - "loss": 0.031, + "epoch": 0.1, + "learning_rate": 0.00028553813865022623, + "loss": 0.0268, "step": 19110 }, { - "epoch": 0.21, - "learning_rate": 0.00026899526496724396, - "loss": 0.0353, + "epoch": 0.1, + "learning_rate": 0.00028553057095721227, + "loss": 0.0259, "step": 19120 }, { - "epoch": 0.21, - "learning_rate": 0.000268979049101641, - "loss": 0.0246, + "epoch": 0.1, + "learning_rate": 0.00028552300326419825, + "loss": 0.0297, "step": 19130 }, { - "epoch": 0.21, - "learning_rate": 0.0002689628332360381, - "loss": 0.0328, + "epoch": 0.1, + "learning_rate": 0.00028551543557118423, + "loss": 0.0303, "step": 19140 }, { - "epoch": 0.21, - "learning_rate": 0.0002689466173704352, - "loss": 0.0299, + "epoch": 0.1, + "learning_rate": 0.0002855078678781702, + "loss": 0.0296, "step": 19150 }, { - "epoch": 0.21, - "learning_rate": 0.0002689304015048323, - "loss": 0.0296, + "epoch": 0.1, + "learning_rate": 0.0002855003001851562, + "loss": 0.028, "step": 19160 }, { - "epoch": 0.21, - "learning_rate": 0.0002689141856392294, - "loss": 0.0277, + "epoch": 0.1, + "learning_rate": 0.0002854927324921422, + "loss": 0.0298, "step": 19170 }, { - "epoch": 0.21, - "learning_rate": 0.0002688979697736265, - "loss": 0.0293, + "epoch": 0.1, + "learning_rate": 0.0002854851647991282, + "loss": 0.0316, "step": 19180 }, { - "epoch": 0.21, - "learning_rate": 0.0002688817539080236, - "loss": 0.0296, + "epoch": 0.1, + "learning_rate": 0.0002854775971061142, + "loss": 0.0261, "step": 19190 }, { - "epoch": 0.21, - "learning_rate": 0.0002688655380424207, - "loss": 0.0283, + "epoch": 0.1, + "learning_rate": 0.00028547002941310017, + "loss": 0.03, "step": 19200 }, { - "epoch": 0.21, - "learning_rate": 0.00026884932217681776, - "loss": 0.0287, + "epoch": 0.1, + "learning_rate": 0.00028546246172008615, + "loss": 0.035, "step": 19210 }, { - "epoch": 0.21, - "learning_rate": 0.0002688331063112149, - "loss": 0.0256, + "epoch": 0.1, + "learning_rate": 0.00028545489402707214, + "loss": 0.0365, "step": 19220 }, { - "epoch": 0.21, - "learning_rate": 0.00026881689044561195, - "loss": 0.0254, + "epoch": 0.1, + "learning_rate": 0.0002854473263340581, + "loss": 0.0318, "step": 19230 }, { - "epoch": 0.21, - "learning_rate": 0.00026880067458000907, - "loss": 0.0301, + "epoch": 0.1, + "learning_rate": 0.0002854397586410441, + "loss": 0.0317, "step": 19240 }, { - "epoch": 0.21, - "learning_rate": 0.00026878445871440613, - "loss": 0.0235, + "epoch": 0.1, + "learning_rate": 0.00028543219094803013, + "loss": 0.0303, "step": 19250 }, { - "epoch": 0.21, - "learning_rate": 0.00026876824284880325, - "loss": 0.029, + "epoch": 0.1, + "learning_rate": 0.0002854246232550161, + "loss": 0.0304, "step": 19260 }, { - "epoch": 0.21, - "learning_rate": 0.0002687520269832003, - "loss": 0.0294, + "epoch": 0.1, + "learning_rate": 0.0002854170555620021, + "loss": 0.0328, "step": 19270 }, { - "epoch": 0.21, - "learning_rate": 0.00026873581111759744, - "loss": 0.0298, + "epoch": 0.1, + "learning_rate": 0.0002854094878689881, + "loss": 0.0278, "step": 19280 }, { - "epoch": 0.21, - "learning_rate": 0.0002687195952519945, - "loss": 0.0276, + "epoch": 0.1, + "learning_rate": 0.00028540192017597406, + "loss": 0.0338, "step": 19290 }, { - "epoch": 0.21, - "learning_rate": 0.0002687033793863916, - "loss": 0.0253, + "epoch": 0.1, + "learning_rate": 0.00028539435248296004, + "loss": 0.0286, "step": 19300 }, { - "epoch": 0.21, - "learning_rate": 0.0002686871635207887, - "loss": 0.0269, + "epoch": 0.1, + "learning_rate": 0.0002853867847899461, + "loss": 0.0311, "step": 19310 }, { - "epoch": 0.21, - "learning_rate": 0.0002686709476551858, - "loss": 0.0346, + "epoch": 0.1, + "learning_rate": 0.00028537921709693206, + "loss": 0.0334, "step": 19320 }, { - "epoch": 0.21, - "learning_rate": 0.0002686547317895829, - "loss": 0.0328, + "epoch": 0.1, + "learning_rate": 0.00028537164940391804, + "loss": 0.0312, "step": 19330 }, { - "epoch": 0.21, - "learning_rate": 0.00026863851592398, - "loss": 0.0235, + "epoch": 0.1, + "learning_rate": 0.000285364081710904, + "loss": 0.03, "step": 19340 }, { - "epoch": 0.21, - "learning_rate": 0.0002686223000583771, - "loss": 0.0267, + "epoch": 0.1, + "learning_rate": 0.00028535651401789, + "loss": 0.0294, "step": 19350 }, { - "epoch": 0.21, - "learning_rate": 0.0002686060841927742, - "loss": 0.0253, + "epoch": 0.1, + "learning_rate": 0.000285348946324876, + "loss": 0.027, "step": 19360 }, { - "epoch": 0.21, - "learning_rate": 0.00026858986832717125, - "loss": 0.0265, + "epoch": 0.1, + "learning_rate": 0.000285341378631862, + "loss": 0.0306, "step": 19370 }, { - "epoch": 0.21, - "learning_rate": 0.00026857365246156837, - "loss": 0.0257, + "epoch": 0.1, + "learning_rate": 0.000285333810938848, + "loss": 0.0287, "step": 19380 }, { - "epoch": 0.21, - "learning_rate": 0.0002685574365959655, - "loss": 0.0284, + "epoch": 0.1, + "learning_rate": 0.000285326243245834, + "loss": 0.0291, "step": 19390 }, { - "epoch": 0.21, - "learning_rate": 0.00026854122073036255, - "loss": 0.0307, + "epoch": 0.1, + "learning_rate": 0.00028531867555281996, + "loss": 0.0293, "step": 19400 }, { - "epoch": 0.21, - "learning_rate": 0.0002685250048647596, - "loss": 0.0284, + "epoch": 0.1, + "learning_rate": 0.00028531110785980595, + "loss": 0.0271, "step": 19410 }, { - "epoch": 0.21, - "learning_rate": 0.00026850878899915674, - "loss": 0.0336, + "epoch": 0.1, + "learning_rate": 0.0002853035401667919, + "loss": 0.0244, "step": 19420 }, { - "epoch": 0.21, - "learning_rate": 0.00026849257313355386, - "loss": 0.0304, + "epoch": 0.1, + "learning_rate": 0.0002852959724737779, + "loss": 0.026, "step": 19430 }, { - "epoch": 0.21, - "learning_rate": 0.0002684763572679509, - "loss": 0.0242, + "epoch": 0.1, + "learning_rate": 0.00028528840478076394, + "loss": 0.0297, "step": 19440 }, { - "epoch": 0.21, - "learning_rate": 0.00026846014140234804, - "loss": 0.0359, + "epoch": 0.1, + "learning_rate": 0.0002852808370877499, + "loss": 0.0319, "step": 19450 }, { - "epoch": 0.21, - "learning_rate": 0.0002684439255367451, - "loss": 0.0265, + "epoch": 0.1, + "learning_rate": 0.0002852732693947359, + "loss": 0.0329, "step": 19460 }, { - "epoch": 0.21, - "learning_rate": 0.00026842770967114223, - "loss": 0.0265, + "epoch": 0.1, + "learning_rate": 0.0002852657017017219, + "loss": 0.027, "step": 19470 }, { - "epoch": 0.21, - "learning_rate": 0.00026841149380553935, - "loss": 0.0276, + "epoch": 0.1, + "learning_rate": 0.00028525813400870787, + "loss": 0.0247, "step": 19480 }, { - "epoch": 0.21, - "learning_rate": 0.0002683952779399364, - "loss": 0.0267, + "epoch": 0.1, + "learning_rate": 0.00028525056631569385, + "loss": 0.0297, "step": 19490 }, { - "epoch": 0.21, - "learning_rate": 0.0002683790620743335, - "loss": 0.0272, + "epoch": 0.1, + "learning_rate": 0.00028524299862267983, + "loss": 0.0291, "step": 19500 }, { - "epoch": 0.21, - "learning_rate": 0.0002683628462087306, - "loss": 0.0261, + "epoch": 0.1, + "learning_rate": 0.0002852354309296658, + "loss": 0.0279, "step": 19510 }, { - "epoch": 0.21, - "learning_rate": 0.0002683466303431277, - "loss": 0.028, + "epoch": 0.1, + "learning_rate": 0.0002852278632366518, + "loss": 0.0299, "step": 19520 }, { - "epoch": 0.21, - "learning_rate": 0.0002683304144775248, - "loss": 0.0232, + "epoch": 0.1, + "learning_rate": 0.0002852202955436378, + "loss": 0.0304, "step": 19530 }, { - "epoch": 0.21, - "learning_rate": 0.00026831419861192185, - "loss": 0.0276, + "epoch": 0.1, + "learning_rate": 0.0002852127278506238, + "loss": 0.0317, "step": 19540 }, { - "epoch": 0.21, - "learning_rate": 0.00026829798274631897, - "loss": 0.0282, + "epoch": 0.1, + "learning_rate": 0.0002852051601576098, + "loss": 0.0305, "step": 19550 }, { - "epoch": 0.21, - "learning_rate": 0.0002682817668807161, - "loss": 0.0262, + "epoch": 0.1, + "learning_rate": 0.0002851975924645958, + "loss": 0.027, "step": 19560 }, { - "epoch": 0.21, - "learning_rate": 0.00026826555101511316, - "loss": 0.0274, + "epoch": 0.1, + "learning_rate": 0.00028519002477158176, + "loss": 0.0297, "step": 19570 }, { - "epoch": 0.21, - "learning_rate": 0.0002682493351495102, + "epoch": 0.1, + "learning_rate": 0.00028518245707856774, "loss": 0.028, "step": 19580 }, { - "epoch": 0.21, - "learning_rate": 0.00026823311928390734, - "loss": 0.0279, + "epoch": 0.1, + "learning_rate": 0.0002851748893855537, + "loss": 0.028, "step": 19590 }, { - "epoch": 0.21, - "learning_rate": 0.00026821690341830446, - "loss": 0.0284, + "epoch": 0.1, + "learning_rate": 0.00028516732169253976, + "loss": 0.032, "step": 19600 }, { - "epoch": 0.21, - "learning_rate": 0.0002682006875527016, - "loss": 0.0255, + "epoch": 0.1, + "learning_rate": 0.00028515975399952574, + "loss": 0.0251, "step": 19610 }, { - "epoch": 0.21, - "learning_rate": 0.00026818447168709865, - "loss": 0.0294, + "epoch": 0.1, + "learning_rate": 0.0002851521863065117, + "loss": 0.0283, "step": 19620 }, { - "epoch": 0.21, - "learning_rate": 0.0002681682558214957, - "loss": 0.0328, + "epoch": 0.1, + "learning_rate": 0.0002851446186134977, + "loss": 0.0369, "step": 19630 }, { - "epoch": 0.21, - "learning_rate": 0.00026815203995589283, - "loss": 0.0333, + "epoch": 0.1, + "learning_rate": 0.0002851370509204837, + "loss": 0.0311, "step": 19640 }, { - "epoch": 0.21, - "learning_rate": 0.00026813582409028995, - "loss": 0.0305, + "epoch": 0.1, + "learning_rate": 0.00028512948322746966, + "loss": 0.0303, "step": 19650 }, { - "epoch": 0.21, - "learning_rate": 0.000268119608224687, - "loss": 0.0258, + "epoch": 0.1, + "learning_rate": 0.00028512191553445564, + "loss": 0.0286, "step": 19660 }, { - "epoch": 0.21, - "learning_rate": 0.0002681033923590841, - "loss": 0.0427, + "epoch": 0.1, + "learning_rate": 0.0002851143478414417, + "loss": 0.0365, "step": 19670 }, { - "epoch": 0.21, - "learning_rate": 0.0002680871764934812, - "loss": 0.0323, + "epoch": 0.1, + "learning_rate": 0.00028510678014842766, + "loss": 0.0292, "step": 19680 }, { - "epoch": 0.21, - "learning_rate": 0.0002680709606278783, - "loss": 0.0248, + "epoch": 0.1, + "learning_rate": 0.00028509921245541364, + "loss": 0.0282, "step": 19690 }, { - "epoch": 0.21, - "learning_rate": 0.0002680547447622754, - "loss": 0.0286, + "epoch": 0.1, + "learning_rate": 0.0002850916447623996, + "loss": 0.0279, "step": 19700 }, { - "epoch": 0.21, - "learning_rate": 0.00026803852889667245, - "loss": 0.024, + "epoch": 0.1, + "learning_rate": 0.0002850840770693856, + "loss": 0.0292, "step": 19710 }, { - "epoch": 0.21, - "learning_rate": 0.0002680223130310696, - "loss": 0.0279, + "epoch": 0.1, + "learning_rate": 0.0002850765093763716, + "loss": 0.0304, "step": 19720 }, { - "epoch": 0.21, - "learning_rate": 0.0002680060971654667, - "loss": 0.0254, + "epoch": 0.1, + "learning_rate": 0.0002850689416833576, + "loss": 0.0246, "step": 19730 }, { - "epoch": 0.21, - "learning_rate": 0.00026798988129986376, - "loss": 0.029, + "epoch": 0.1, + "learning_rate": 0.0002850613739903436, + "loss": 0.0289, "step": 19740 }, { - "epoch": 0.21, - "learning_rate": 0.0002679736654342609, - "loss": 0.0293, + "epoch": 0.1, + "learning_rate": 0.0002850538062973296, + "loss": 0.0257, "step": 19750 }, { - "epoch": 0.21, - "learning_rate": 0.00026795744956865795, - "loss": 0.0238, + "epoch": 0.1, + "learning_rate": 0.00028504623860431557, + "loss": 0.0324, "step": 19760 }, { - "epoch": 0.21, - "learning_rate": 0.00026794123370305507, - "loss": 0.0297, + "epoch": 0.1, + "learning_rate": 0.00028503867091130155, + "loss": 0.0291, "step": 19770 }, { - "epoch": 0.21, - "learning_rate": 0.00026792501783745213, - "loss": 0.0305, + "epoch": 0.1, + "learning_rate": 0.00028503110321828753, + "loss": 0.0306, "step": 19780 }, { - "epoch": 0.21, - "learning_rate": 0.00026790880197184925, - "loss": 0.0282, + "epoch": 0.1, + "learning_rate": 0.00028502353552527357, + "loss": 0.0287, "step": 19790 }, { - "epoch": 0.21, - "learning_rate": 0.0002678925861062463, - "loss": 0.0257, + "epoch": 0.1, + "learning_rate": 0.00028501596783225955, + "loss": 0.0239, "step": 19800 }, { - "epoch": 0.21, - "learning_rate": 0.00026787637024064344, - "loss": 0.0267, + "epoch": 0.1, + "learning_rate": 0.00028500840013924553, + "loss": 0.0271, "step": 19810 }, { - "epoch": 0.21, - "learning_rate": 0.0002678601543750405, - "loss": 0.0316, + "epoch": 0.1, + "learning_rate": 0.0002850008324462315, + "loss": 0.0309, "step": 19820 }, { - "epoch": 0.21, - "learning_rate": 0.0002678439385094376, - "loss": 0.0305, + "epoch": 0.1, + "learning_rate": 0.0002849932647532175, + "loss": 0.0273, "step": 19830 }, { - "epoch": 0.21, - "learning_rate": 0.0002678277226438347, - "loss": 0.0368, + "epoch": 0.1, + "learning_rate": 0.0002849856970602035, + "loss": 0.0309, "step": 19840 }, { - "epoch": 0.21, - "learning_rate": 0.0002678115067782318, - "loss": 0.0294, + "epoch": 0.1, + "learning_rate": 0.00028497812936718945, + "loss": 0.0265, "step": 19850 }, { - "epoch": 0.21, - "learning_rate": 0.00026779529091262887, - "loss": 0.0332, + "epoch": 0.1, + "learning_rate": 0.0002849705616741755, + "loss": 0.0284, "step": 19860 }, { - "epoch": 0.21, - "learning_rate": 0.000267779075047026, - "loss": 0.0253, + "epoch": 0.1, + "learning_rate": 0.00028496299398116147, + "loss": 0.0309, "step": 19870 }, { - "epoch": 0.21, - "learning_rate": 0.00026776285918142306, - "loss": 0.0275, + "epoch": 0.1, + "learning_rate": 0.00028495542628814745, + "loss": 0.0278, "step": 19880 }, { - "epoch": 0.22, - "learning_rate": 0.0002677466433158202, - "loss": 0.0289, + "epoch": 0.1, + "learning_rate": 0.00028494785859513343, + "loss": 0.0259, "step": 19890 }, { - "epoch": 0.22, - "learning_rate": 0.00026773042745021724, - "loss": 0.0245, + "epoch": 0.1, + "learning_rate": 0.0002849402909021194, + "loss": 0.0321, "step": 19900 }, { - "epoch": 0.22, - "learning_rate": 0.00026771421158461436, - "loss": 0.0255, + "epoch": 0.1, + "learning_rate": 0.0002849327232091054, + "loss": 0.0266, "step": 19910 }, { - "epoch": 0.22, - "learning_rate": 0.0002676979957190115, - "loss": 0.0305, + "epoch": 0.1, + "learning_rate": 0.00028492515551609143, + "loss": 0.0298, "step": 19920 }, { - "epoch": 0.22, - "learning_rate": 0.00026768177985340855, - "loss": 0.0281, + "epoch": 0.1, + "learning_rate": 0.0002849175878230774, + "loss": 0.0257, "step": 19930 }, { - "epoch": 0.22, - "learning_rate": 0.0002676655639878056, - "loss": 0.0294, + "epoch": 0.1, + "learning_rate": 0.0002849100201300634, + "loss": 0.0303, "step": 19940 }, { - "epoch": 0.22, - "learning_rate": 0.00026764934812220273, - "loss": 0.0317, + "epoch": 0.1, + "learning_rate": 0.0002849024524370494, + "loss": 0.0253, "step": 19950 }, { - "epoch": 0.22, - "learning_rate": 0.00026763313225659985, - "loss": 0.0255, + "epoch": 0.1, + "learning_rate": 0.00028489488474403536, + "loss": 0.0291, "step": 19960 }, { - "epoch": 0.22, - "learning_rate": 0.0002676169163909969, - "loss": 0.0508, + "epoch": 0.1, + "learning_rate": 0.00028488731705102134, + "loss": 0.0324, "step": 19970 }, { - "epoch": 0.22, - "learning_rate": 0.000267600700525394, - "loss": 0.0264, + "epoch": 0.1, + "learning_rate": 0.0002848797493580073, + "loss": 0.0314, "step": 19980 }, { - "epoch": 0.22, - "learning_rate": 0.0002675844846597911, - "loss": 0.0294, + "epoch": 0.1, + "learning_rate": 0.00028487218166499336, + "loss": 0.0295, "step": 19990 }, { - "epoch": 0.22, - "learning_rate": 0.0002675682687941882, - "loss": 0.0317, + "epoch": 0.1, + "learning_rate": 0.00028486461397197934, + "loss": 0.0302, "step": 20000 }, { - "epoch": 0.22, - "eval_cer": 0.9216077145840174, - "eval_loss": 0.02043878473341465, - "eval_runtime": 120.3911, - "eval_samples_per_second": 16.613, - "eval_steps_per_second": 4.153, + "epoch": 0.1, + "eval_cer": 0.9145546803660722, + "eval_loss": 0.023069359362125397, + "eval_runtime": 117.5456, + "eval_samples_per_second": 17.015, + "eval_steps_per_second": 4.254, "step": 20000 }, { - "epoch": 0.22, - "learning_rate": 0.0002675520529285853, - "loss": 0.0298, + "epoch": 0.1, + "learning_rate": 0.0002848570462789653, + "loss": 0.0283, "step": 20010 }, { - "epoch": 0.22, - "learning_rate": 0.00026753583706298236, - "loss": 0.0325, + "epoch": 0.1, + "learning_rate": 0.0002848494785859513, + "loss": 0.0321, "step": 20020 }, { - "epoch": 0.22, - "learning_rate": 0.0002675196211973795, - "loss": 0.0254, + "epoch": 0.1, + "learning_rate": 0.0002848419108929373, + "loss": 0.0329, "step": 20030 }, { - "epoch": 0.22, - "learning_rate": 0.0002675034053317766, - "loss": 0.0263, + "epoch": 0.1, + "learning_rate": 0.00028483434319992326, + "loss": 0.0282, "step": 20040 }, { - "epoch": 0.22, - "learning_rate": 0.0002674871894661737, - "loss": 0.0387, + "epoch": 0.1, + "learning_rate": 0.0002848267755069093, + "loss": 0.0307, "step": 20050 }, { - "epoch": 0.22, - "learning_rate": 0.0002674709736005708, - "loss": 0.0298, + "epoch": 0.1, + "learning_rate": 0.0002848192078138953, + "loss": 0.0305, "step": 20060 }, { - "epoch": 0.22, - "learning_rate": 0.00026745475773496785, - "loss": 0.0299, + "epoch": 0.1, + "learning_rate": 0.00028481164012088126, + "loss": 0.0291, "step": 20070 }, { - "epoch": 0.22, - "learning_rate": 0.00026743854186936497, - "loss": 0.031, + "epoch": 0.1, + "learning_rate": 0.00028480407242786724, + "loss": 0.0331, "step": 20080 }, { - "epoch": 0.22, - "learning_rate": 0.0002674223260037621, + "epoch": 0.1, + "learning_rate": 0.0002847965047348532, "loss": 0.0245, "step": 20090 }, { - "epoch": 0.22, - "learning_rate": 0.00026740611013815915, - "loss": 0.0261, + "epoch": 0.1, + "learning_rate": 0.0002847889370418392, + "loss": 0.0304, "step": 20100 }, { - "epoch": 0.22, - "learning_rate": 0.0002673898942725562, - "loss": 0.0246, + "epoch": 0.1, + "learning_rate": 0.00028478136934882524, + "loss": 0.0276, "step": 20110 }, { - "epoch": 0.22, - "learning_rate": 0.00026737367840695334, - "loss": 0.0301, + "epoch": 0.1, + "learning_rate": 0.0002847738016558112, + "loss": 0.023, "step": 20120 }, { - "epoch": 0.22, - "learning_rate": 0.00026735746254135046, - "loss": 0.0328, + "epoch": 0.1, + "learning_rate": 0.0002847662339627972, + "loss": 0.0354, "step": 20130 }, { - "epoch": 0.22, - "learning_rate": 0.0002673412466757475, - "loss": 0.0368, + "epoch": 0.1, + "learning_rate": 0.0002847586662697832, + "loss": 0.0302, "step": 20140 }, { - "epoch": 0.22, - "learning_rate": 0.0002673250308101446, - "loss": 0.029, + "epoch": 0.1, + "learning_rate": 0.00028475109857676917, + "loss": 0.0276, "step": 20150 }, { - "epoch": 0.22, - "learning_rate": 0.0002673088149445417, - "loss": 0.0261, + "epoch": 0.1, + "learning_rate": 0.00028474353088375515, + "loss": 0.0319, "step": 20160 }, { - "epoch": 0.22, - "learning_rate": 0.00026729259907893883, - "loss": 0.0297, + "epoch": 0.1, + "learning_rate": 0.00028473596319074113, + "loss": 0.0318, "step": 20170 }, { - "epoch": 0.22, - "learning_rate": 0.0002672763832133359, - "loss": 0.0257, + "epoch": 0.1, + "learning_rate": 0.00028472839549772717, + "loss": 0.0328, "step": 20180 }, { - "epoch": 0.22, - "learning_rate": 0.000267260167347733, - "loss": 0.0292, + "epoch": 0.1, + "learning_rate": 0.00028472082780471315, + "loss": 0.0325, "step": 20190 }, { - "epoch": 0.22, - "learning_rate": 0.0002672439514821301, - "loss": 0.0261, + "epoch": 0.1, + "learning_rate": 0.00028471326011169913, + "loss": 0.0266, "step": 20200 }, { - "epoch": 0.22, - "learning_rate": 0.0002672277356165272, - "loss": 0.0288, + "epoch": 0.1, + "learning_rate": 0.0002847056924186851, + "loss": 0.0299, "step": 20210 }, { - "epoch": 0.22, - "learning_rate": 0.0002672115197509243, - "loss": 0.0341, + "epoch": 0.1, + "learning_rate": 0.0002846981247256711, + "loss": 0.032, "step": 20220 }, { - "epoch": 0.22, - "learning_rate": 0.0002671953038853214, - "loss": 0.0311, + "epoch": 0.1, + "learning_rate": 0.0002846905570326571, + "loss": 0.0276, "step": 20230 }, { - "epoch": 0.22, - "learning_rate": 0.00026717908801971845, - "loss": 0.0314, + "epoch": 0.1, + "learning_rate": 0.0002846829893396431, + "loss": 0.0329, "step": 20240 }, { - "epoch": 0.22, - "learning_rate": 0.00026716287215411557, - "loss": 0.0449, + "epoch": 0.1, + "learning_rate": 0.0002846754216466291, + "loss": 0.034, "step": 20250 }, { - "epoch": 0.22, - "learning_rate": 0.0002671466562885127, - "loss": 0.0258, + "epoch": 0.1, + "learning_rate": 0.0002846678539536151, + "loss": 0.0277, "step": 20260 }, { - "epoch": 0.22, - "learning_rate": 0.00026713044042290976, - "loss": 0.0386, + "epoch": 0.1, + "learning_rate": 0.00028466028626060105, + "loss": 0.0356, "step": 20270 }, { - "epoch": 0.22, - "learning_rate": 0.0002671142245573068, - "loss": 0.0281, + "epoch": 0.1, + "learning_rate": 0.00028465271856758704, + "loss": 0.0342, "step": 20280 }, { - "epoch": 0.22, - "learning_rate": 0.00026709800869170394, - "loss": 0.0306, + "epoch": 0.1, + "learning_rate": 0.000284645150874573, + "loss": 0.0367, "step": 20290 }, { - "epoch": 0.22, - "learning_rate": 0.00026708179282610106, - "loss": 0.025, + "epoch": 0.1, + "learning_rate": 0.000284637583181559, + "loss": 0.0308, "step": 20300 }, { - "epoch": 0.22, - "learning_rate": 0.00026706557696049813, - "loss": 0.028, + "epoch": 0.1, + "learning_rate": 0.00028463001548854503, + "loss": 0.0358, "step": 20310 }, { - "epoch": 0.22, - "learning_rate": 0.0002670493610948952, - "loss": 0.0279, + "epoch": 0.1, + "learning_rate": 0.000284622447795531, + "loss": 0.0264, "step": 20320 }, { - "epoch": 0.22, - "learning_rate": 0.0002670331452292923, - "loss": 0.026, + "epoch": 0.1, + "learning_rate": 0.000284614880102517, + "loss": 0.0355, "step": 20330 }, { - "epoch": 0.22, - "learning_rate": 0.00026701692936368943, - "loss": 0.0238, + "epoch": 0.1, + "learning_rate": 0.000284607312409503, + "loss": 0.0305, "step": 20340 }, { - "epoch": 0.22, - "learning_rate": 0.0002670007134980865, - "loss": 0.0223, + "epoch": 0.1, + "learning_rate": 0.00028459974471648896, + "loss": 0.0311, "step": 20350 }, { - "epoch": 0.22, - "learning_rate": 0.0002669844976324836, - "loss": 0.0271, + "epoch": 0.1, + "learning_rate": 0.00028459217702347494, + "loss": 0.0282, "step": 20360 }, { - "epoch": 0.22, - "learning_rate": 0.0002669682817668807, - "loss": 0.0269, + "epoch": 0.1, + "learning_rate": 0.000284584609330461, + "loss": 0.0418, "step": 20370 }, { - "epoch": 0.22, - "learning_rate": 0.0002669520659012778, - "loss": 0.0323, + "epoch": 0.1, + "learning_rate": 0.00028457704163744696, + "loss": 0.0341, "step": 20380 }, { - "epoch": 0.22, - "learning_rate": 0.00026693585003567487, - "loss": 0.0266, + "epoch": 0.1, + "learning_rate": 0.00028456947394443294, + "loss": 0.0329, "step": 20390 }, { - "epoch": 0.22, - "learning_rate": 0.000266919634170072, - "loss": 0.0281, + "epoch": 0.1, + "learning_rate": 0.0002845619062514189, + "loss": 0.0361, "step": 20400 }, { - "epoch": 0.22, - "learning_rate": 0.00026690341830446905, - "loss": 0.0246, + "epoch": 0.1, + "learning_rate": 0.0002845543385584049, + "loss": 0.0252, "step": 20410 }, { - "epoch": 0.22, - "learning_rate": 0.0002668872024388662, - "loss": 0.0298, + "epoch": 0.1, + "learning_rate": 0.0002845467708653909, + "loss": 0.0322, "step": 20420 }, { - "epoch": 0.22, - "learning_rate": 0.00026687098657326324, - "loss": 0.0241, + "epoch": 0.1, + "learning_rate": 0.0002845392031723769, + "loss": 0.0348, "step": 20430 }, { - "epoch": 0.22, - "learning_rate": 0.00026685477070766036, - "loss": 0.0393, + "epoch": 0.1, + "learning_rate": 0.0002845316354793629, + "loss": 0.0338, "step": 20440 }, { - "epoch": 0.22, - "learning_rate": 0.0002668385548420574, - "loss": 0.0351, + "epoch": 0.1, + "learning_rate": 0.0002845240677863489, + "loss": 0.0335, "step": 20450 }, { - "epoch": 0.22, - "learning_rate": 0.00026682233897645455, - "loss": 0.0343, + "epoch": 0.1, + "learning_rate": 0.00028451650009333486, + "loss": 0.0374, "step": 20460 }, { - "epoch": 0.22, - "learning_rate": 0.0002668061231108516, - "loss": 0.0337, + "epoch": 0.1, + "learning_rate": 0.00028450893240032085, + "loss": 0.0308, "step": 20470 }, { - "epoch": 0.22, - "learning_rate": 0.00026678990724524873, - "loss": 0.0297, + "epoch": 0.1, + "learning_rate": 0.00028450136470730683, + "loss": 0.0306, "step": 20480 }, { - "epoch": 0.22, - "learning_rate": 0.00026677369137964585, - "loss": 0.0314, + "epoch": 0.1, + "learning_rate": 0.0002844937970142928, + "loss": 0.0352, "step": 20490 }, { - "epoch": 0.22, - "learning_rate": 0.0002667574755140429, - "loss": 0.0264, + "epoch": 0.1, + "learning_rate": 0.00028448622932127884, + "loss": 0.0332, "step": 20500 }, { - "epoch": 0.22, - "learning_rate": 0.00026674125964844, - "loss": 0.0279, + "epoch": 0.1, + "learning_rate": 0.0002844786616282648, + "loss": 0.0285, "step": 20510 }, { - "epoch": 0.22, - "learning_rate": 0.0002667250437828371, - "loss": 0.0329, + "epoch": 0.1, + "learning_rate": 0.0002844710939352508, + "loss": 0.0285, "step": 20520 }, { - "epoch": 0.22, - "learning_rate": 0.0002667088279172342, - "loss": 0.0273, + "epoch": 0.1, + "learning_rate": 0.0002844635262422368, + "loss": 0.0246, "step": 20530 }, { - "epoch": 0.22, - "learning_rate": 0.0002666926120516313, - "loss": 0.0347, + "epoch": 0.1, + "learning_rate": 0.00028445595854922277, + "loss": 0.0316, "step": 20540 }, { - "epoch": 0.22, - "learning_rate": 0.00026667639618602835, - "loss": 0.0327, + "epoch": 0.1, + "learning_rate": 0.00028444839085620875, + "loss": 0.0396, "step": 20550 }, { - "epoch": 0.22, - "learning_rate": 0.0002666601803204255, - "loss": 0.0309, + "epoch": 0.1, + "learning_rate": 0.0002844408231631948, + "loss": 0.0393, "step": 20560 }, { - "epoch": 0.22, - "learning_rate": 0.0002666439644548226, - "loss": 0.0256, + "epoch": 0.1, + "learning_rate": 0.00028443325547018077, + "loss": 0.0275, "step": 20570 }, { - "epoch": 0.22, - "learning_rate": 0.00026662774858921966, - "loss": 0.0309, + "epoch": 0.1, + "learning_rate": 0.00028442568777716675, + "loss": 0.0317, "step": 20580 }, { - "epoch": 0.22, - "learning_rate": 0.0002666115327236167, - "loss": 0.0315, + "epoch": 0.1, + "learning_rate": 0.00028441812008415273, + "loss": 0.0321, "step": 20590 }, { - "epoch": 0.22, - "learning_rate": 0.00026659531685801384, - "loss": 0.0257, + "epoch": 0.1, + "learning_rate": 0.0002844105523911387, + "loss": 0.0297, "step": 20600 }, { - "epoch": 0.22, - "learning_rate": 0.00026657910099241096, - "loss": 0.0237, + "epoch": 0.1, + "learning_rate": 0.0002844029846981247, + "loss": 0.0265, "step": 20610 }, { - "epoch": 0.22, - "learning_rate": 0.0002665628851268081, - "loss": 0.0279, + "epoch": 0.1, + "learning_rate": 0.00028439541700511073, + "loss": 0.0292, "step": 20620 }, { - "epoch": 0.22, - "learning_rate": 0.00026654666926120515, - "loss": 0.0245, + "epoch": 0.1, + "learning_rate": 0.0002843878493120967, + "loss": 0.031, "step": 20630 }, { - "epoch": 0.22, - "learning_rate": 0.0002665304533956022, - "loss": 0.0466, + "epoch": 0.1, + "learning_rate": 0.0002843802816190827, + "loss": 0.0291, "step": 20640 }, { - "epoch": 0.22, - "learning_rate": 0.00026651423752999933, - "loss": 0.0265, + "epoch": 0.1, + "learning_rate": 0.0002843727139260687, + "loss": 0.0292, "step": 20650 }, { - "epoch": 0.22, - "learning_rate": 0.00026649802166439645, - "loss": 0.026, + "epoch": 0.1, + "learning_rate": 0.00028436514623305466, + "loss": 0.0298, "step": 20660 }, { - "epoch": 0.22, - "learning_rate": 0.0002664818057987935, - "loss": 0.026, + "epoch": 0.1, + "learning_rate": 0.00028435757854004064, + "loss": 0.0309, "step": 20670 }, { - "epoch": 0.22, - "learning_rate": 0.0002664655899331906, - "loss": 0.0326, + "epoch": 0.1, + "learning_rate": 0.0002843500108470266, + "loss": 0.0288, "step": 20680 }, { - "epoch": 0.22, - "learning_rate": 0.0002664493740675877, - "loss": 0.0262, + "epoch": 0.1, + "learning_rate": 0.00028434244315401265, + "loss": 0.026, "step": 20690 }, { - "epoch": 0.22, - "learning_rate": 0.0002664331582019848, - "loss": 0.0243, + "epoch": 0.1, + "learning_rate": 0.00028433487546099864, + "loss": 0.0324, "step": 20700 }, { - "epoch": 0.22, - "learning_rate": 0.0002664169423363819, - "loss": 0.0278, + "epoch": 0.1, + "learning_rate": 0.0002843273077679846, + "loss": 0.027, "step": 20710 }, { - "epoch": 0.22, - "learning_rate": 0.00026640072647077896, - "loss": 0.0297, + "epoch": 0.1, + "learning_rate": 0.0002843197400749706, + "loss": 0.0312, "step": 20720 }, { - "epoch": 0.22, - "learning_rate": 0.0002663845106051761, - "loss": 0.0281, + "epoch": 0.1, + "learning_rate": 0.0002843121723819566, + "loss": 0.0291, "step": 20730 }, { - "epoch": 0.22, - "learning_rate": 0.0002663682947395732, - "loss": 0.0271, + "epoch": 0.1, + "learning_rate": 0.00028430460468894256, + "loss": 0.0281, "step": 20740 }, { - "epoch": 0.22, - "learning_rate": 0.00026635207887397026, - "loss": 0.0273, + "epoch": 0.1, + "learning_rate": 0.00028429703699592854, + "loss": 0.0328, "step": 20750 }, { - "epoch": 0.22, - "learning_rate": 0.0002663358630083674, - "loss": 0.0252, + "epoch": 0.1, + "learning_rate": 0.0002842894693029145, + "loss": 0.0289, "step": 20760 }, { - "epoch": 0.22, - "learning_rate": 0.00026631964714276445, - "loss": 0.0302, + "epoch": 0.1, + "learning_rate": 0.0002842819016099005, + "loss": 0.0331, "step": 20770 }, { - "epoch": 0.22, - "learning_rate": 0.00026630343127716157, - "loss": 0.0284, + "epoch": 0.1, + "learning_rate": 0.0002842743339168865, + "loss": 0.0302, "step": 20780 }, { - "epoch": 0.22, - "learning_rate": 0.00026628721541155863, - "loss": 0.0265, + "epoch": 0.1, + "learning_rate": 0.0002842667662238725, + "loss": 0.0316, "step": 20790 }, { - "epoch": 0.22, - "learning_rate": 0.00026627099954595575, - "loss": 0.0278, + "epoch": 0.1, + "learning_rate": 0.0002842591985308585, + "loss": 0.0358, "step": 20800 }, { - "epoch": 0.22, - "learning_rate": 0.0002662547836803528, - "loss": 0.0279, + "epoch": 0.1, + "learning_rate": 0.0002842516308378445, + "loss": 0.03, "step": 20810 }, { - "epoch": 0.23, - "learning_rate": 0.00026623856781474994, - "loss": 0.0279, + "epoch": 0.11, + "learning_rate": 0.00028424406314483047, + "loss": 0.0273, "step": 20820 }, { - "epoch": 0.23, - "learning_rate": 0.000266222351949147, - "loss": 0.0246, + "epoch": 0.11, + "learning_rate": 0.00028423649545181645, + "loss": 0.0302, "step": 20830 }, { - "epoch": 0.23, - "learning_rate": 0.0002662061360835441, - "loss": 0.0272, + "epoch": 0.11, + "learning_rate": 0.00028422892775880243, + "loss": 0.0328, "step": 20840 }, { - "epoch": 0.23, - "learning_rate": 0.0002661899202179412, - "loss": 0.0249, + "epoch": 0.11, + "learning_rate": 0.00028422136006578847, + "loss": 0.0305, "step": 20850 }, { - "epoch": 0.23, - "learning_rate": 0.0002661737043523383, - "loss": 0.0272, + "epoch": 0.11, + "learning_rate": 0.00028421379237277445, + "loss": 0.0309, "step": 20860 }, { - "epoch": 0.23, - "learning_rate": 0.00026615748848673543, - "loss": 0.029, + "epoch": 0.11, + "learning_rate": 0.00028420622467976043, + "loss": 0.0297, "step": 20870 }, { - "epoch": 0.23, - "learning_rate": 0.0002661412726211325, - "loss": 0.0222, + "epoch": 0.11, + "learning_rate": 0.0002841986569867464, + "loss": 0.0318, "step": 20880 }, { - "epoch": 0.23, - "learning_rate": 0.00026612505675552956, - "loss": 0.023, + "epoch": 0.11, + "learning_rate": 0.0002841910892937324, + "loss": 0.0358, "step": 20890 }, { - "epoch": 0.23, - "learning_rate": 0.0002661088408899267, - "loss": 0.0285, + "epoch": 0.11, + "learning_rate": 0.0002841835216007184, + "loss": 0.0282, "step": 20900 }, { - "epoch": 0.23, - "learning_rate": 0.0002660926250243238, - "loss": 0.0311, + "epoch": 0.11, + "learning_rate": 0.00028417595390770435, + "loss": 0.0285, "step": 20910 }, { - "epoch": 0.23, - "learning_rate": 0.00026607640915872087, - "loss": 0.0282, + "epoch": 0.11, + "learning_rate": 0.0002841683862146904, + "loss": 0.0371, "step": 20920 }, { - "epoch": 0.23, - "learning_rate": 0.000266060193293118, - "loss": 0.0279, + "epoch": 0.11, + "learning_rate": 0.00028416081852167637, + "loss": 0.0311, "step": 20930 }, { - "epoch": 0.23, - "learning_rate": 0.00026604397742751505, - "loss": 0.0249, + "epoch": 0.11, + "learning_rate": 0.00028415325082866235, + "loss": 0.0481, "step": 20940 }, { - "epoch": 0.23, - "learning_rate": 0.00026602776156191217, - "loss": 0.0245, + "epoch": 0.11, + "learning_rate": 0.00028414568313564833, + "loss": 0.0307, "step": 20950 }, { - "epoch": 0.23, - "learning_rate": 0.00026601154569630924, - "loss": 0.0301, + "epoch": 0.11, + "learning_rate": 0.0002841381154426343, + "loss": 0.031, "step": 20960 }, { - "epoch": 0.23, - "learning_rate": 0.00026599532983070636, - "loss": 0.0273, + "epoch": 0.11, + "learning_rate": 0.0002841305477496203, + "loss": 0.0286, "step": 20970 }, { - "epoch": 0.23, - "learning_rate": 0.0002659791139651034, - "loss": 0.0271, + "epoch": 0.11, + "learning_rate": 0.00028412298005660633, + "loss": 0.03, "step": 20980 }, { - "epoch": 0.23, - "learning_rate": 0.00026596289809950054, - "loss": 0.027, + "epoch": 0.11, + "learning_rate": 0.0002841154123635923, + "loss": 0.0331, "step": 20990 }, { - "epoch": 0.23, - "learning_rate": 0.0002659466822338976, + "epoch": 0.11, + "learning_rate": 0.0002841078446705783, "loss": 0.0248, "step": 21000 }, { - "epoch": 0.23, - "eval_cer": 0.9216103203928865, - "eval_loss": 0.020444829016923904, - "eval_runtime": 120.2567, - "eval_samples_per_second": 16.631, - "eval_steps_per_second": 4.158, + "epoch": 0.11, + "eval_cer": 0.9145119829365546, + "eval_loss": 0.021799687296152115, + "eval_runtime": 117.5088, + "eval_samples_per_second": 17.02, + "eval_steps_per_second": 4.255, "step": 21000 }, { - "epoch": 0.23, - "learning_rate": 0.00026593046636829473, - "loss": 0.0277, + "epoch": 0.11, + "learning_rate": 0.0002841002769775643, + "loss": 0.0341, "step": 21010 }, { - "epoch": 0.23, - "learning_rate": 0.0002659142505026918, - "loss": 0.0304, + "epoch": 0.11, + "learning_rate": 0.00028409270928455026, + "loss": 0.0298, "step": 21020 }, { - "epoch": 0.23, - "learning_rate": 0.0002658980346370889, + "epoch": 0.11, + "learning_rate": 0.00028408514159153624, "loss": 0.0277, "step": 21030 }, { - "epoch": 0.23, - "learning_rate": 0.000265881818771486, - "loss": 0.0313, + "epoch": 0.11, + "learning_rate": 0.0002840775738985222, + "loss": 0.0317, "step": 21040 }, { - "epoch": 0.23, - "learning_rate": 0.0002658656029058831, - "loss": 0.0321, + "epoch": 0.11, + "learning_rate": 0.00028407000620550826, + "loss": 0.0341, "step": 21050 }, { - "epoch": 0.23, - "learning_rate": 0.0002658493870402802, - "loss": 0.0262, + "epoch": 0.11, + "learning_rate": 0.00028406243851249424, + "loss": 0.0266, "step": 21060 }, { - "epoch": 0.23, - "learning_rate": 0.0002658331711746773, - "loss": 0.0269, + "epoch": 0.11, + "learning_rate": 0.0002840548708194802, + "loss": 0.0294, "step": 21070 }, { - "epoch": 0.23, - "learning_rate": 0.00026581695530907435, - "loss": 0.0349, + "epoch": 0.11, + "learning_rate": 0.0002840473031264662, + "loss": 0.0324, "step": 21080 }, { - "epoch": 0.23, - "learning_rate": 0.00026580073944347147, - "loss": 0.0271, + "epoch": 0.11, + "learning_rate": 0.0002840397354334522, + "loss": 0.0352, "step": 21090 }, { - "epoch": 0.23, - "learning_rate": 0.0002657845235778686, - "loss": 0.0371, + "epoch": 0.11, + "learning_rate": 0.00028403216774043816, + "loss": 0.0292, "step": 21100 }, { - "epoch": 0.23, - "learning_rate": 0.00026576830771226566, - "loss": 0.0293, + "epoch": 0.11, + "learning_rate": 0.0002840246000474242, + "loss": 0.0342, "step": 21110 }, { - "epoch": 0.23, - "learning_rate": 0.0002657520918466627, - "loss": 0.0258, + "epoch": 0.11, + "learning_rate": 0.0002840170323544102, + "loss": 0.0298, "step": 21120 }, { - "epoch": 0.23, - "learning_rate": 0.00026573587598105984, - "loss": 0.0293, + "epoch": 0.11, + "learning_rate": 0.00028400946466139616, + "loss": 0.0297, "step": 21130 }, { - "epoch": 0.23, - "learning_rate": 0.00026571966011545696, - "loss": 0.0288, + "epoch": 0.11, + "learning_rate": 0.00028400189696838214, + "loss": 0.0291, "step": 21140 }, { - "epoch": 0.23, - "learning_rate": 0.000265703444249854, - "loss": 0.0282, + "epoch": 0.11, + "learning_rate": 0.0002839943292753681, + "loss": 0.0265, "step": 21150 }, { - "epoch": 0.23, - "learning_rate": 0.0002656872283842511, - "loss": 0.0323, + "epoch": 0.11, + "learning_rate": 0.0002839867615823541, + "loss": 0.0303, "step": 21160 }, { - "epoch": 0.23, - "learning_rate": 0.0002656710125186482, - "loss": 0.0274, + "epoch": 0.11, + "learning_rate": 0.00028397919388934014, + "loss": 0.0283, "step": 21170 }, { - "epoch": 0.23, - "learning_rate": 0.00026565479665304533, - "loss": 0.0253, + "epoch": 0.11, + "learning_rate": 0.0002839716261963261, + "loss": 0.0293, "step": 21180 }, { - "epoch": 0.23, - "learning_rate": 0.0002656385807874424, - "loss": 0.0245, + "epoch": 0.11, + "learning_rate": 0.0002839640585033121, + "loss": 0.0316, "step": 21190 }, { - "epoch": 0.23, - "learning_rate": 0.0002656223649218395, - "loss": 0.0291, + "epoch": 0.11, + "learning_rate": 0.0002839564908102981, + "loss": 0.0332, "step": 21200 }, { - "epoch": 0.23, - "learning_rate": 0.0002656061490562366, - "loss": 0.0237, + "epoch": 0.11, + "learning_rate": 0.00028394892311728407, + "loss": 0.0376, "step": 21210 }, { - "epoch": 0.23, - "learning_rate": 0.0002655899331906337, - "loss": 0.0235, + "epoch": 0.11, + "learning_rate": 0.00028394135542427005, + "loss": 0.0328, "step": 21220 }, { - "epoch": 0.23, - "learning_rate": 0.0002655737173250308, - "loss": 0.0274, + "epoch": 0.11, + "learning_rate": 0.00028393378773125603, + "loss": 0.0347, "step": 21230 }, { - "epoch": 0.23, - "learning_rate": 0.0002655575014594279, - "loss": 0.0245, + "epoch": 0.11, + "learning_rate": 0.00028392622003824207, + "loss": 0.0322, "step": 21240 }, { - "epoch": 0.23, - "learning_rate": 0.00026554128559382495, - "loss": 0.0273, + "epoch": 0.11, + "learning_rate": 0.00028391865234522805, + "loss": 0.0329, "step": 21250 }, { - "epoch": 0.23, - "learning_rate": 0.0002655250697282221, - "loss": 0.0253, + "epoch": 0.11, + "learning_rate": 0.00028391108465221403, + "loss": 0.0309, "step": 21260 }, { - "epoch": 0.23, - "learning_rate": 0.0002655088538626192, - "loss": 0.0266, + "epoch": 0.11, + "learning_rate": 0.0002839035169592, + "loss": 0.0357, "step": 21270 }, { - "epoch": 0.23, - "learning_rate": 0.00026549263799701626, - "loss": 0.0442, + "epoch": 0.11, + "learning_rate": 0.000283895949266186, + "loss": 0.0267, "step": 21280 }, { - "epoch": 0.23, - "learning_rate": 0.0002654764221314133, - "loss": 0.0368, + "epoch": 0.11, + "learning_rate": 0.000283888381573172, + "loss": 0.0262, "step": 21290 }, { - "epoch": 0.23, - "learning_rate": 0.00026546020626581044, - "loss": 0.0298, + "epoch": 0.11, + "learning_rate": 0.000283880813880158, + "loss": 0.0326, "step": 21300 }, { - "epoch": 0.23, - "learning_rate": 0.00026544399040020756, - "loss": 0.0337, + "epoch": 0.11, + "learning_rate": 0.000283873246187144, + "loss": 0.0297, "step": 21310 }, { - "epoch": 0.23, - "learning_rate": 0.00026542777453460463, - "loss": 0.0249, + "epoch": 0.11, + "learning_rate": 0.00028386567849413, + "loss": 0.0262, "step": 21320 }, { - "epoch": 0.23, - "learning_rate": 0.0002654115586690017, - "loss": 0.0333, + "epoch": 0.11, + "learning_rate": 0.00028385811080111595, + "loss": 0.0247, "step": 21330 }, { - "epoch": 0.23, - "learning_rate": 0.0002653953428033988, - "loss": 0.026, + "epoch": 0.11, + "learning_rate": 0.00028385054310810194, + "loss": 0.0314, "step": 21340 }, { - "epoch": 0.23, - "learning_rate": 0.00026537912693779594, - "loss": 0.0329, + "epoch": 0.11, + "learning_rate": 0.0002838429754150879, + "loss": 0.0338, "step": 21350 }, { - "epoch": 0.23, - "learning_rate": 0.000265362911072193, - "loss": 0.0336, + "epoch": 0.11, + "learning_rate": 0.00028383540772207395, + "loss": 0.028, "step": 21360 }, { - "epoch": 0.23, - "learning_rate": 0.0002653466952065901, - "loss": 0.0282, + "epoch": 0.11, + "learning_rate": 0.00028382784002905993, + "loss": 0.0307, "step": 21370 }, { - "epoch": 0.23, - "learning_rate": 0.0002653304793409872, - "loss": 0.0274, + "epoch": 0.11, + "learning_rate": 0.0002838202723360459, + "loss": 0.0314, "step": 21380 }, { - "epoch": 0.23, - "learning_rate": 0.0002653142634753843, - "loss": 0.026, + "epoch": 0.11, + "learning_rate": 0.0002838127046430319, + "loss": 0.0284, "step": 21390 }, { - "epoch": 0.23, - "learning_rate": 0.00026529804760978137, - "loss": 0.0332, + "epoch": 0.11, + "learning_rate": 0.0002838051369500179, + "loss": 0.0304, "step": 21400 }, { - "epoch": 0.23, - "learning_rate": 0.0002652818317441785, - "loss": 0.027, + "epoch": 0.11, + "learning_rate": 0.00028379756925700386, + "loss": 0.0336, "step": 21410 }, { - "epoch": 0.23, - "learning_rate": 0.00026526561587857556, - "loss": 0.0242, + "epoch": 0.11, + "learning_rate": 0.00028379000156398984, + "loss": 0.0312, "step": 21420 }, { - "epoch": 0.23, - "learning_rate": 0.0002652494000129727, - "loss": 0.0276, + "epoch": 0.11, + "learning_rate": 0.0002837824338709759, + "loss": 0.0311, "step": 21430 }, { - "epoch": 0.23, - "learning_rate": 0.00026523318414736974, - "loss": 0.0244, + "epoch": 0.11, + "learning_rate": 0.00028377486617796186, + "loss": 0.0293, "step": 21440 }, { - "epoch": 0.23, - "learning_rate": 0.00026521696828176686, - "loss": 0.0316, + "epoch": 0.11, + "learning_rate": 0.00028376729848494784, + "loss": 0.0297, "step": 21450 }, { - "epoch": 0.23, - "learning_rate": 0.00026520075241616393, - "loss": 0.027, + "epoch": 0.11, + "learning_rate": 0.0002837597307919338, + "loss": 0.032, "step": 21460 }, { - "epoch": 0.23, - "learning_rate": 0.00026518453655056105, - "loss": 0.0302, + "epoch": 0.11, + "learning_rate": 0.0002837521630989198, + "loss": 0.0243, "step": 21470 }, { - "epoch": 0.23, - "learning_rate": 0.0002651683206849581, - "loss": 0.0316, + "epoch": 0.11, + "learning_rate": 0.0002837445954059058, + "loss": 0.0277, "step": 21480 }, { - "epoch": 0.23, - "learning_rate": 0.00026515210481935523, - "loss": 0.0273, + "epoch": 0.11, + "learning_rate": 0.0002837370277128918, + "loss": 0.0269, "step": 21490 }, { - "epoch": 0.23, - "learning_rate": 0.00026513588895375235, - "loss": 0.0256, + "epoch": 0.11, + "learning_rate": 0.0002837294600198778, + "loss": 0.0302, "step": 21500 }, { - "epoch": 0.23, - "learning_rate": 0.0002651196730881494, - "loss": 0.0251, + "epoch": 0.11, + "learning_rate": 0.0002837218923268638, + "loss": 0.0276, "step": 21510 }, { - "epoch": 0.23, - "learning_rate": 0.0002651034572225465, - "loss": 0.0313, + "epoch": 0.11, + "learning_rate": 0.00028371432463384976, + "loss": 0.0306, "step": 21520 }, { - "epoch": 0.23, - "learning_rate": 0.0002650872413569436, - "loss": 0.03, + "epoch": 0.11, + "learning_rate": 0.00028370675694083575, + "loss": 0.0309, "step": 21530 }, { - "epoch": 0.23, - "learning_rate": 0.0002650710254913407, - "loss": 0.0249, + "epoch": 0.11, + "learning_rate": 0.00028369918924782173, + "loss": 0.029, "step": 21540 }, { - "epoch": 0.23, - "learning_rate": 0.0002650548096257378, - "loss": 0.0254, + "epoch": 0.11, + "learning_rate": 0.0002836916215548077, + "loss": 0.0354, "step": 21550 }, { - "epoch": 0.23, - "learning_rate": 0.00026503859376013486, - "loss": 0.0225, + "epoch": 0.11, + "learning_rate": 0.00028368405386179374, + "loss": 0.039, "step": 21560 }, { - "epoch": 0.23, - "learning_rate": 0.000265022377894532, - "loss": 0.031, + "epoch": 0.11, + "learning_rate": 0.0002836764861687797, + "loss": 0.0296, "step": 21570 }, { - "epoch": 0.23, - "learning_rate": 0.0002650061620289291, - "loss": 0.027, + "epoch": 0.11, + "learning_rate": 0.0002836689184757657, + "loss": 0.0278, "step": 21580 }, { - "epoch": 0.23, - "learning_rate": 0.00026498994616332616, - "loss": 0.0229, + "epoch": 0.11, + "learning_rate": 0.0002836613507827517, + "loss": 0.0293, "step": 21590 }, { - "epoch": 0.23, - "learning_rate": 0.0002649737302977233, - "loss": 0.0245, + "epoch": 0.11, + "learning_rate": 0.00028365378308973767, + "loss": 0.0288, "step": 21600 }, { - "epoch": 0.23, - "learning_rate": 0.00026495751443212035, - "loss": 0.0248, + "epoch": 0.11, + "learning_rate": 0.00028364621539672365, + "loss": 0.0281, "step": 21610 }, { - "epoch": 0.23, - "learning_rate": 0.00026494129856651747, - "loss": 0.0236, + "epoch": 0.11, + "learning_rate": 0.0002836386477037097, + "loss": 0.0231, "step": 21620 }, { - "epoch": 0.23, - "learning_rate": 0.00026492508270091453, - "loss": 0.0255, + "epoch": 0.11, + "learning_rate": 0.00028363108001069567, + "loss": 0.0244, "step": 21630 }, { - "epoch": 0.23, - "learning_rate": 0.00026490886683531165, - "loss": 0.029, + "epoch": 0.11, + "learning_rate": 0.00028362351231768165, + "loss": 0.0288, "step": 21640 }, { - "epoch": 0.23, - "learning_rate": 0.0002648926509697087, - "loss": 0.022, + "epoch": 0.11, + "learning_rate": 0.00028361594462466763, + "loss": 0.0277, "step": 21650 }, { - "epoch": 0.23, - "learning_rate": 0.00026487643510410584, - "loss": 0.0257, + "epoch": 0.11, + "learning_rate": 0.0002836083769316536, + "loss": 0.0264, "step": 21660 }, { - "epoch": 0.23, - "learning_rate": 0.00026486021923850296, - "loss": 0.0243, + "epoch": 0.11, + "learning_rate": 0.0002836008092386396, + "loss": 0.0247, "step": 21670 }, { - "epoch": 0.23, - "learning_rate": 0.0002648440033729, - "loss": 0.0272, + "epoch": 0.11, + "learning_rate": 0.00028359324154562563, + "loss": 0.0261, "step": 21680 }, { - "epoch": 0.23, - "learning_rate": 0.0002648277875072971, - "loss": 0.0279, + "epoch": 0.11, + "learning_rate": 0.0002835856738526116, + "loss": 0.0295, "step": 21690 }, { - "epoch": 0.23, - "learning_rate": 0.0002648115716416942, - "loss": 0.0259, + "epoch": 0.11, + "learning_rate": 0.0002835781061595976, + "loss": 0.0298, "step": 21700 }, { - "epoch": 0.23, - "learning_rate": 0.00026479535577609133, - "loss": 0.0236, + "epoch": 0.11, + "learning_rate": 0.0002835705384665836, + "loss": 0.0272, "step": 21710 }, { - "epoch": 0.23, - "learning_rate": 0.0002647791399104884, - "loss": 0.0248, + "epoch": 0.11, + "learning_rate": 0.00028356297077356956, + "loss": 0.0324, "step": 21720 }, { - "epoch": 0.23, - "learning_rate": 0.00026476292404488546, - "loss": 0.0269, + "epoch": 0.11, + "learning_rate": 0.00028355540308055554, + "loss": 0.0303, "step": 21730 }, { - "epoch": 0.24, - "learning_rate": 0.0002647467081792826, - "loss": 0.0268, + "epoch": 0.11, + "learning_rate": 0.0002835478353875415, + "loss": 0.0288, "step": 21740 }, { - "epoch": 0.24, - "learning_rate": 0.0002647304923136797, - "loss": 0.0235, + "epoch": 0.11, + "learning_rate": 0.00028354026769452755, + "loss": 0.0307, "step": 21750 }, { - "epoch": 0.24, - "learning_rate": 0.00026471427644807677, - "loss": 0.0316, + "epoch": 0.11, + "learning_rate": 0.00028353270000151354, + "loss": 0.0302, "step": 21760 }, { - "epoch": 0.24, - "learning_rate": 0.0002646980605824739, - "loss": 0.0272, + "epoch": 0.11, + "learning_rate": 0.0002835251323084995, + "loss": 0.0283, "step": 21770 }, { - "epoch": 0.24, - "learning_rate": 0.00026468184471687095, - "loss": 0.0294, + "epoch": 0.11, + "learning_rate": 0.0002835175646154855, + "loss": 0.0261, "step": 21780 }, { - "epoch": 0.24, - "learning_rate": 0.00026466562885126807, - "loss": 0.0239, + "epoch": 0.11, + "learning_rate": 0.0002835099969224715, + "loss": 0.033, "step": 21790 }, { - "epoch": 0.24, - "learning_rate": 0.0002646494129856652, + "epoch": 0.11, + "learning_rate": 0.00028350242922945746, "loss": 0.0286, "step": 21800 }, { - "epoch": 0.24, - "learning_rate": 0.00026463319712006226, - "loss": 0.0334, + "epoch": 0.11, + "learning_rate": 0.0002834948615364435, + "loss": 0.0291, "step": 21810 }, { - "epoch": 0.24, - "learning_rate": 0.0002646169812544593, - "loss": 0.0255, + "epoch": 0.11, + "learning_rate": 0.0002834872938434295, + "loss": 0.0286, "step": 21820 }, { - "epoch": 0.24, - "learning_rate": 0.00026460076538885644, - "loss": 0.0279, + "epoch": 0.11, + "learning_rate": 0.00028347972615041546, + "loss": 0.0283, "step": 21830 }, { - "epoch": 0.24, - "learning_rate": 0.00026458454952325356, - "loss": 0.0309, + "epoch": 0.11, + "learning_rate": 0.00028347215845740144, + "loss": 0.0422, "step": 21840 }, { - "epoch": 0.24, - "learning_rate": 0.0002645683336576506, - "loss": 0.0284, + "epoch": 0.11, + "learning_rate": 0.0002834645907643874, + "loss": 0.0347, "step": 21850 }, { - "epoch": 0.24, - "learning_rate": 0.0002645521177920477, - "loss": 0.027, + "epoch": 0.11, + "learning_rate": 0.0002834570230713734, + "loss": 0.0353, "step": 21860 }, { - "epoch": 0.24, - "learning_rate": 0.0002645359019264448, - "loss": 0.0314, + "epoch": 0.11, + "learning_rate": 0.00028344945537835944, + "loss": 0.0305, "step": 21870 }, { - "epoch": 0.24, - "learning_rate": 0.00026451968606084193, - "loss": 0.0273, + "epoch": 0.11, + "learning_rate": 0.0002834418876853454, + "loss": 0.0271, "step": 21880 }, { - "epoch": 0.24, - "learning_rate": 0.000264503470195239, - "loss": 0.026, + "epoch": 0.11, + "learning_rate": 0.0002834343199923314, + "loss": 0.0306, "step": 21890 }, { - "epoch": 0.24, - "learning_rate": 0.00026448725432963606, - "loss": 0.0251, + "epoch": 0.11, + "learning_rate": 0.0002834267522993174, + "loss": 0.03, "step": 21900 }, { - "epoch": 0.24, - "learning_rate": 0.0002644710384640332, - "loss": 0.0225, + "epoch": 0.11, + "learning_rate": 0.00028341918460630337, + "loss": 0.0346, "step": 21910 }, { - "epoch": 0.24, - "learning_rate": 0.0002644548225984303, - "loss": 0.0211, + "epoch": 0.11, + "learning_rate": 0.00028341161691328935, + "loss": 0.03, "step": 21920 }, { - "epoch": 0.24, - "learning_rate": 0.00026443860673282737, - "loss": 0.027, + "epoch": 0.11, + "learning_rate": 0.00028340404922027533, + "loss": 0.0244, "step": 21930 }, { - "epoch": 0.24, - "learning_rate": 0.0002644223908672245, - "loss": 0.0245, + "epoch": 0.11, + "learning_rate": 0.00028339648152726136, + "loss": 0.0304, "step": 21940 }, { - "epoch": 0.24, - "learning_rate": 0.00026440617500162155, - "loss": 0.0269, + "epoch": 0.11, + "learning_rate": 0.00028338891383424735, + "loss": 0.0304, "step": 21950 }, { - "epoch": 0.24, - "learning_rate": 0.0002643899591360187, - "loss": 0.027, + "epoch": 0.11, + "learning_rate": 0.00028338134614123333, + "loss": 0.0289, "step": 21960 }, { - "epoch": 0.24, - "learning_rate": 0.00026437374327041574, - "loss": 0.0299, + "epoch": 0.11, + "learning_rate": 0.0002833737784482193, + "loss": 0.0245, "step": 21970 }, { - "epoch": 0.24, - "learning_rate": 0.00026435752740481286, - "loss": 0.026, + "epoch": 0.11, + "learning_rate": 0.0002833662107552053, + "loss": 0.0291, "step": 21980 }, { - "epoch": 0.24, - "learning_rate": 0.0002643413115392099, - "loss": 0.0299, + "epoch": 0.11, + "learning_rate": 0.00028335864306219127, + "loss": 0.0277, "step": 21990 }, { - "epoch": 0.24, - "learning_rate": 0.00026432509567360705, - "loss": 0.0258, + "epoch": 0.11, + "learning_rate": 0.00028335107536917725, + "loss": 0.026, "step": 22000 }, { - "epoch": 0.24, - "eval_cer": 0.9216268238490577, - "eval_loss": 0.019485387951135635, - "eval_runtime": 120.4283, - "eval_samples_per_second": 16.607, - "eval_steps_per_second": 4.152, + "epoch": 0.11, + "eval_cer": 0.9144663743186606, + "eval_loss": 0.021011509001255035, + "eval_runtime": 117.4912, + "eval_samples_per_second": 17.023, + "eval_steps_per_second": 4.256, "step": 22000 }, { - "epoch": 0.24, - "learning_rate": 0.0002643088798080041, - "loss": 0.0258, + "epoch": 0.11, + "learning_rate": 0.00028334350767616323, + "loss": 0.0327, "step": 22010 }, { - "epoch": 0.24, - "learning_rate": 0.00026429266394240123, - "loss": 0.0266, + "epoch": 0.11, + "learning_rate": 0.0002833359399831492, + "loss": 0.0257, "step": 22020 }, { - "epoch": 0.24, - "learning_rate": 0.0002642764480767983, - "loss": 0.0296, + "epoch": 0.11, + "learning_rate": 0.0002833283722901352, + "loss": 0.0277, "step": 22030 }, { - "epoch": 0.24, - "learning_rate": 0.0002642602322111954, - "loss": 0.0248, + "epoch": 0.11, + "learning_rate": 0.00028332080459712123, + "loss": 0.0319, "step": 22040 }, { - "epoch": 0.24, - "learning_rate": 0.0002642440163455925, - "loss": 0.0365, + "epoch": 0.11, + "learning_rate": 0.0002833132369041072, + "loss": 0.0257, "step": 22050 }, { - "epoch": 0.24, - "learning_rate": 0.0002642278004799896, - "loss": 0.0311, + "epoch": 0.11, + "learning_rate": 0.0002833056692110932, + "loss": 0.0284, "step": 22060 }, { - "epoch": 0.24, - "learning_rate": 0.0002642115846143867, - "loss": 0.035, + "epoch": 0.11, + "learning_rate": 0.0002832981015180792, + "loss": 0.0336, "step": 22070 }, { - "epoch": 0.24, - "learning_rate": 0.0002641953687487838, - "loss": 0.0285, + "epoch": 0.11, + "learning_rate": 0.00028329053382506516, + "loss": 0.0331, "step": 22080 }, { - "epoch": 0.24, - "learning_rate": 0.00026417915288318085, - "loss": 0.028, + "epoch": 0.11, + "learning_rate": 0.00028328296613205114, + "loss": 0.0259, "step": 22090 }, { - "epoch": 0.24, - "learning_rate": 0.00026416293701757797, - "loss": 0.0277, + "epoch": 0.11, + "learning_rate": 0.0002832753984390371, + "loss": 0.03, "step": 22100 }, { - "epoch": 0.24, - "learning_rate": 0.0002641467211519751, - "loss": 0.027, + "epoch": 0.11, + "learning_rate": 0.00028326783074602316, + "loss": 0.0331, "step": 22110 }, { - "epoch": 0.24, - "learning_rate": 0.00026413050528637216, - "loss": 0.028, + "epoch": 0.11, + "learning_rate": 0.00028326026305300914, + "loss": 0.0306, "step": 22120 }, { - "epoch": 0.24, - "learning_rate": 0.0002641142894207692, - "loss": 0.0245, + "epoch": 0.11, + "learning_rate": 0.0002832526953599951, + "loss": 0.0292, "step": 22130 }, { - "epoch": 0.24, - "learning_rate": 0.00026409807355516634, - "loss": 0.028, + "epoch": 0.11, + "learning_rate": 0.0002832451276669811, + "loss": 0.0302, "step": 22140 }, { - "epoch": 0.24, - "learning_rate": 0.00026408185768956346, - "loss": 0.0307, + "epoch": 0.11, + "learning_rate": 0.0002832375599739671, + "loss": 0.0326, "step": 22150 }, { - "epoch": 0.24, - "learning_rate": 0.00026406564182396053, - "loss": 0.0273, + "epoch": 0.11, + "learning_rate": 0.00028322999228095306, + "loss": 0.0353, "step": 22160 }, { - "epoch": 0.24, - "learning_rate": 0.0002640494259583576, - "loss": 0.0288, + "epoch": 0.11, + "learning_rate": 0.0002832224245879391, + "loss": 0.0253, "step": 22170 }, { - "epoch": 0.24, - "learning_rate": 0.0002640332100927547, - "loss": 0.0297, + "epoch": 0.11, + "learning_rate": 0.0002832148568949251, + "loss": 0.0283, "step": 22180 }, { - "epoch": 0.24, - "learning_rate": 0.00026401699422715183, - "loss": 0.0314, + "epoch": 0.11, + "learning_rate": 0.00028320728920191106, + "loss": 0.0256, "step": 22190 }, { - "epoch": 0.24, - "learning_rate": 0.0002640007783615489, - "loss": 0.0275, + "epoch": 0.11, + "learning_rate": 0.00028319972150889704, + "loss": 0.031, "step": 22200 }, { - "epoch": 0.24, - "learning_rate": 0.000263984562495946, - "loss": 0.0258, + "epoch": 0.11, + "learning_rate": 0.000283192153815883, + "loss": 0.0296, "step": 22210 }, { - "epoch": 0.24, - "learning_rate": 0.0002639683466303431, - "loss": 0.0315, + "epoch": 0.11, + "learning_rate": 0.000283184586122869, + "loss": 0.027, "step": 22220 }, { - "epoch": 0.24, - "learning_rate": 0.0002639521307647402, - "loss": 0.0347, + "epoch": 0.11, + "learning_rate": 0.00028317701842985504, + "loss": 0.0318, "step": 22230 }, { - "epoch": 0.24, - "learning_rate": 0.0002639359148991373, - "loss": 0.0277, + "epoch": 0.11, + "learning_rate": 0.000283169450736841, + "loss": 0.0297, "step": 22240 }, { - "epoch": 0.24, - "learning_rate": 0.0002639196990335344, - "loss": 0.0286, + "epoch": 0.11, + "learning_rate": 0.000283161883043827, + "loss": 0.0266, "step": 22250 }, { - "epoch": 0.24, - "learning_rate": 0.00026390348316793146, - "loss": 0.0313, + "epoch": 0.11, + "learning_rate": 0.000283154315350813, + "loss": 0.0307, "step": 22260 }, { - "epoch": 0.24, - "learning_rate": 0.0002638872673023286, - "loss": 0.0325, + "epoch": 0.11, + "learning_rate": 0.00028314674765779897, + "loss": 0.0264, "step": 22270 }, { - "epoch": 0.24, - "learning_rate": 0.0002638710514367257, - "loss": 0.0272, + "epoch": 0.11, + "learning_rate": 0.00028313917996478495, + "loss": 0.028, "step": 22280 }, { - "epoch": 0.24, - "learning_rate": 0.00026385483557112276, - "loss": 0.0327, + "epoch": 0.11, + "learning_rate": 0.00028313161227177093, + "loss": 0.0313, "step": 22290 }, { - "epoch": 0.24, - "learning_rate": 0.00026383861970551983, - "loss": 0.0262, + "epoch": 0.11, + "learning_rate": 0.00028312404457875697, + "loss": 0.0223, "step": 22300 }, { - "epoch": 0.24, - "learning_rate": 0.00026382240383991695, - "loss": 0.0326, + "epoch": 0.11, + "learning_rate": 0.00028311647688574295, + "loss": 0.0285, "step": 22310 }, { - "epoch": 0.24, - "learning_rate": 0.00026380618797431407, - "loss": 0.03, + "epoch": 0.11, + "learning_rate": 0.00028310890919272893, + "loss": 0.0331, "step": 22320 }, { - "epoch": 0.24, - "learning_rate": 0.00026378997210871113, - "loss": 0.0275, + "epoch": 0.11, + "learning_rate": 0.0002831013414997149, + "loss": 0.0389, "step": 22330 }, { - "epoch": 0.24, - "learning_rate": 0.0002637737562431082, - "loss": 0.0447, + "epoch": 0.11, + "learning_rate": 0.0002830937738067009, + "loss": 0.037, "step": 22340 }, { - "epoch": 0.24, - "learning_rate": 0.0002637575403775053, - "loss": 0.0503, + "epoch": 0.11, + "learning_rate": 0.0002830862061136869, + "loss": 0.0304, "step": 22350 }, { - "epoch": 0.24, - "learning_rate": 0.00026374132451190244, - "loss": 0.0397, + "epoch": 0.11, + "learning_rate": 0.0002830786384206729, + "loss": 0.0333, "step": 22360 }, { - "epoch": 0.24, - "learning_rate": 0.00026372510864629956, - "loss": 0.0425, + "epoch": 0.11, + "learning_rate": 0.0002830710707276589, + "loss": 0.0416, "step": 22370 }, { - "epoch": 0.24, - "learning_rate": 0.0002637088927806966, - "loss": 0.0306, + "epoch": 0.11, + "learning_rate": 0.0002830635030346449, + "loss": 0.0273, "step": 22380 }, { - "epoch": 0.24, - "learning_rate": 0.0002636926769150937, - "loss": 0.0366, + "epoch": 0.11, + "learning_rate": 0.00028305593534163085, + "loss": 0.0299, "step": 22390 }, { - "epoch": 0.24, - "learning_rate": 0.0002636764610494908, - "loss": 0.0283, + "epoch": 0.11, + "learning_rate": 0.00028304836764861684, + "loss": 0.0309, "step": 22400 }, { - "epoch": 0.24, - "learning_rate": 0.00026366024518388793, - "loss": 0.0284, + "epoch": 0.11, + "learning_rate": 0.0002830407999556028, + "loss": 0.0304, "step": 22410 }, { - "epoch": 0.24, - "learning_rate": 0.000263644029318285, - "loss": 0.0279, + "epoch": 0.11, + "learning_rate": 0.00028303323226258885, + "loss": 0.0312, "step": 22420 }, { - "epoch": 0.24, - "learning_rate": 0.00026362781345268206, - "loss": 0.0276, + "epoch": 0.11, + "learning_rate": 0.00028302566456957483, + "loss": 0.0316, "step": 22430 }, { - "epoch": 0.24, - "learning_rate": 0.0002636115975870792, - "loss": 0.0264, + "epoch": 0.11, + "learning_rate": 0.0002830180968765608, + "loss": 0.0328, "step": 22440 }, { - "epoch": 0.24, - "learning_rate": 0.0002635953817214763, - "loss": 0.0272, + "epoch": 0.11, + "learning_rate": 0.0002830105291835468, + "loss": 0.0317, "step": 22450 }, { - "epoch": 0.24, - "learning_rate": 0.00026357916585587337, - "loss": 0.029, + "epoch": 0.11, + "learning_rate": 0.0002830029614905328, + "loss": 0.0324, "step": 22460 }, { - "epoch": 0.24, - "learning_rate": 0.00026356294999027043, - "loss": 0.0289, + "epoch": 0.11, + "learning_rate": 0.00028299539379751876, + "loss": 0.0302, "step": 22470 }, { - "epoch": 0.24, - "learning_rate": 0.00026354673412466755, - "loss": 0.0218, + "epoch": 0.11, + "learning_rate": 0.00028298782610450474, + "loss": 0.0318, "step": 22480 }, { - "epoch": 0.24, - "learning_rate": 0.00026353051825906467, - "loss": 0.0335, + "epoch": 0.11, + "learning_rate": 0.0002829802584114908, + "loss": 0.0316, "step": 22490 }, { - "epoch": 0.24, - "learning_rate": 0.00026351430239346174, - "loss": 0.0304, + "epoch": 0.11, + "learning_rate": 0.00028297269071847676, + "loss": 0.0309, "step": 22500 }, { - "epoch": 0.24, - "learning_rate": 0.00026349808652785886, - "loss": 0.0286, + "epoch": 0.11, + "learning_rate": 0.00028296512302546274, + "loss": 0.0304, "step": 22510 }, { - "epoch": 0.24, - "learning_rate": 0.0002634818706622559, - "loss": 0.0296, + "epoch": 0.11, + "learning_rate": 0.0002829575553324487, + "loss": 0.0312, "step": 22520 }, { - "epoch": 0.24, - "learning_rate": 0.00026346565479665304, - "loss": 0.0294, + "epoch": 0.11, + "learning_rate": 0.0002829499876394347, + "loss": 0.0314, "step": 22530 }, { - "epoch": 0.24, - "learning_rate": 0.0002634494389310501, - "loss": 0.0295, + "epoch": 0.11, + "learning_rate": 0.0002829424199464207, + "loss": 0.035, "step": 22540 }, { - "epoch": 0.24, - "learning_rate": 0.00026343322306544723, - "loss": 0.0267, + "epoch": 0.11, + "learning_rate": 0.0002829348522534067, + "loss": 0.0283, "step": 22550 }, { - "epoch": 0.24, - "learning_rate": 0.0002634170071998443, - "loss": 0.028, + "epoch": 0.11, + "learning_rate": 0.0002829272845603927, + "loss": 0.0304, "step": 22560 }, { - "epoch": 0.24, - "learning_rate": 0.0002634007913342414, - "loss": 0.0287, + "epoch": 0.11, + "learning_rate": 0.0002829197168673787, + "loss": 0.03, "step": 22570 }, { - "epoch": 0.24, - "learning_rate": 0.0002633845754686385, - "loss": 0.0312, + "epoch": 0.11, + "learning_rate": 0.00028291214917436466, + "loss": 0.0296, "step": 22580 }, { - "epoch": 0.24, - "learning_rate": 0.0002633683596030356, - "loss": 0.0336, + "epoch": 0.11, + "learning_rate": 0.00028290458148135065, + "loss": 0.0294, "step": 22590 }, { - "epoch": 0.24, - "learning_rate": 0.00026335214373743266, + "epoch": 0.11, + "learning_rate": 0.00028289701378833663, "loss": 0.0285, "step": 22600 }, { - "epoch": 0.24, - "learning_rate": 0.0002633359278718298, - "loss": 0.0269, + "epoch": 0.11, + "learning_rate": 0.0002828894460953226, + "loss": 0.028, "step": 22610 }, { - "epoch": 0.24, - "learning_rate": 0.00026331971200622685, - "loss": 0.029, + "epoch": 0.11, + "learning_rate": 0.00028288187840230864, + "loss": 0.0311, "step": 22620 }, { - "epoch": 0.24, - "learning_rate": 0.00026330349614062397, - "loss": 0.0227, + "epoch": 0.11, + "learning_rate": 0.0002828743107092946, + "loss": 0.029, "step": 22630 }, { - "epoch": 0.24, - "learning_rate": 0.00026328728027502103, - "loss": 0.0312, + "epoch": 0.11, + "learning_rate": 0.0002828667430162806, + "loss": 0.0341, "step": 22640 }, { - "epoch": 0.24, - "learning_rate": 0.00026327106440941815, - "loss": 0.0253, + "epoch": 0.11, + "learning_rate": 0.0002828591753232666, + "loss": 0.0317, "step": 22650 }, { - "epoch": 0.24, - "learning_rate": 0.0002632548485438152, - "loss": 0.0313, + "epoch": 0.11, + "learning_rate": 0.00028285160763025257, + "loss": 0.0263, "step": 22660 }, { - "epoch": 0.25, - "learning_rate": 0.00026323863267821234, - "loss": 0.0268, + "epoch": 0.11, + "learning_rate": 0.00028284403993723855, + "loss": 0.0257, "step": 22670 }, { - "epoch": 0.25, - "learning_rate": 0.00026322241681260946, - "loss": 0.0263, + "epoch": 0.11, + "learning_rate": 0.0002828364722442246, + "loss": 0.0298, "step": 22680 }, { - "epoch": 0.25, - "learning_rate": 0.0002632062009470065, - "loss": 0.0246, + "epoch": 0.11, + "learning_rate": 0.00028282890455121057, + "loss": 0.0329, "step": 22690 }, { - "epoch": 0.25, - "learning_rate": 0.0002631899850814036, - "loss": 0.0256, + "epoch": 0.11, + "learning_rate": 0.00028282133685819655, + "loss": 0.0311, "step": 22700 }, { - "epoch": 0.25, - "learning_rate": 0.0002631737692158007, - "loss": 0.025, + "epoch": 0.11, + "learning_rate": 0.00028281376916518253, + "loss": 0.0481, "step": 22710 }, { - "epoch": 0.25, - "learning_rate": 0.00026315755335019783, - "loss": 0.029, + "epoch": 0.11, + "learning_rate": 0.0002828062014721685, + "loss": 0.0289, "step": 22720 }, { - "epoch": 0.25, - "learning_rate": 0.0002631413374845949, - "loss": 0.0254, + "epoch": 0.11, + "learning_rate": 0.0002827986337791545, + "loss": 0.0321, "step": 22730 }, { - "epoch": 0.25, - "learning_rate": 0.00026312512161899196, - "loss": 0.0325, + "epoch": 0.11, + "learning_rate": 0.00028279106608614053, + "loss": 0.0291, "step": 22740 }, { - "epoch": 0.25, - "learning_rate": 0.0002631089057533891, - "loss": 0.0269, + "epoch": 0.11, + "learning_rate": 0.0002827834983931265, + "loss": 0.0326, "step": 22750 }, { - "epoch": 0.25, - "learning_rate": 0.0002630926898877862, - "loss": 0.0272, + "epoch": 0.11, + "learning_rate": 0.0002827759307001125, + "loss": 0.0284, "step": 22760 }, { - "epoch": 0.25, - "learning_rate": 0.00026307647402218327, - "loss": 0.0253, + "epoch": 0.11, + "learning_rate": 0.0002827683630070985, + "loss": 0.0327, "step": 22770 }, { - "epoch": 0.25, - "learning_rate": 0.0002630602581565804, - "loss": 0.0229, + "epoch": 0.11, + "learning_rate": 0.00028276079531408446, + "loss": 0.0308, "step": 22780 }, { - "epoch": 0.25, - "learning_rate": 0.00026304404229097745, - "loss": 0.0286, + "epoch": 0.11, + "learning_rate": 0.00028275322762107044, + "loss": 0.0304, "step": 22790 }, { - "epoch": 0.25, - "learning_rate": 0.0002630278264253746, - "loss": 0.0285, + "epoch": 0.12, + "learning_rate": 0.0002827456599280564, + "loss": 0.0265, "step": 22800 }, { - "epoch": 0.25, - "learning_rate": 0.0002630116105597717, - "loss": 0.0288, + "epoch": 0.12, + "learning_rate": 0.00028273809223504246, + "loss": 0.032, "step": 22810 }, { - "epoch": 0.25, - "learning_rate": 0.00026299539469416876, - "loss": 0.0251, + "epoch": 0.12, + "learning_rate": 0.00028273052454202844, + "loss": 0.0385, "step": 22820 }, { - "epoch": 0.25, - "learning_rate": 0.0002629791788285658, - "loss": 0.0244, + "epoch": 0.12, + "learning_rate": 0.0002827229568490144, + "loss": 0.03, "step": 22830 }, { - "epoch": 0.25, - "learning_rate": 0.00026296296296296294, - "loss": 0.025, + "epoch": 0.12, + "learning_rate": 0.0002827153891560004, + "loss": 0.0387, "step": 22840 }, { - "epoch": 0.25, - "learning_rate": 0.00026294674709736006, - "loss": 0.025, + "epoch": 0.12, + "learning_rate": 0.0002827078214629864, + "loss": 0.0367, "step": 22850 }, { - "epoch": 0.25, - "learning_rate": 0.00026293053123175713, - "loss": 0.0247, + "epoch": 0.12, + "learning_rate": 0.00028270025376997236, + "loss": 0.0381, "step": 22860 }, { - "epoch": 0.25, - "learning_rate": 0.0002629143153661542, - "loss": 0.0261, + "epoch": 0.12, + "learning_rate": 0.0002826926860769584, + "loss": 0.0264, "step": 22870 }, { - "epoch": 0.25, - "learning_rate": 0.0002628980995005513, - "loss": 0.0298, + "epoch": 0.12, + "learning_rate": 0.0002826851183839444, + "loss": 0.0268, "step": 22880 }, { - "epoch": 0.25, - "learning_rate": 0.00026288188363494843, - "loss": 0.0257, + "epoch": 0.12, + "learning_rate": 0.00028267755069093036, + "loss": 0.0304, "step": 22890 }, { - "epoch": 0.25, - "learning_rate": 0.0002628656677693455, - "loss": 0.0316, + "epoch": 0.12, + "learning_rate": 0.00028266998299791634, + "loss": 0.0339, "step": 22900 }, { - "epoch": 0.25, - "learning_rate": 0.00026284945190374257, - "loss": 0.0259, + "epoch": 0.12, + "learning_rate": 0.0002826624153049023, + "loss": 0.0295, "step": 22910 }, { - "epoch": 0.25, - "learning_rate": 0.0002628332360381397, - "loss": 0.0278, + "epoch": 0.12, + "learning_rate": 0.0002826548476118883, + "loss": 0.0362, "step": 22920 }, { - "epoch": 0.25, - "learning_rate": 0.0002628170201725368, - "loss": 0.0284, + "epoch": 0.12, + "learning_rate": 0.00028264727991887434, + "loss": 0.0312, "step": 22930 }, { - "epoch": 0.25, - "learning_rate": 0.00026280080430693387, - "loss": 0.0245, + "epoch": 0.12, + "learning_rate": 0.0002826397122258603, + "loss": 0.0301, "step": 22940 }, { - "epoch": 0.25, - "learning_rate": 0.000262784588441331, - "loss": 0.0262, + "epoch": 0.12, + "learning_rate": 0.0002826321445328463, + "loss": 0.0318, "step": 22950 }, { - "epoch": 0.25, - "learning_rate": 0.00026276837257572806, - "loss": 0.0276, + "epoch": 0.12, + "learning_rate": 0.0002826245768398323, + "loss": 0.0324, "step": 22960 }, { - "epoch": 0.25, - "learning_rate": 0.0002627521567101252, - "loss": 0.0271, + "epoch": 0.12, + "learning_rate": 0.00028261700914681827, + "loss": 0.0326, "step": 22970 }, { - "epoch": 0.25, - "learning_rate": 0.00026273594084452224, - "loss": 0.026, + "epoch": 0.12, + "learning_rate": 0.00028260944145380425, + "loss": 0.0282, "step": 22980 }, { - "epoch": 0.25, - "learning_rate": 0.00026271972497891936, - "loss": 0.0259, + "epoch": 0.12, + "learning_rate": 0.00028260187376079023, + "loss": 0.0255, "step": 22990 }, { - "epoch": 0.25, - "learning_rate": 0.00026270350911331643, - "loss": 0.0247, + "epoch": 0.12, + "learning_rate": 0.00028259430606777627, + "loss": 0.0325, "step": 23000 }, { - "epoch": 0.25, - "eval_cer": 0.9215642844361985, - "eval_loss": 0.018794536590576172, - "eval_runtime": 119.88, - "eval_samples_per_second": 16.683, - "eval_steps_per_second": 4.171, + "epoch": 0.12, + "eval_cer": 0.9145051901636767, + "eval_loss": 0.02104305848479271, + "eval_runtime": 117.2879, + "eval_samples_per_second": 17.052, + "eval_steps_per_second": 4.263, "step": 23000 }, { - "epoch": 0.25, - "learning_rate": 0.00026268729324771355, - "loss": 0.0282, + "epoch": 0.12, + "learning_rate": 0.00028258673837476225, + "loss": 0.0284, "step": 23010 }, { - "epoch": 0.25, - "learning_rate": 0.00026267107738211067, - "loss": 0.0299, + "epoch": 0.12, + "learning_rate": 0.00028257917068174823, + "loss": 0.0292, "step": 23020 }, { - "epoch": 0.25, - "learning_rate": 0.00026265486151650773, - "loss": 0.0276, + "epoch": 0.12, + "learning_rate": 0.0002825716029887342, + "loss": 0.0379, "step": 23030 }, { - "epoch": 0.25, - "learning_rate": 0.0002626386456509048, - "loss": 0.0255, + "epoch": 0.12, + "learning_rate": 0.0002825640352957202, + "loss": 0.0286, "step": 23040 }, { - "epoch": 0.25, - "learning_rate": 0.0002626224297853019, - "loss": 0.0257, + "epoch": 0.12, + "learning_rate": 0.00028255646760270617, + "loss": 0.028, "step": 23050 }, { - "epoch": 0.25, - "learning_rate": 0.00026260621391969904, - "loss": 0.0253, + "epoch": 0.12, + "learning_rate": 0.0002825488999096922, + "loss": 0.0265, "step": 23060 }, { - "epoch": 0.25, - "learning_rate": 0.0002625899980540961, - "loss": 0.0266, + "epoch": 0.12, + "learning_rate": 0.0002825413322166782, + "loss": 0.0265, "step": 23070 }, { - "epoch": 0.25, - "learning_rate": 0.0002625737821884932, - "loss": 0.026, + "epoch": 0.12, + "learning_rate": 0.00028253376452366417, + "loss": 0.0236, "step": 23080 }, { - "epoch": 0.25, - "learning_rate": 0.0002625575663228903, - "loss": 0.0296, + "epoch": 0.12, + "learning_rate": 0.00028252619683065015, + "loss": 0.0313, "step": 23090 }, { - "epoch": 0.25, - "learning_rate": 0.0002625413504572874, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.00028251862913763613, + "loss": 0.0322, "step": 23100 }, { - "epoch": 0.25, - "learning_rate": 0.0002625251345916845, - "loss": 0.027, + "epoch": 0.12, + "learning_rate": 0.0002825110614446221, + "loss": 0.0246, "step": 23110 }, { - "epoch": 0.25, - "learning_rate": 0.0002625089187260816, - "loss": 0.027, + "epoch": 0.12, + "learning_rate": 0.0002825034937516081, + "loss": 0.0267, "step": 23120 }, { - "epoch": 0.25, - "learning_rate": 0.00026249270286047866, - "loss": 0.0263, + "epoch": 0.12, + "learning_rate": 0.00028249592605859413, + "loss": 0.0279, "step": 23130 }, { - "epoch": 0.25, - "learning_rate": 0.0002624764869948758, - "loss": 0.0239, + "epoch": 0.12, + "learning_rate": 0.0002824883583655801, + "loss": 0.0299, "step": 23140 }, { - "epoch": 0.25, - "learning_rate": 0.00026246027112927285, - "loss": 0.02, + "epoch": 0.12, + "learning_rate": 0.0002824807906725661, + "loss": 0.0319, "step": 23150 }, { - "epoch": 0.25, - "learning_rate": 0.00026244405526366997, - "loss": 0.0264, + "epoch": 0.12, + "learning_rate": 0.0002824732229795521, + "loss": 0.0298, "step": 23160 }, { - "epoch": 0.25, - "learning_rate": 0.00026242783939806703, - "loss": 0.0259, + "epoch": 0.12, + "learning_rate": 0.00028246565528653806, + "loss": 0.0317, "step": 23170 }, { - "epoch": 0.25, - "learning_rate": 0.00026241162353246415, - "loss": 0.0247, + "epoch": 0.12, + "learning_rate": 0.00028245808759352404, + "loss": 0.0303, "step": 23180 }, { - "epoch": 0.25, - "learning_rate": 0.0002623954076668612, - "loss": 0.0236, + "epoch": 0.12, + "learning_rate": 0.0002824505199005101, + "loss": 0.0286, "step": 23190 }, { - "epoch": 0.25, - "learning_rate": 0.00026237919180125834, - "loss": 0.0233, + "epoch": 0.12, + "learning_rate": 0.00028244295220749606, + "loss": 0.0312, "step": 23200 }, { - "epoch": 0.25, - "learning_rate": 0.0002623629759356554, - "loss": 0.0241, + "epoch": 0.12, + "learning_rate": 0.00028243538451448204, + "loss": 0.033, "step": 23210 }, { - "epoch": 0.25, - "learning_rate": 0.0002623467600700525, - "loss": 0.0303, + "epoch": 0.12, + "learning_rate": 0.000282427816821468, + "loss": 0.0292, "step": 23220 }, { - "epoch": 0.25, - "learning_rate": 0.0002623305442044496, - "loss": 0.0266, + "epoch": 0.12, + "learning_rate": 0.000282420249128454, + "loss": 0.0307, "step": 23230 }, { - "epoch": 0.25, - "learning_rate": 0.0002623143283388467, - "loss": 0.0269, + "epoch": 0.12, + "learning_rate": 0.00028241268143544, + "loss": 0.0273, "step": 23240 }, { - "epoch": 0.25, - "learning_rate": 0.00026229811247324383, - "loss": 0.0215, + "epoch": 0.12, + "learning_rate": 0.000282405113742426, + "loss": 0.0331, "step": 23250 }, { - "epoch": 0.25, - "learning_rate": 0.0002622818966076409, - "loss": 0.0261, + "epoch": 0.12, + "learning_rate": 0.00028239754604941195, + "loss": 0.028, "step": 23260 }, { - "epoch": 0.25, - "learning_rate": 0.00026226568074203796, - "loss": 0.025, + "epoch": 0.12, + "learning_rate": 0.0002823899783563979, + "loss": 0.0332, "step": 23270 }, { - "epoch": 0.25, - "learning_rate": 0.0002622494648764351, - "loss": 0.0272, + "epoch": 0.12, + "learning_rate": 0.0002823824106633839, + "loss": 0.026, "step": 23280 }, { - "epoch": 0.25, - "learning_rate": 0.0002622332490108322, - "loss": 0.0271, + "epoch": 0.12, + "learning_rate": 0.00028237484297036994, + "loss": 0.0326, "step": 23290 }, { - "epoch": 0.25, - "learning_rate": 0.00026221703314522926, - "loss": 0.0259, + "epoch": 0.12, + "learning_rate": 0.0002823672752773559, + "loss": 0.0301, "step": 23300 }, { - "epoch": 0.25, - "learning_rate": 0.00026220081727962633, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.0002823597075843419, + "loss": 0.0236, "step": 23310 }, { - "epoch": 0.25, - "learning_rate": 0.00026218460141402345, - "loss": 0.0229, + "epoch": 0.12, + "learning_rate": 0.0002823521398913279, + "loss": 0.0281, "step": 23320 }, { - "epoch": 0.25, - "learning_rate": 0.00026216838554842057, - "loss": 0.0266, + "epoch": 0.12, + "learning_rate": 0.00028234457219831387, + "loss": 0.0325, "step": 23330 }, { - "epoch": 0.25, - "learning_rate": 0.00026215216968281764, - "loss": 0.0215, + "epoch": 0.12, + "learning_rate": 0.00028233700450529985, + "loss": 0.0255, "step": 23340 }, { - "epoch": 0.25, - "learning_rate": 0.0002621359538172147, - "loss": 0.0284, + "epoch": 0.12, + "learning_rate": 0.00028232943681228583, + "loss": 0.0332, "step": 23350 }, { - "epoch": 0.25, - "learning_rate": 0.0002621197379516118, - "loss": 0.023, + "epoch": 0.12, + "learning_rate": 0.00028232186911927187, + "loss": 0.0365, "step": 23360 }, { - "epoch": 0.25, - "learning_rate": 0.00026210352208600894, - "loss": 0.0237, + "epoch": 0.12, + "learning_rate": 0.00028231430142625785, + "loss": 0.0262, "step": 23370 }, { - "epoch": 0.25, - "learning_rate": 0.00026208730622040606, - "loss": 0.0293, + "epoch": 0.12, + "learning_rate": 0.00028230673373324383, + "loss": 0.03, "step": 23380 }, { - "epoch": 0.25, - "learning_rate": 0.0002620710903548031, - "loss": 0.0329, + "epoch": 0.12, + "learning_rate": 0.0002822991660402298, + "loss": 0.0291, "step": 23390 }, { - "epoch": 0.25, - "learning_rate": 0.0002620548744892002, - "loss": 0.0271, + "epoch": 0.12, + "learning_rate": 0.0002822915983472158, + "loss": 0.0318, "step": 23400 }, { - "epoch": 0.25, - "learning_rate": 0.0002620386586235973, - "loss": 0.0272, + "epoch": 0.12, + "learning_rate": 0.0002822840306542018, + "loss": 0.027, "step": 23410 }, { - "epoch": 0.25, - "learning_rate": 0.00026202244275799443, - "loss": 0.0236, + "epoch": 0.12, + "learning_rate": 0.0002822764629611878, + "loss": 0.0291, "step": 23420 }, { - "epoch": 0.25, - "learning_rate": 0.0002620062268923915, - "loss": 0.0231, + "epoch": 0.12, + "learning_rate": 0.0002822688952681738, + "loss": 0.0266, "step": 23430 }, { - "epoch": 0.25, - "learning_rate": 0.00026199001102678856, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.0002822613275751598, + "loss": 0.0257, "step": 23440 }, { - "epoch": 0.25, - "learning_rate": 0.0002619737951611857, - "loss": 0.029, + "epoch": 0.12, + "learning_rate": 0.00028225375988214576, + "loss": 0.0247, "step": 23450 }, { - "epoch": 0.25, - "learning_rate": 0.0002619575792955828, - "loss": 0.0253, + "epoch": 0.12, + "learning_rate": 0.00028224619218913174, + "loss": 0.0295, "step": 23460 }, { - "epoch": 0.25, - "learning_rate": 0.00026194136342997987, - "loss": 0.027, + "epoch": 0.12, + "learning_rate": 0.0002822386244961177, + "loss": 0.0279, "step": 23470 }, { - "epoch": 0.25, - "learning_rate": 0.00026192514756437693, - "loss": 0.0263, + "epoch": 0.12, + "learning_rate": 0.00028223105680310375, + "loss": 0.0316, "step": 23480 }, { - "epoch": 0.25, - "learning_rate": 0.00026190893169877405, - "loss": 0.0268, + "epoch": 0.12, + "learning_rate": 0.00028222348911008974, + "loss": 0.0258, "step": 23490 }, { - "epoch": 0.25, - "learning_rate": 0.0002618927158331712, - "loss": 0.0408, + "epoch": 0.12, + "learning_rate": 0.0002822159214170757, + "loss": 0.0262, "step": 23500 }, { - "epoch": 0.25, - "learning_rate": 0.00026187649996756824, - "loss": 0.0305, + "epoch": 0.12, + "learning_rate": 0.0002822083537240617, + "loss": 0.033, "step": 23510 }, { - "epoch": 0.25, - "learning_rate": 0.00026186028410196536, - "loss": 0.027, + "epoch": 0.12, + "learning_rate": 0.0002822007860310477, + "loss": 0.0299, "step": 23520 }, { - "epoch": 0.25, - "learning_rate": 0.0002618440682363624, - "loss": 0.0306, + "epoch": 0.12, + "learning_rate": 0.00028219321833803366, + "loss": 0.0252, "step": 23530 }, { - "epoch": 0.25, - "learning_rate": 0.00026182785237075954, - "loss": 0.0336, + "epoch": 0.12, + "learning_rate": 0.00028218565064501964, + "loss": 0.0287, "step": 23540 }, { - "epoch": 0.25, - "learning_rate": 0.0002618116365051566, - "loss": 0.0327, + "epoch": 0.12, + "learning_rate": 0.0002821780829520057, + "loss": 0.1276, "step": 23550 }, { - "epoch": 0.25, - "learning_rate": 0.00026179542063955373, - "loss": 0.028, + "epoch": 0.12, + "learning_rate": 0.00028217051525899166, + "loss": 0.0328, "step": 23560 }, { - "epoch": 0.25, - "learning_rate": 0.0002617792047739508, - "loss": 0.0262, + "epoch": 0.12, + "learning_rate": 0.00028216294756597764, + "loss": 0.0346, "step": 23570 }, { - "epoch": 0.25, - "learning_rate": 0.0002617629889083479, - "loss": 0.0314, + "epoch": 0.12, + "learning_rate": 0.0002821553798729636, + "loss": 0.0323, "step": 23580 }, { - "epoch": 0.26, - "learning_rate": 0.000261746773042745, - "loss": 0.0295, + "epoch": 0.12, + "learning_rate": 0.0002821478121799496, + "loss": 0.0339, "step": 23590 }, { - "epoch": 0.26, - "learning_rate": 0.0002617305571771421, - "loss": 0.0256, + "epoch": 0.12, + "learning_rate": 0.0002821402444869356, + "loss": 0.0294, "step": 23600 }, { - "epoch": 0.26, - "learning_rate": 0.00026171434131153917, - "loss": 0.0263, + "epoch": 0.12, + "learning_rate": 0.0002821326767939216, + "loss": 0.0275, "step": 23610 }, { - "epoch": 0.26, - "learning_rate": 0.0002616981254459363, - "loss": 0.0272, + "epoch": 0.12, + "learning_rate": 0.0002821251091009076, + "loss": 0.0323, "step": 23620 }, { - "epoch": 0.26, - "learning_rate": 0.00026168190958033335, - "loss": 0.0237, + "epoch": 0.12, + "learning_rate": 0.0002821175414078936, + "loss": 0.0292, "step": 23630 }, { - "epoch": 0.26, - "learning_rate": 0.00026166569371473047, - "loss": 0.0305, + "epoch": 0.12, + "learning_rate": 0.00028210997371487957, + "loss": 0.0291, "step": 23640 }, { - "epoch": 0.26, - "learning_rate": 0.00026164947784912754, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.00028210240602186555, + "loss": 0.0379, "step": 23650 }, { - "epoch": 0.26, - "learning_rate": 0.00026163326198352466, - "loss": 0.0257, + "epoch": 0.12, + "learning_rate": 0.00028209483832885153, + "loss": 0.0279, "step": 23660 }, { - "epoch": 0.26, - "learning_rate": 0.0002616170461179217, - "loss": 0.0241, + "epoch": 0.12, + "learning_rate": 0.00028208727063583756, + "loss": 0.0226, "step": 23670 }, { - "epoch": 0.26, - "learning_rate": 0.00026160083025231884, - "loss": 0.0232, + "epoch": 0.12, + "learning_rate": 0.00028207970294282355, + "loss": 0.0285, "step": 23680 }, { - "epoch": 0.26, - "learning_rate": 0.00026158461438671596, - "loss": 0.0265, + "epoch": 0.12, + "learning_rate": 0.0002820721352498095, + "loss": 0.0275, "step": 23690 }, { - "epoch": 0.26, - "learning_rate": 0.00026156839852111303, - "loss": 0.0316, + "epoch": 0.12, + "learning_rate": 0.0002820645675567955, + "loss": 0.0252, "step": 23700 }, { - "epoch": 0.26, - "learning_rate": 0.0002615521826555101, - "loss": 0.0284, + "epoch": 0.12, + "learning_rate": 0.0002820569998637815, + "loss": 0.0279, "step": 23710 }, { - "epoch": 0.26, - "learning_rate": 0.0002615359667899072, - "loss": 0.025, + "epoch": 0.12, + "learning_rate": 0.00028204943217076747, + "loss": 0.0306, "step": 23720 }, { - "epoch": 0.26, - "learning_rate": 0.00026151975092430433, + "epoch": 0.12, + "learning_rate": 0.00028204186447775345, "loss": 0.0272, "step": 23730 }, { - "epoch": 0.26, - "learning_rate": 0.0002615035350587014, - "loss": 0.0241, + "epoch": 0.12, + "learning_rate": 0.0002820342967847395, + "loss": 0.0456, "step": 23740 }, { - "epoch": 0.26, - "learning_rate": 0.0002614873191930985, - "loss": 0.0252, + "epoch": 0.12, + "learning_rate": 0.00028202672909172547, + "loss": 0.0343, "step": 23750 }, { - "epoch": 0.26, - "learning_rate": 0.0002614711033274956, - "loss": 0.0222, + "epoch": 0.12, + "learning_rate": 0.00028201916139871145, + "loss": 0.0281, "step": 23760 }, { - "epoch": 0.26, - "learning_rate": 0.0002614548874618927, - "loss": 0.0227, + "epoch": 0.12, + "learning_rate": 0.00028201159370569743, + "loss": 0.0254, "step": 23770 }, { - "epoch": 0.26, - "learning_rate": 0.00026143867159628977, - "loss": 0.0225, + "epoch": 0.12, + "learning_rate": 0.0002820040260126834, + "loss": 0.0322, "step": 23780 }, { - "epoch": 0.26, - "learning_rate": 0.0002614224557306869, - "loss": 0.0233, + "epoch": 0.12, + "learning_rate": 0.0002819964583196694, + "loss": 0.03, "step": 23790 }, { - "epoch": 0.26, - "learning_rate": 0.00026140623986508396, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.00028198889062665543, + "loss": 0.0271, "step": 23800 }, { - "epoch": 0.26, - "learning_rate": 0.0002613900239994811, - "loss": 0.0234, + "epoch": 0.12, + "learning_rate": 0.0002819813229336414, + "loss": 0.029, "step": 23810 }, { - "epoch": 0.26, - "learning_rate": 0.0002613738081338782, - "loss": 0.0233, + "epoch": 0.12, + "learning_rate": 0.0002819737552406274, + "loss": 0.0246, "step": 23820 }, { - "epoch": 0.26, - "learning_rate": 0.00026135759226827526, - "loss": 0.027, + "epoch": 0.12, + "learning_rate": 0.0002819661875476134, + "loss": 0.0308, "step": 23830 }, { - "epoch": 0.26, - "learning_rate": 0.0002613413764026723, - "loss": 0.0448, + "epoch": 0.12, + "learning_rate": 0.00028195861985459936, + "loss": 0.027, "step": 23840 }, { - "epoch": 0.26, - "learning_rate": 0.00026132516053706945, - "loss": 0.0293, + "epoch": 0.12, + "learning_rate": 0.00028195105216158534, + "loss": 0.0289, "step": 23850 }, { - "epoch": 0.26, - "learning_rate": 0.00026130894467146657, - "loss": 0.0267, + "epoch": 0.12, + "learning_rate": 0.0002819434844685713, + "loss": 0.0263, "step": 23860 }, { - "epoch": 0.26, - "learning_rate": 0.00026129272880586363, - "loss": 0.0289, + "epoch": 0.12, + "learning_rate": 0.00028193591677555736, + "loss": 0.0278, "step": 23870 }, { - "epoch": 0.26, - "learning_rate": 0.0002612765129402607, - "loss": 0.0332, + "epoch": 0.12, + "learning_rate": 0.00028192834908254334, + "loss": 0.0247, "step": 23880 }, { - "epoch": 0.26, - "learning_rate": 0.0002612602970746578, - "loss": 0.0336, + "epoch": 0.12, + "learning_rate": 0.0002819207813895293, + "loss": 0.03, "step": 23890 }, { - "epoch": 0.26, - "learning_rate": 0.00026124408120905494, - "loss": 0.0275, + "epoch": 0.12, + "learning_rate": 0.0002819132136965153, + "loss": 0.031, "step": 23900 }, { - "epoch": 0.26, - "learning_rate": 0.000261227865343452, - "loss": 0.0261, + "epoch": 0.12, + "learning_rate": 0.0002819056460035013, + "loss": 0.0288, "step": 23910 }, { - "epoch": 0.26, - "learning_rate": 0.00026121164947784907, - "loss": 0.0259, + "epoch": 0.12, + "learning_rate": 0.00028189807831048726, + "loss": 0.0339, "step": 23920 }, { - "epoch": 0.26, - "learning_rate": 0.0002611954336122462, - "loss": 0.0236, + "epoch": 0.12, + "learning_rate": 0.0002818905106174733, + "loss": 0.0262, "step": 23930 }, { - "epoch": 0.26, - "learning_rate": 0.0002611792177466433, - "loss": 0.0238, + "epoch": 0.12, + "learning_rate": 0.0002818829429244593, + "loss": 0.0301, "step": 23940 }, { - "epoch": 0.26, - "learning_rate": 0.00026116300188104043, - "loss": 0.0291, + "epoch": 0.12, + "learning_rate": 0.00028187537523144526, + "loss": 0.0292, "step": 23950 }, { - "epoch": 0.26, - "learning_rate": 0.0002611467860154375, - "loss": 0.0276, + "epoch": 0.12, + "learning_rate": 0.00028186780753843124, + "loss": 0.0291, "step": 23960 }, { - "epoch": 0.26, - "learning_rate": 0.00026113057014983456, - "loss": 0.0274, + "epoch": 0.12, + "learning_rate": 0.0002818602398454172, + "loss": 0.0244, "step": 23970 }, { - "epoch": 0.26, - "learning_rate": 0.0002611143542842317, - "loss": 0.0258, + "epoch": 0.12, + "learning_rate": 0.0002818526721524032, + "loss": 0.0304, "step": 23980 }, { - "epoch": 0.26, - "learning_rate": 0.0002610981384186288, - "loss": 0.0264, + "epoch": 0.12, + "learning_rate": 0.00028184510445938924, + "loss": 0.0227, "step": 23990 }, { - "epoch": 0.26, - "learning_rate": 0.00026108192255302586, + "epoch": 0.12, + "learning_rate": 0.0002818375367663752, "loss": 0.0285, "step": 24000 }, { - "epoch": 0.26, - "eval_cer": 0.9215486495829838, - "eval_loss": 0.019064895808696747, - "eval_runtime": 119.9759, - "eval_samples_per_second": 16.67, - "eval_steps_per_second": 4.168, + "epoch": 0.12, + "eval_cer": 0.9144692855070369, + "eval_loss": 0.02072213776409626, + "eval_runtime": 117.2385, + "eval_samples_per_second": 17.059, + "eval_steps_per_second": 4.265, "step": 24000 }, { - "epoch": 0.26, - "learning_rate": 0.00026106570668742293, - "loss": 0.0229, + "epoch": 0.12, + "learning_rate": 0.0002818299690733612, + "loss": 0.0287, "step": 24010 }, { - "epoch": 0.26, - "learning_rate": 0.00026104949082182005, - "loss": 0.0273, + "epoch": 0.12, + "learning_rate": 0.0002818224013803472, + "loss": 0.0316, "step": 24020 }, { - "epoch": 0.26, - "learning_rate": 0.00026103327495621717, - "loss": 0.0242, + "epoch": 0.12, + "learning_rate": 0.00028181483368733317, + "loss": 0.0248, "step": 24030 }, { - "epoch": 0.26, - "learning_rate": 0.00026101705909061424, - "loss": 0.0285, + "epoch": 0.12, + "learning_rate": 0.00028180726599431915, + "loss": 0.0284, "step": 24040 }, { - "epoch": 0.26, - "learning_rate": 0.0002610008432250113, - "loss": 0.0284, + "epoch": 0.12, + "learning_rate": 0.00028179969830130513, + "loss": 0.0252, "step": 24050 }, { - "epoch": 0.26, - "learning_rate": 0.0002609846273594084, - "loss": 0.0254, + "epoch": 0.12, + "learning_rate": 0.00028179213060829117, + "loss": 0.0277, "step": 24060 }, { - "epoch": 0.26, - "learning_rate": 0.00026096841149380554, - "loss": 0.0238, + "epoch": 0.12, + "learning_rate": 0.00028178456291527715, + "loss": 0.0269, "step": 24070 }, { - "epoch": 0.26, - "learning_rate": 0.0002609521956282026, - "loss": 0.024, + "epoch": 0.12, + "learning_rate": 0.00028177699522226313, + "loss": 0.0237, "step": 24080 }, { - "epoch": 0.26, - "learning_rate": 0.0002609359797625997, - "loss": 0.0265, + "epoch": 0.12, + "learning_rate": 0.0002817694275292491, + "loss": 0.0218, "step": 24090 }, { - "epoch": 0.26, - "learning_rate": 0.0002609197638969968, - "loss": 0.0284, + "epoch": 0.12, + "learning_rate": 0.0002817618598362351, + "loss": 0.0265, "step": 24100 }, { - "epoch": 0.26, - "learning_rate": 0.0002609035480313939, - "loss": 0.0276, + "epoch": 0.12, + "learning_rate": 0.00028175429214322107, + "loss": 0.0265, "step": 24110 }, { - "epoch": 0.26, - "learning_rate": 0.000260887332165791, - "loss": 0.0275, + "epoch": 0.12, + "learning_rate": 0.0002817467244502071, + "loss": 0.0246, "step": 24120 }, { - "epoch": 0.26, - "learning_rate": 0.0002608711163001881, - "loss": 0.0306, + "epoch": 0.12, + "learning_rate": 0.0002817391567571931, + "loss": 0.032, "step": 24130 }, { - "epoch": 0.26, - "learning_rate": 0.00026085490043458516, - "loss": 0.027, + "epoch": 0.12, + "learning_rate": 0.00028173158906417907, + "loss": 0.0256, "step": 24140 }, { - "epoch": 0.26, - "learning_rate": 0.0002608386845689823, - "loss": 0.0293, + "epoch": 0.12, + "learning_rate": 0.00028172402137116505, + "loss": 0.028, "step": 24150 }, { - "epoch": 0.26, - "learning_rate": 0.00026082246870337935, - "loss": 0.0274, + "epoch": 0.12, + "learning_rate": 0.00028171645367815103, + "loss": 0.0244, "step": 24160 }, { - "epoch": 0.26, - "learning_rate": 0.00026080625283777647, - "loss": 0.0292, + "epoch": 0.12, + "learning_rate": 0.000281708885985137, + "loss": 0.0364, "step": 24170 }, { - "epoch": 0.26, - "learning_rate": 0.00026079003697217353, - "loss": 0.0254, + "epoch": 0.12, + "learning_rate": 0.000281701318292123, + "loss": 0.0286, "step": 24180 }, { - "epoch": 0.26, - "learning_rate": 0.00026077382110657065, - "loss": 0.0267, + "epoch": 0.12, + "learning_rate": 0.00028169375059910903, + "loss": 0.0318, "step": 24190 }, { - "epoch": 0.26, - "learning_rate": 0.0002607576052409677, - "loss": 0.0262, + "epoch": 0.12, + "learning_rate": 0.000281686182906095, + "loss": 0.027, "step": 24200 }, { - "epoch": 0.26, - "learning_rate": 0.00026074138937536484, - "loss": 0.0279, + "epoch": 0.12, + "learning_rate": 0.000281678615213081, + "loss": 0.0287, "step": 24210 }, { - "epoch": 0.26, - "learning_rate": 0.0002607251735097619, - "loss": 0.032, + "epoch": 0.12, + "learning_rate": 0.000281671047520067, + "loss": 0.0317, "step": 24220 }, { - "epoch": 0.26, - "learning_rate": 0.000260708957644159, - "loss": 0.0244, + "epoch": 0.12, + "learning_rate": 0.00028166347982705296, + "loss": 0.0302, "step": 24230 }, { - "epoch": 0.26, - "learning_rate": 0.0002606927417785561, - "loss": 0.0242, + "epoch": 0.12, + "learning_rate": 0.00028165591213403894, + "loss": 0.0272, "step": 24240 }, { - "epoch": 0.26, - "learning_rate": 0.0002606765259129532, - "loss": 0.0262, + "epoch": 0.12, + "learning_rate": 0.000281648344441025, + "loss": 0.0273, "step": 24250 }, { - "epoch": 0.26, - "learning_rate": 0.00026066031004735033, - "loss": 0.0232, + "epoch": 0.12, + "learning_rate": 0.00028164077674801096, + "loss": 0.0303, "step": 24260 }, { - "epoch": 0.26, - "learning_rate": 0.0002606440941817474, - "loss": 0.0265, + "epoch": 0.12, + "learning_rate": 0.00028163320905499694, + "loss": 0.0329, "step": 24270 }, { - "epoch": 0.26, - "learning_rate": 0.00026062787831614446, - "loss": 0.026, + "epoch": 0.12, + "learning_rate": 0.0002816256413619829, + "loss": 0.0332, "step": 24280 }, { - "epoch": 0.26, - "learning_rate": 0.0002606116624505416, - "loss": 0.0259, + "epoch": 0.12, + "learning_rate": 0.0002816180736689689, + "loss": 0.0362, "step": 24290 }, { - "epoch": 0.26, - "learning_rate": 0.0002605954465849387, - "loss": 0.0264, + "epoch": 0.12, + "learning_rate": 0.0002816105059759549, + "loss": 0.0304, "step": 24300 }, { - "epoch": 0.26, - "learning_rate": 0.00026057923071933577, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.0002816029382829409, + "loss": 0.0287, "step": 24310 }, { - "epoch": 0.26, - "learning_rate": 0.00026056301485373283, - "loss": 0.0276, - "step": 24320 + "epoch": 0.12, + "learning_rate": 0.0002815953705899269, + "loss": 0.0327, + "step": 24320 }, { - "epoch": 0.26, - "learning_rate": 0.00026054679898812995, - "loss": 0.0271, + "epoch": 0.12, + "learning_rate": 0.0002815878028969129, + "loss": 0.0282, "step": 24330 }, { - "epoch": 0.26, - "learning_rate": 0.00026053058312252707, - "loss": 0.0256, + "epoch": 0.12, + "learning_rate": 0.00028158023520389886, + "loss": 0.0288, "step": 24340 }, { - "epoch": 0.26, - "learning_rate": 0.00026051436725692414, - "loss": 0.0259, + "epoch": 0.12, + "learning_rate": 0.00028157266751088484, + "loss": 0.0349, "step": 24350 }, { - "epoch": 0.26, - "learning_rate": 0.0002604981513913212, - "loss": 0.0223, + "epoch": 0.12, + "learning_rate": 0.0002815650998178708, + "loss": 0.0319, "step": 24360 }, { - "epoch": 0.26, - "learning_rate": 0.0002604819355257183, - "loss": 0.0231, + "epoch": 0.12, + "learning_rate": 0.0002815575321248568, + "loss": 0.0286, "step": 24370 }, { - "epoch": 0.26, - "learning_rate": 0.00026046571966011544, - "loss": 0.0276, + "epoch": 0.12, + "learning_rate": 0.00028154996443184284, + "loss": 0.0275, "step": 24380 }, { - "epoch": 0.26, - "learning_rate": 0.00026044950379451256, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.0002815423967388288, + "loss": 0.0355, "step": 24390 }, { - "epoch": 0.26, - "learning_rate": 0.00026043328792890963, - "loss": 0.0226, + "epoch": 0.12, + "learning_rate": 0.0002815348290458148, + "loss": 0.0302, "step": 24400 }, { - "epoch": 0.26, - "learning_rate": 0.0002604170720633067, - "loss": 0.026, + "epoch": 0.12, + "learning_rate": 0.0002815272613528008, + "loss": 0.0293, "step": 24410 }, { - "epoch": 0.26, - "learning_rate": 0.0002604008561977038, - "loss": 0.0224, + "epoch": 0.12, + "learning_rate": 0.00028151969365978677, + "loss": 0.0315, "step": 24420 }, { - "epoch": 0.26, - "learning_rate": 0.00026038464033210093, - "loss": 0.0251, + "epoch": 0.12, + "learning_rate": 0.00028151212596677275, + "loss": 0.0235, "step": 24430 }, { - "epoch": 0.26, - "learning_rate": 0.000260368424466498, - "loss": 0.0275, + "epoch": 0.12, + "learning_rate": 0.0002815045582737588, + "loss": 0.0301, "step": 24440 }, { - "epoch": 0.26, - "learning_rate": 0.00026035220860089507, - "loss": 0.0268, + "epoch": 0.12, + "learning_rate": 0.00028149699058074477, + "loss": 0.029, "step": 24450 }, { - "epoch": 0.26, - "learning_rate": 0.0002603359927352922, - "loss": 0.0218, + "epoch": 0.12, + "learning_rate": 0.00028148942288773075, + "loss": 0.0302, "step": 24460 }, { - "epoch": 0.26, - "learning_rate": 0.0002603197768696893, - "loss": 0.0218, + "epoch": 0.12, + "learning_rate": 0.00028148185519471673, + "loss": 0.0273, "step": 24470 }, { - "epoch": 0.26, - "learning_rate": 0.00026030356100408637, - "loss": 0.0259, + "epoch": 0.12, + "learning_rate": 0.0002814742875017027, + "loss": 0.0269, "step": 24480 }, { - "epoch": 0.26, - "learning_rate": 0.00026028734513848344, - "loss": 0.0258, + "epoch": 0.12, + "learning_rate": 0.0002814667198086887, + "loss": 0.0247, "step": 24490 }, { - "epoch": 0.26, - "learning_rate": 0.00026027112927288056, - "loss": 0.0277, + "epoch": 0.12, + "learning_rate": 0.00028145915211567473, + "loss": 0.026, "step": 24500 }, { - "epoch": 0.26, - "learning_rate": 0.0002602549134072777, - "loss": 0.0236, + "epoch": 0.12, + "learning_rate": 0.00028145158442266066, + "loss": 0.0294, "step": 24510 }, { - "epoch": 0.27, - "learning_rate": 0.00026023869754167474, - "loss": 0.0223, + "epoch": 0.12, + "learning_rate": 0.00028144401672964664, + "loss": 0.0272, "step": 24520 }, { - "epoch": 0.27, - "learning_rate": 0.00026022248167607186, - "loss": 0.0299, + "epoch": 0.12, + "learning_rate": 0.0002814364490366326, + "loss": 0.0217, "step": 24530 }, { - "epoch": 0.27, - "learning_rate": 0.00026020626581046893, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.00028142888134361865, + "loss": 0.0293, "step": 24540 }, { - "epoch": 0.27, - "learning_rate": 0.00026019004994486605, - "loss": 0.0231, + "epoch": 0.12, + "learning_rate": 0.00028142131365060464, + "loss": 0.0248, "step": 24550 }, { - "epoch": 0.27, - "learning_rate": 0.00026017383407926317, - "loss": 0.022, + "epoch": 0.12, + "learning_rate": 0.0002814137459575906, + "loss": 0.0291, "step": 24560 }, { - "epoch": 0.27, - "learning_rate": 0.00026015761821366023, - "loss": 0.0283, + "epoch": 0.12, + "learning_rate": 0.0002814061782645766, + "loss": 0.0301, "step": 24570 }, { - "epoch": 0.27, - "learning_rate": 0.0002601414023480573, - "loss": 0.0256, + "epoch": 0.12, + "learning_rate": 0.0002813986105715626, + "loss": 0.027, "step": 24580 }, { - "epoch": 0.27, - "learning_rate": 0.0002601251864824544, - "loss": 0.0238, + "epoch": 0.12, + "learning_rate": 0.00028139104287854856, + "loss": 0.0261, "step": 24590 }, { - "epoch": 0.27, - "learning_rate": 0.00026010897061685154, - "loss": 0.0251, + "epoch": 0.12, + "learning_rate": 0.00028138347518553454, + "loss": 0.034, "step": 24600 }, { - "epoch": 0.27, - "learning_rate": 0.0002600927547512486, - "loss": 0.0264, + "epoch": 0.12, + "learning_rate": 0.0002813759074925206, + "loss": 0.028, "step": 24610 }, { - "epoch": 0.27, - "learning_rate": 0.00026007653888564567, - "loss": 0.03, + "epoch": 0.12, + "learning_rate": 0.00028136833979950656, + "loss": 0.0271, "step": 24620 }, { - "epoch": 0.27, - "learning_rate": 0.0002600603230200428, - "loss": 0.0245, + "epoch": 0.12, + "learning_rate": 0.00028136077210649254, + "loss": 0.0243, "step": 24630 }, { - "epoch": 0.27, - "learning_rate": 0.0002600441071544399, - "loss": 0.0227, + "epoch": 0.12, + "learning_rate": 0.0002813532044134785, + "loss": 0.0262, "step": 24640 }, { - "epoch": 0.27, - "learning_rate": 0.000260027891288837, - "loss": 0.0248, + "epoch": 0.12, + "learning_rate": 0.0002813456367204645, + "loss": 0.0321, "step": 24650 }, { - "epoch": 0.27, - "learning_rate": 0.00026001167542323404, - "loss": 0.03, + "epoch": 0.12, + "learning_rate": 0.0002813380690274505, + "loss": 0.0278, "step": 24660 }, { - "epoch": 0.27, - "learning_rate": 0.00025999545955763116, - "loss": 0.024, + "epoch": 0.12, + "learning_rate": 0.0002813305013344365, + "loss": 0.0268, "step": 24670 }, { - "epoch": 0.27, - "learning_rate": 0.0002599792436920283, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.0002813229336414225, + "loss": 0.0261, "step": 24680 }, { - "epoch": 0.27, - "learning_rate": 0.00025996302782642535, - "loss": 0.0231, + "epoch": 0.12, + "learning_rate": 0.0002813153659484085, + "loss": 0.0272, "step": 24690 }, { - "epoch": 0.27, - "learning_rate": 0.00025994681196082247, - "loss": 0.0296, + "epoch": 0.12, + "learning_rate": 0.00028130779825539447, + "loss": 0.0261, "step": 24700 }, { - "epoch": 0.27, - "learning_rate": 0.00025993059609521953, - "loss": 0.0241, + "epoch": 0.12, + "learning_rate": 0.00028130023056238045, + "loss": 0.0262, "step": 24710 }, { - "epoch": 0.27, - "learning_rate": 0.00025991438022961665, - "loss": 0.0223, + "epoch": 0.12, + "learning_rate": 0.00028129266286936643, + "loss": 0.0257, "step": 24720 }, { - "epoch": 0.27, - "learning_rate": 0.0002598981643640137, - "loss": 0.0225, + "epoch": 0.12, + "learning_rate": 0.00028128509517635246, + "loss": 0.0253, "step": 24730 }, { - "epoch": 0.27, - "learning_rate": 0.00025988194849841084, - "loss": 0.0282, + "epoch": 0.12, + "learning_rate": 0.00028127752748333845, + "loss": 0.0288, "step": 24740 }, { - "epoch": 0.27, - "learning_rate": 0.0002598657326328079, - "loss": 0.0279, + "epoch": 0.12, + "learning_rate": 0.0002812699597903244, + "loss": 0.0277, "step": 24750 }, { - "epoch": 0.27, - "learning_rate": 0.000259849516767205, - "loss": 0.0249, + "epoch": 0.12, + "learning_rate": 0.0002812623920973104, + "loss": 0.0255, "step": 24760 }, { - "epoch": 0.27, - "learning_rate": 0.0002598333009016021, - "loss": 0.0252, + "epoch": 0.12, + "learning_rate": 0.0002812548244042964, + "loss": 0.0246, "step": 24770 }, { - "epoch": 0.27, - "learning_rate": 0.0002598170850359992, - "loss": 0.0307, + "epoch": 0.13, + "learning_rate": 0.00028124725671128237, + "loss": 0.0251, "step": 24780 }, { - "epoch": 0.27, - "learning_rate": 0.00025980086917039627, - "loss": 0.0254, + "epoch": 0.13, + "learning_rate": 0.00028123968901826835, + "loss": 0.0291, "step": 24790 }, { - "epoch": 0.27, - "learning_rate": 0.0002597846533047934, - "loss": 0.025, + "epoch": 0.13, + "learning_rate": 0.0002812321213252544, + "loss": 0.0275, "step": 24800 }, { - "epoch": 0.27, - "learning_rate": 0.00025976843743919046, - "loss": 0.0263, + "epoch": 0.13, + "learning_rate": 0.00028122455363224037, + "loss": 0.0207, "step": 24810 }, { - "epoch": 0.27, - "learning_rate": 0.0002597522215735876, - "loss": 0.0244, + "epoch": 0.13, + "learning_rate": 0.00028121698593922635, + "loss": 0.023, "step": 24820 }, { - "epoch": 0.27, - "learning_rate": 0.0002597360057079847, - "loss": 0.0255, + "epoch": 0.13, + "learning_rate": 0.00028120941824621233, + "loss": 0.0244, "step": 24830 }, { - "epoch": 0.27, - "learning_rate": 0.00025971978984238176, - "loss": 0.0273, + "epoch": 0.13, + "learning_rate": 0.0002812018505531983, + "loss": 0.0243, "step": 24840 }, { - "epoch": 0.27, - "learning_rate": 0.00025970357397677883, - "loss": 0.0218, + "epoch": 0.13, + "learning_rate": 0.0002811942828601843, + "loss": 0.0252, "step": 24850 }, { - "epoch": 0.27, - "learning_rate": 0.00025968735811117595, - "loss": 0.0262, + "epoch": 0.13, + "learning_rate": 0.00028118671516717033, + "loss": 0.0266, "step": 24860 }, { - "epoch": 0.27, - "learning_rate": 0.00025967114224557307, - "loss": 0.0302, + "epoch": 0.13, + "learning_rate": 0.0002811791474741563, + "loss": 0.0278, "step": 24870 }, { - "epoch": 0.27, - "learning_rate": 0.00025965492637997013, - "loss": 0.0256, + "epoch": 0.13, + "learning_rate": 0.0002811715797811423, + "loss": 0.0258, "step": 24880 }, { - "epoch": 0.27, - "learning_rate": 0.0002596387105143672, - "loss": 0.0285, + "epoch": 0.13, + "learning_rate": 0.0002811640120881283, + "loss": 0.0303, "step": 24890 }, { - "epoch": 0.27, - "learning_rate": 0.0002596224946487643, - "loss": 0.0274, + "epoch": 0.13, + "learning_rate": 0.00028115644439511426, + "loss": 0.0255, "step": 24900 }, { - "epoch": 0.27, - "learning_rate": 0.00025960627878316144, - "loss": 0.027, + "epoch": 0.13, + "learning_rate": 0.00028114887670210024, + "loss": 0.0287, "step": 24910 }, { - "epoch": 0.27, - "learning_rate": 0.0002595900629175585, - "loss": 0.0244, + "epoch": 0.13, + "learning_rate": 0.0002811413090090862, + "loss": 0.0292, "step": 24920 }, { - "epoch": 0.27, - "learning_rate": 0.00025957384705195557, - "loss": 0.0329, + "epoch": 0.13, + "learning_rate": 0.00028113374131607226, + "loss": 0.0314, "step": 24930 }, { - "epoch": 0.27, - "learning_rate": 0.0002595576311863527, - "loss": 0.0289, + "epoch": 0.13, + "learning_rate": 0.00028112617362305824, + "loss": 0.0283, "step": 24940 }, { - "epoch": 0.27, - "learning_rate": 0.0002595414153207498, - "loss": 0.0278, + "epoch": 0.13, + "learning_rate": 0.0002811186059300442, + "loss": 0.0254, "step": 24950 }, { - "epoch": 0.27, - "learning_rate": 0.00025952519945514693, - "loss": 0.0292, + "epoch": 0.13, + "learning_rate": 0.0002811110382370302, + "loss": 0.0273, "step": 24960 }, { - "epoch": 0.27, - "learning_rate": 0.000259508983589544, - "loss": 0.028, + "epoch": 0.13, + "learning_rate": 0.0002811034705440162, + "loss": 0.0274, "step": 24970 }, { - "epoch": 0.27, - "learning_rate": 0.00025949276772394106, - "loss": 0.0306, + "epoch": 0.13, + "learning_rate": 0.00028109590285100216, + "loss": 0.0304, "step": 24980 }, { - "epoch": 0.27, - "learning_rate": 0.0002594765518583382, - "loss": 0.0266, + "epoch": 0.13, + "learning_rate": 0.0002810883351579882, + "loss": 0.0299, "step": 24990 }, { - "epoch": 0.27, - "learning_rate": 0.0002594603359927353, - "loss": 0.031, + "epoch": 0.13, + "learning_rate": 0.0002810807674649742, + "loss": 0.0289, "step": 25000 }, { - "epoch": 0.27, - "eval_cer": 0.9215703646568931, - "eval_loss": 0.019244205206632614, - "eval_runtime": 120.3576, - "eval_samples_per_second": 16.617, - "eval_steps_per_second": 4.154, + "epoch": 0.13, + "eval_cer": 0.9144751078837893, + "eval_loss": 0.01934368908405304, + "eval_runtime": 117.2646, + "eval_samples_per_second": 17.055, + "eval_steps_per_second": 4.264, "step": 25000 }, { - "epoch": 0.27, - "learning_rate": 0.00025944412012713237, - "loss": 0.0276, + "epoch": 0.13, + "learning_rate": 0.00028107319977196016, + "loss": 0.032, "step": 25010 }, { - "epoch": 0.27, - "learning_rate": 0.00025942790426152943, - "loss": 0.0269, + "epoch": 0.13, + "learning_rate": 0.00028106563207894614, + "loss": 0.0244, "step": 25020 }, { - "epoch": 0.27, - "learning_rate": 0.00025941168839592655, - "loss": 0.0284, + "epoch": 0.13, + "learning_rate": 0.0002810580643859321, + "loss": 0.0296, "step": 25030 }, { - "epoch": 0.27, - "learning_rate": 0.00025939547253032367, - "loss": 0.0237, + "epoch": 0.13, + "learning_rate": 0.0002810504966929181, + "loss": 0.0274, "step": 25040 }, { - "epoch": 0.27, - "learning_rate": 0.00025937925666472074, - "loss": 0.0266, + "epoch": 0.13, + "learning_rate": 0.00028104292899990414, + "loss": 0.0288, "step": 25050 }, { - "epoch": 0.27, - "learning_rate": 0.0002593630407991178, - "loss": 0.0272, + "epoch": 0.13, + "learning_rate": 0.0002810353613068901, + "loss": 0.0311, "step": 25060 }, { - "epoch": 0.27, - "learning_rate": 0.0002593468249335149, - "loss": 0.0241, + "epoch": 0.13, + "learning_rate": 0.0002810277936138761, + "loss": 0.0269, "step": 25070 }, { - "epoch": 0.27, - "learning_rate": 0.00025933060906791204, - "loss": 0.0298, + "epoch": 0.13, + "learning_rate": 0.0002810202259208621, + "loss": 0.0316, "step": 25080 }, { - "epoch": 0.27, - "learning_rate": 0.0002593143932023091, - "loss": 0.0354, + "epoch": 0.13, + "learning_rate": 0.00028101265822784807, + "loss": 0.0299, "step": 25090 }, { - "epoch": 0.27, - "learning_rate": 0.00025929817733670623, - "loss": 0.0274, + "epoch": 0.13, + "learning_rate": 0.00028100509053483405, + "loss": 0.0291, "step": 25100 }, { - "epoch": 0.27, - "learning_rate": 0.0002592819614711033, - "loss": 0.0265, + "epoch": 0.13, + "learning_rate": 0.00028099752284182003, + "loss": 0.0313, "step": 25110 }, { - "epoch": 0.27, - "learning_rate": 0.0002592657456055004, - "loss": 0.033, + "epoch": 0.13, + "learning_rate": 0.00028098995514880607, + "loss": 0.031, "step": 25120 }, { - "epoch": 0.27, - "learning_rate": 0.0002592495297398975, - "loss": 0.026, + "epoch": 0.13, + "learning_rate": 0.00028098238745579205, + "loss": 0.028, "step": 25130 }, { - "epoch": 0.27, - "learning_rate": 0.0002592333138742946, - "loss": 0.0254, + "epoch": 0.13, + "learning_rate": 0.00028097481976277803, + "loss": 0.025, "step": 25140 }, { - "epoch": 0.27, - "learning_rate": 0.00025921709800869167, - "loss": 0.0255, + "epoch": 0.13, + "learning_rate": 0.000280967252069764, + "loss": 0.0181, "step": 25150 }, { - "epoch": 0.27, - "learning_rate": 0.0002592008821430888, - "loss": 0.0277, + "epoch": 0.13, + "learning_rate": 0.00028095968437675, + "loss": 0.027, "step": 25160 }, { - "epoch": 0.27, - "learning_rate": 0.00025918466627748585, - "loss": 0.0233, + "epoch": 0.13, + "learning_rate": 0.00028095211668373597, + "loss": 0.0255, "step": 25170 }, { - "epoch": 0.27, - "learning_rate": 0.00025916845041188297, - "loss": 0.0255, + "epoch": 0.13, + "learning_rate": 0.000280944548990722, + "loss": 0.0309, "step": 25180 }, { - "epoch": 0.27, - "learning_rate": 0.00025915223454628004, - "loss": 0.0275, + "epoch": 0.13, + "learning_rate": 0.000280936981297708, + "loss": 0.0269, "step": 25190 }, { - "epoch": 0.27, - "learning_rate": 0.00025913601868067716, - "loss": 0.025, + "epoch": 0.13, + "learning_rate": 0.00028092941360469397, + "loss": 0.0306, "step": 25200 }, { - "epoch": 0.27, - "learning_rate": 0.0002591198028150743, - "loss": 0.0225, + "epoch": 0.13, + "learning_rate": 0.00028092184591167995, + "loss": 0.0282, "step": 25210 }, { - "epoch": 0.27, - "learning_rate": 0.00025910358694947134, - "loss": 0.0277, + "epoch": 0.13, + "learning_rate": 0.00028091427821866593, + "loss": 0.0253, "step": 25220 }, { - "epoch": 0.27, - "learning_rate": 0.0002590873710838684, - "loss": 0.0254, + "epoch": 0.13, + "learning_rate": 0.0002809067105256519, + "loss": 0.0256, "step": 25230 }, { - "epoch": 0.27, - "learning_rate": 0.00025907115521826553, - "loss": 0.0253, + "epoch": 0.13, + "learning_rate": 0.00028089914283263795, + "loss": 0.0316, "step": 25240 }, { - "epoch": 0.27, - "learning_rate": 0.00025905493935266265, - "loss": 0.0242, + "epoch": 0.13, + "learning_rate": 0.00028089157513962393, + "loss": 0.0256, "step": 25250 }, { - "epoch": 0.27, - "learning_rate": 0.0002590387234870597, - "loss": 0.0235, + "epoch": 0.13, + "learning_rate": 0.0002808840074466099, + "loss": 0.0257, "step": 25260 }, { - "epoch": 0.27, - "learning_rate": 0.00025902250762145683, - "loss": 0.0245, + "epoch": 0.13, + "learning_rate": 0.0002808764397535959, + "loss": 0.0248, "step": 25270 }, { - "epoch": 0.27, - "learning_rate": 0.0002590062917558539, - "loss": 0.0262, + "epoch": 0.13, + "learning_rate": 0.0002808688720605819, + "loss": 0.0261, "step": 25280 }, { - "epoch": 0.27, - "learning_rate": 0.000258990075890251, - "loss": 0.025, + "epoch": 0.13, + "learning_rate": 0.00028086130436756786, + "loss": 0.0283, "step": 25290 }, { - "epoch": 0.27, - "learning_rate": 0.0002589738600246481, - "loss": 0.0261, + "epoch": 0.13, + "learning_rate": 0.00028085373667455384, + "loss": 0.0252, "step": 25300 }, { - "epoch": 0.27, - "learning_rate": 0.0002589576441590452, - "loss": 0.0253, + "epoch": 0.13, + "learning_rate": 0.0002808461689815399, + "loss": 0.0266, "step": 25310 }, { - "epoch": 0.27, - "learning_rate": 0.00025894142829344227, - "loss": 0.0247, + "epoch": 0.13, + "learning_rate": 0.00028083860128852586, + "loss": 0.0215, "step": 25320 }, { - "epoch": 0.27, - "learning_rate": 0.0002589252124278394, - "loss": 0.0288, + "epoch": 0.13, + "learning_rate": 0.00028083103359551184, + "loss": 0.0299, "step": 25330 }, { - "epoch": 0.27, - "learning_rate": 0.00025890899656223646, - "loss": 0.0268, + "epoch": 0.13, + "learning_rate": 0.0002808234659024978, + "loss": 0.0243, "step": 25340 }, { - "epoch": 0.27, - "learning_rate": 0.0002588927806966336, - "loss": 0.026, + "epoch": 0.13, + "learning_rate": 0.0002808158982094838, + "loss": 0.0348, "step": 25350 }, { - "epoch": 0.27, - "learning_rate": 0.00025887656483103064, - "loss": 0.0252, + "epoch": 0.13, + "learning_rate": 0.0002808083305164698, + "loss": 0.0266, "step": 25360 }, { - "epoch": 0.27, - "learning_rate": 0.00025886034896542776, - "loss": 0.0243, + "epoch": 0.13, + "learning_rate": 0.0002808007628234558, + "loss": 0.0305, "step": 25370 }, { - "epoch": 0.27, - "learning_rate": 0.0002588441330998248, - "loss": 0.0242, + "epoch": 0.13, + "learning_rate": 0.0002807931951304418, + "loss": 0.0269, "step": 25380 }, { - "epoch": 0.27, - "learning_rate": 0.00025882791723422195, - "loss": 0.0268, + "epoch": 0.13, + "learning_rate": 0.0002807856274374278, + "loss": 0.0313, "step": 25390 }, { - "epoch": 0.27, - "learning_rate": 0.00025881170136861907, - "loss": 0.0222, + "epoch": 0.13, + "learning_rate": 0.00028077805974441376, + "loss": 0.03, "step": 25400 }, { - "epoch": 0.27, - "learning_rate": 0.00025879548550301613, - "loss": 0.0293, + "epoch": 0.13, + "learning_rate": 0.00028077049205139974, + "loss": 0.0283, "step": 25410 }, { - "epoch": 0.27, - "learning_rate": 0.0002587792696374132, - "loss": 0.0239, + "epoch": 0.13, + "learning_rate": 0.0002807629243583857, + "loss": 0.0247, "step": 25420 }, { - "epoch": 0.27, - "learning_rate": 0.0002587630537718103, - "loss": 0.0257, + "epoch": 0.13, + "learning_rate": 0.0002807553566653717, + "loss": 0.0282, "step": 25430 }, { - "epoch": 0.28, - "learning_rate": 0.00025874683790620744, - "loss": 0.0278, + "epoch": 0.13, + "learning_rate": 0.00028074778897235774, + "loss": 0.0228, "step": 25440 }, { - "epoch": 0.28, - "learning_rate": 0.0002587306220406045, - "loss": 0.0228, + "epoch": 0.13, + "learning_rate": 0.0002807402212793437, + "loss": 0.027, "step": 25450 }, { - "epoch": 0.28, - "learning_rate": 0.00025871440617500157, - "loss": 0.0241, + "epoch": 0.13, + "learning_rate": 0.0002807326535863297, + "loss": 0.0335, "step": 25460 }, { - "epoch": 0.28, - "learning_rate": 0.0002586981903093987, - "loss": 0.0282, + "epoch": 0.13, + "learning_rate": 0.0002807250858933157, + "loss": 0.0284, "step": 25470 }, { - "epoch": 0.28, - "learning_rate": 0.0002586819744437958, - "loss": 0.0208, + "epoch": 0.13, + "learning_rate": 0.00028071751820030167, + "loss": 0.03, "step": 25480 }, { - "epoch": 0.28, - "learning_rate": 0.0002586657585781929, - "loss": 0.0233, + "epoch": 0.13, + "learning_rate": 0.00028070995050728765, + "loss": 0.0267, "step": 25490 }, { - "epoch": 0.28, - "learning_rate": 0.00025864954271258994, - "loss": 0.0212, + "epoch": 0.13, + "learning_rate": 0.0002807023828142737, + "loss": 0.0261, "step": 25500 }, { - "epoch": 0.28, - "learning_rate": 0.00025863332684698706, - "loss": 0.024, + "epoch": 0.13, + "learning_rate": 0.00028069481512125967, + "loss": 0.0282, "step": 25510 }, { - "epoch": 0.28, - "learning_rate": 0.0002586171109813842, - "loss": 0.0255, + "epoch": 0.13, + "learning_rate": 0.00028068724742824565, + "loss": 0.0257, "step": 25520 }, { - "epoch": 0.28, - "learning_rate": 0.00025860089511578124, - "loss": 0.0315, + "epoch": 0.13, + "learning_rate": 0.00028067967973523163, + "loss": 0.0275, "step": 25530 }, { - "epoch": 0.28, - "learning_rate": 0.00025858467925017836, - "loss": 0.0256, + "epoch": 0.13, + "learning_rate": 0.0002806721120422176, + "loss": 0.0248, "step": 25540 }, { - "epoch": 0.28, - "learning_rate": 0.00025856846338457543, - "loss": 0.0263, + "epoch": 0.13, + "learning_rate": 0.0002806645443492036, + "loss": 0.0252, "step": 25550 }, { - "epoch": 0.28, - "learning_rate": 0.00025855224751897255, - "loss": 0.0252, + "epoch": 0.13, + "learning_rate": 0.00028065697665618963, + "loss": 0.0278, "step": 25560 }, { - "epoch": 0.28, - "learning_rate": 0.00025853603165336967, - "loss": 0.0228, + "epoch": 0.13, + "learning_rate": 0.0002806494089631756, + "loss": 0.0305, "step": 25570 }, { - "epoch": 0.28, - "learning_rate": 0.00025851981578776674, - "loss": 0.0229, + "epoch": 0.13, + "learning_rate": 0.0002806418412701616, + "loss": 0.0253, "step": 25580 }, { - "epoch": 0.28, - "learning_rate": 0.0002585035999221638, - "loss": 0.0274, + "epoch": 0.13, + "learning_rate": 0.00028063427357714757, + "loss": 0.0302, "step": 25590 }, { - "epoch": 0.28, - "learning_rate": 0.0002584873840565609, - "loss": 0.0268, + "epoch": 0.13, + "learning_rate": 0.00028062670588413355, + "loss": 0.0312, "step": 25600 }, { - "epoch": 0.28, - "learning_rate": 0.00025847116819095804, - "loss": 0.0292, + "epoch": 0.13, + "learning_rate": 0.00028061913819111954, + "loss": 0.0293, "step": 25610 }, { - "epoch": 0.28, - "learning_rate": 0.0002584549523253551, - "loss": 0.0276, + "epoch": 0.13, + "learning_rate": 0.0002806115704981055, + "loss": 0.0286, "step": 25620 }, { - "epoch": 0.28, - "learning_rate": 0.00025843873645975217, - "loss": 0.0248, + "epoch": 0.13, + "learning_rate": 0.00028060400280509155, + "loss": 0.0266, "step": 25630 }, { - "epoch": 0.28, - "learning_rate": 0.0002584225205941493, - "loss": 0.0257, + "epoch": 0.13, + "learning_rate": 0.00028059643511207753, + "loss": 0.0245, "step": 25640 }, { - "epoch": 0.28, - "learning_rate": 0.0002584063047285464, - "loss": 0.0283, + "epoch": 0.13, + "learning_rate": 0.0002805888674190635, + "loss": 0.0277, "step": 25650 }, { - "epoch": 0.28, - "learning_rate": 0.0002583900888629435, - "loss": 0.0327, + "epoch": 0.13, + "learning_rate": 0.0002805812997260495, + "loss": 0.0281, "step": 25660 }, { - "epoch": 0.28, - "learning_rate": 0.00025837387299734054, - "loss": 0.046, + "epoch": 0.13, + "learning_rate": 0.0002805737320330355, + "loss": 0.0347, "step": 25670 }, { - "epoch": 0.28, - "learning_rate": 0.00025835765713173766, - "loss": 0.0337, + "epoch": 0.13, + "learning_rate": 0.00028056616434002146, + "loss": 0.0276, "step": 25680 }, { - "epoch": 0.28, - "learning_rate": 0.0002583414412661348, - "loss": 0.0251, + "epoch": 0.13, + "learning_rate": 0.0002805585966470075, + "loss": 0.03, "step": 25690 }, { - "epoch": 0.28, - "learning_rate": 0.00025832522540053185, - "loss": 0.0266, + "epoch": 0.13, + "learning_rate": 0.0002805510289539935, + "loss": 0.0271, "step": 25700 }, { - "epoch": 0.28, - "learning_rate": 0.00025830900953492897, - "loss": 0.0259, + "epoch": 0.13, + "learning_rate": 0.00028054346126097946, + "loss": 0.0377, "step": 25710 }, { - "epoch": 0.28, - "learning_rate": 0.00025829279366932603, - "loss": 0.0251, + "epoch": 0.13, + "learning_rate": 0.00028053589356796544, + "loss": 0.0605, "step": 25720 }, { - "epoch": 0.28, - "learning_rate": 0.00025827657780372315, - "loss": 0.0282, + "epoch": 0.13, + "learning_rate": 0.0002805283258749514, + "loss": 0.032, "step": 25730 }, { - "epoch": 0.28, - "learning_rate": 0.0002582603619381202, - "loss": 0.025, + "epoch": 0.13, + "learning_rate": 0.0002805207581819374, + "loss": 0.0337, "step": 25740 }, { - "epoch": 0.28, - "learning_rate": 0.00025824414607251734, - "loss": 0.0273, + "epoch": 0.13, + "learning_rate": 0.00028051319048892344, + "loss": 0.0272, "step": 25750 }, { - "epoch": 0.28, - "learning_rate": 0.0002582279302069144, - "loss": 0.0252, + "epoch": 0.13, + "learning_rate": 0.0002805056227959094, + "loss": 0.0316, "step": 25760 }, { - "epoch": 0.28, - "learning_rate": 0.0002582117143413115, - "loss": 0.0192, + "epoch": 0.13, + "learning_rate": 0.00028049805510289535, + "loss": 0.0249, "step": 25770 }, { - "epoch": 0.28, - "learning_rate": 0.0002581954984757086, - "loss": 0.026, + "epoch": 0.13, + "learning_rate": 0.00028049048740988133, + "loss": 0.0272, "step": 25780 }, { - "epoch": 0.28, - "learning_rate": 0.0002581792826101057, - "loss": 0.0234, + "epoch": 0.13, + "learning_rate": 0.00028048291971686736, + "loss": 0.0345, "step": 25790 }, { - "epoch": 0.28, - "learning_rate": 0.0002581630667445028, - "loss": 0.0299, + "epoch": 0.13, + "learning_rate": 0.00028047535202385335, + "loss": 0.0284, "step": 25800 }, { - "epoch": 0.28, - "learning_rate": 0.0002581468508788999, - "loss": 0.0289, + "epoch": 0.13, + "learning_rate": 0.00028046778433083933, + "loss": 0.0267, "step": 25810 }, { - "epoch": 0.28, - "learning_rate": 0.00025813063501329696, - "loss": 0.0294, + "epoch": 0.13, + "learning_rate": 0.0002804602166378253, + "loss": 0.0271, "step": 25820 }, { - "epoch": 0.28, - "learning_rate": 0.0002581144191476941, - "loss": 0.029, + "epoch": 0.13, + "learning_rate": 0.0002804526489448113, + "loss": 0.0298, "step": 25830 }, { - "epoch": 0.28, - "learning_rate": 0.0002580982032820912, - "loss": 0.0276, + "epoch": 0.13, + "learning_rate": 0.00028044508125179727, + "loss": 0.0277, "step": 25840 }, { - "epoch": 0.28, - "learning_rate": 0.00025808198741648827, - "loss": 0.0252, + "epoch": 0.13, + "learning_rate": 0.00028043751355878325, + "loss": 0.0267, "step": 25850 }, { - "epoch": 0.28, - "learning_rate": 0.00025806577155088533, - "loss": 0.0265, + "epoch": 0.13, + "learning_rate": 0.0002804299458657693, + "loss": 0.0267, "step": 25860 }, { - "epoch": 0.28, - "learning_rate": 0.00025804955568528245, - "loss": 0.0256, + "epoch": 0.13, + "learning_rate": 0.00028042237817275527, + "loss": 0.024, "step": 25870 }, { - "epoch": 0.28, - "learning_rate": 0.00025803333981967957, - "loss": 0.0313, + "epoch": 0.13, + "learning_rate": 0.00028041481047974125, + "loss": 0.0263, "step": 25880 }, { - "epoch": 0.28, - "learning_rate": 0.00025801712395407664, - "loss": 0.0267, + "epoch": 0.13, + "learning_rate": 0.00028040724278672723, + "loss": 0.0284, "step": 25890 }, { - "epoch": 0.28, - "learning_rate": 0.00025800090808847376, - "loss": 0.0272, + "epoch": 0.13, + "learning_rate": 0.0002803996750937132, + "loss": 0.0283, "step": 25900 }, { - "epoch": 0.28, - "learning_rate": 0.0002579846922228708, - "loss": 0.0244, + "epoch": 0.13, + "learning_rate": 0.0002803921074006992, + "loss": 0.0398, "step": 25910 }, { - "epoch": 0.28, - "learning_rate": 0.00025796847635726794, - "loss": 0.0233, + "epoch": 0.13, + "learning_rate": 0.00028038453970768523, + "loss": 0.0498, "step": 25920 }, { - "epoch": 0.28, - "learning_rate": 0.000257952260491665, - "loss": 0.0215, + "epoch": 0.13, + "learning_rate": 0.0002803769720146712, + "loss": 0.03, "step": 25930 }, { - "epoch": 0.28, - "learning_rate": 0.00025793604462606213, - "loss": 0.0247, + "epoch": 0.13, + "learning_rate": 0.0002803694043216572, + "loss": 0.0254, "step": 25940 }, { - "epoch": 0.28, - "learning_rate": 0.0002579198287604592, - "loss": 0.0214, + "epoch": 0.13, + "learning_rate": 0.0002803618366286432, + "loss": 0.027, "step": 25950 }, { - "epoch": 0.28, - "learning_rate": 0.0002579036128948563, - "loss": 0.0236, + "epoch": 0.13, + "learning_rate": 0.00028035426893562916, + "loss": 0.0304, "step": 25960 }, { - "epoch": 0.28, - "learning_rate": 0.00025788739702925343, - "loss": 0.0249, + "epoch": 0.13, + "learning_rate": 0.00028034670124261514, + "loss": 0.0237, "step": 25970 }, { - "epoch": 0.28, - "learning_rate": 0.0002578711811636505, - "loss": 0.0248, + "epoch": 0.13, + "learning_rate": 0.0002803391335496011, + "loss": 0.0255, "step": 25980 }, { - "epoch": 0.28, - "learning_rate": 0.00025785496529804756, - "loss": 0.0227, + "epoch": 0.13, + "learning_rate": 0.00028033156585658716, + "loss": 0.0223, "step": 25990 }, { - "epoch": 0.28, - "learning_rate": 0.0002578387494324447, - "loss": 0.0267, + "epoch": 0.13, + "learning_rate": 0.00028032399816357314, + "loss": 0.0258, "step": 26000 }, { - "epoch": 0.28, - "eval_cer": 0.9215616786273294, - "eval_loss": 0.018755970522761345, - "eval_runtime": 120.1496, - "eval_samples_per_second": 16.646, - "eval_steps_per_second": 4.161, + "epoch": 0.13, + "eval_cer": 0.9144799598644162, + "eval_loss": 0.019629212096333504, + "eval_runtime": 117.332, + "eval_samples_per_second": 17.046, + "eval_steps_per_second": 4.261, "step": 26000 }, { - "epoch": 0.28, - "learning_rate": 0.0002578225335668418, - "loss": 0.0251, + "epoch": 0.13, + "learning_rate": 0.0002803164304705591, + "loss": 0.0294, "step": 26010 }, { - "epoch": 0.28, - "learning_rate": 0.00025780631770123887, - "loss": 0.0249, + "epoch": 0.13, + "learning_rate": 0.0002803088627775451, + "loss": 0.028, "step": 26020 }, { - "epoch": 0.28, - "learning_rate": 0.00025779010183563594, - "loss": 0.0247, + "epoch": 0.13, + "learning_rate": 0.0002803012950845311, + "loss": 0.0272, "step": 26030 }, { - "epoch": 0.28, - "learning_rate": 0.00025777388597003306, - "loss": 0.0351, + "epoch": 0.13, + "learning_rate": 0.00028029372739151706, + "loss": 0.0292, "step": 26040 }, { - "epoch": 0.28, - "learning_rate": 0.0002577576701044302, - "loss": 0.0259, + "epoch": 0.13, + "learning_rate": 0.0002802861596985031, + "loss": 0.0327, "step": 26050 }, { - "epoch": 0.28, - "learning_rate": 0.00025774145423882724, - "loss": 0.0276, + "epoch": 0.13, + "learning_rate": 0.0002802785920054891, + "loss": 0.0273, "step": 26060 }, { - "epoch": 0.28, - "learning_rate": 0.0002577252383732243, - "loss": 0.0274, + "epoch": 0.13, + "learning_rate": 0.00028027102431247506, + "loss": 0.0342, "step": 26070 }, { - "epoch": 0.28, - "learning_rate": 0.0002577090225076214, - "loss": 0.0235, + "epoch": 0.13, + "learning_rate": 0.00028026345661946104, + "loss": 0.0319, "step": 26080 }, { - "epoch": 0.28, - "learning_rate": 0.00025769280664201855, - "loss": 0.0275, + "epoch": 0.13, + "learning_rate": 0.000280255888926447, + "loss": 0.031, "step": 26090 }, { - "epoch": 0.28, - "learning_rate": 0.0002576765907764156, - "loss": 0.0268, + "epoch": 0.13, + "learning_rate": 0.000280248321233433, + "loss": 0.0213, "step": 26100 }, { - "epoch": 0.28, - "learning_rate": 0.00025766037491081273, - "loss": 0.0259, + "epoch": 0.13, + "learning_rate": 0.00028024075354041904, + "loss": 0.0271, "step": 26110 }, { - "epoch": 0.28, - "learning_rate": 0.0002576441590452098, - "loss": 0.0272, + "epoch": 0.13, + "learning_rate": 0.000280233185847405, + "loss": 0.0279, "step": 26120 }, { - "epoch": 0.28, - "learning_rate": 0.0002576279431796069, - "loss": 0.0223, + "epoch": 0.13, + "learning_rate": 0.000280225618154391, + "loss": 0.0244, "step": 26130 }, { - "epoch": 0.28, - "learning_rate": 0.00025761172731400404, - "loss": 0.0254, + "epoch": 0.13, + "learning_rate": 0.000280218050461377, + "loss": 0.0294, "step": 26140 }, { - "epoch": 0.28, - "learning_rate": 0.0002575955114484011, - "loss": 0.0241, + "epoch": 0.13, + "learning_rate": 0.00028021048276836297, + "loss": 0.0253, "step": 26150 }, { - "epoch": 0.28, - "learning_rate": 0.00025757929558279817, - "loss": 0.0237, + "epoch": 0.13, + "learning_rate": 0.00028020291507534895, + "loss": 0.0221, "step": 26160 }, { - "epoch": 0.28, - "learning_rate": 0.0002575630797171953, - "loss": 0.025, + "epoch": 0.13, + "learning_rate": 0.00028019534738233493, + "loss": 0.0235, "step": 26170 }, { - "epoch": 0.28, - "learning_rate": 0.0002575468638515924, - "loss": 0.0225, + "epoch": 0.13, + "learning_rate": 0.00028018777968932097, + "loss": 0.0256, "step": 26180 }, { - "epoch": 0.28, - "learning_rate": 0.0002575306479859895, - "loss": 0.0248, + "epoch": 0.13, + "learning_rate": 0.00028018021199630695, + "loss": 0.0281, "step": 26190 }, { - "epoch": 0.28, - "learning_rate": 0.00025751443212038654, - "loss": 0.0234, + "epoch": 0.13, + "learning_rate": 0.00028017264430329293, + "loss": 0.0277, "step": 26200 }, { - "epoch": 0.28, - "learning_rate": 0.00025749821625478366, - "loss": 0.0257, + "epoch": 0.13, + "learning_rate": 0.0002801650766102789, + "loss": 0.0247, "step": 26210 }, { - "epoch": 0.28, - "learning_rate": 0.0002574820003891808, - "loss": 0.0234, + "epoch": 0.13, + "learning_rate": 0.0002801575089172649, + "loss": 0.0251, "step": 26220 }, { - "epoch": 0.28, - "learning_rate": 0.00025746578452357784, - "loss": 0.027, + "epoch": 0.13, + "learning_rate": 0.0002801499412242509, + "loss": 0.0261, "step": 26230 }, { - "epoch": 0.28, - "learning_rate": 0.0002574495686579749, - "loss": 0.0261, + "epoch": 0.13, + "learning_rate": 0.0002801423735312369, + "loss": 0.0286, "step": 26240 }, { - "epoch": 0.28, - "learning_rate": 0.00025743335279237203, - "loss": 0.0206, + "epoch": 0.13, + "learning_rate": 0.0002801348058382229, + "loss": 0.0289, "step": 26250 }, { - "epoch": 0.28, - "learning_rate": 0.00025741713692676915, - "loss": 0.0221, + "epoch": 0.13, + "learning_rate": 0.00028012723814520887, + "loss": 0.0265, "step": 26260 }, { - "epoch": 0.28, - "learning_rate": 0.0002574009210611662, - "loss": 0.0269, + "epoch": 0.13, + "learning_rate": 0.00028011967045219485, + "loss": 0.0294, "step": 26270 }, { - "epoch": 0.28, - "learning_rate": 0.00025738470519556334, - "loss": 0.0274, + "epoch": 0.13, + "learning_rate": 0.00028011210275918083, + "loss": 0.0306, "step": 26280 }, { - "epoch": 0.28, - "learning_rate": 0.0002573684893299604, - "loss": 0.0232, + "epoch": 0.13, + "learning_rate": 0.0002801045350661668, + "loss": 0.0267, "step": 26290 }, { - "epoch": 0.28, - "learning_rate": 0.0002573522734643575, - "loss": 0.0258, + "epoch": 0.13, + "learning_rate": 0.00028009696737315285, + "loss": 0.0307, "step": 26300 }, { - "epoch": 0.28, - "learning_rate": 0.0002573360575987546, - "loss": 0.0267, + "epoch": 0.13, + "learning_rate": 0.00028008939968013883, + "loss": 0.027, "step": 26310 }, { - "epoch": 0.28, - "learning_rate": 0.0002573198417331517, - "loss": 0.0257, + "epoch": 0.13, + "learning_rate": 0.0002800818319871248, + "loss": 0.0289, "step": 26320 }, { - "epoch": 0.28, - "learning_rate": 0.00025730362586754877, + "epoch": 0.13, + "learning_rate": 0.0002800742642941108, "loss": 0.0275, "step": 26330 }, { - "epoch": 0.28, - "learning_rate": 0.0002572874100019459, - "loss": 0.0222, + "epoch": 0.13, + "learning_rate": 0.0002800666966010968, + "loss": 0.0258, "step": 26340 }, { - "epoch": 0.28, - "learning_rate": 0.00025727119413634296, - "loss": 0.0248, + "epoch": 0.13, + "learning_rate": 0.00028005912890808276, + "loss": 0.0311, "step": 26350 }, { - "epoch": 0.28, - "learning_rate": 0.0002572549782707401, - "loss": 0.0227, + "epoch": 0.13, + "learning_rate": 0.00028005156121506874, + "loss": 0.0253, "step": 26360 }, { - "epoch": 0.29, - "learning_rate": 0.00025723876240513714, - "loss": 0.0276, + "epoch": 0.13, + "learning_rate": 0.0002800439935220548, + "loss": 0.0236, "step": 26370 }, { - "epoch": 0.29, - "learning_rate": 0.00025722254653953426, - "loss": 0.0216, + "epoch": 0.13, + "learning_rate": 0.00028003642582904076, + "loss": 0.0235, "step": 26380 }, { - "epoch": 0.29, - "learning_rate": 0.00025720633067393133, - "loss": 0.0216, + "epoch": 0.13, + "learning_rate": 0.00028002885813602674, + "loss": 0.0272, "step": 26390 }, { - "epoch": 0.29, - "learning_rate": 0.00025719011480832845, - "loss": 0.0253, + "epoch": 0.13, + "learning_rate": 0.0002800212904430127, + "loss": 0.0229, "step": 26400 }, { - "epoch": 0.29, - "learning_rate": 0.00025717389894272557, - "loss": 0.0278, + "epoch": 0.13, + "learning_rate": 0.0002800137227499987, + "loss": 0.0255, "step": 26410 }, { - "epoch": 0.29, - "learning_rate": 0.00025715768307712263, - "loss": 0.0285, + "epoch": 0.13, + "learning_rate": 0.0002800061550569847, + "loss": 0.0301, "step": 26420 }, { - "epoch": 0.29, - "learning_rate": 0.0002571414672115197, - "loss": 0.023, + "epoch": 0.13, + "learning_rate": 0.0002799985873639707, + "loss": 0.0259, "step": 26430 }, { - "epoch": 0.29, - "learning_rate": 0.0002571252513459168, - "loss": 0.0252, + "epoch": 0.13, + "learning_rate": 0.0002799910196709567, + "loss": 0.0226, "step": 26440 }, { - "epoch": 0.29, - "learning_rate": 0.00025710903548031394, - "loss": 0.0229, + "epoch": 0.13, + "learning_rate": 0.0002799834519779427, + "loss": 0.0285, "step": 26450 }, { - "epoch": 0.29, - "learning_rate": 0.000257092819614711, - "loss": 0.023, + "epoch": 0.13, + "learning_rate": 0.00027997588428492866, + "loss": 0.0286, "step": 26460 }, { - "epoch": 0.29, - "learning_rate": 0.00025707660374910807, - "loss": 0.0252, + "epoch": 0.13, + "learning_rate": 0.00027996831659191464, + "loss": 0.027, "step": 26470 }, { - "epoch": 0.29, - "learning_rate": 0.0002570603878835052, - "loss": 0.0227, + "epoch": 0.13, + "learning_rate": 0.0002799607488989006, + "loss": 0.0276, "step": 26480 }, { - "epoch": 0.29, - "learning_rate": 0.0002570441720179023, - "loss": 0.0236, + "epoch": 0.13, + "learning_rate": 0.0002799531812058866, + "loss": 0.0285, "step": 26490 }, { - "epoch": 0.29, - "learning_rate": 0.0002570279561522994, - "loss": 0.0263, + "epoch": 0.13, + "learning_rate": 0.00027994561351287264, + "loss": 0.0327, "step": 26500 }, { - "epoch": 0.29, - "learning_rate": 0.00025701174028669644, - "loss": 0.0218, + "epoch": 0.13, + "learning_rate": 0.0002799380458198586, + "loss": 0.0265, "step": 26510 }, { - "epoch": 0.29, - "learning_rate": 0.00025699552442109356, - "loss": 0.0238, + "epoch": 0.13, + "learning_rate": 0.0002799304781268446, + "loss": 0.0286, "step": 26520 }, { - "epoch": 0.29, - "learning_rate": 0.0002569793085554907, - "loss": 0.0318, + "epoch": 0.13, + "learning_rate": 0.0002799229104338306, + "loss": 0.0261, "step": 26530 }, { - "epoch": 0.29, - "learning_rate": 0.00025696309268988775, - "loss": 0.0265, + "epoch": 0.13, + "learning_rate": 0.00027991534274081657, + "loss": 0.0244, "step": 26540 }, { - "epoch": 0.29, - "learning_rate": 0.00025694687682428487, - "loss": 0.0272, + "epoch": 0.13, + "learning_rate": 0.00027990777504780255, + "loss": 0.0262, "step": 26550 }, { - "epoch": 0.29, - "learning_rate": 0.00025693066095868193, - "loss": 0.03, + "epoch": 0.13, + "learning_rate": 0.0002799002073547886, + "loss": 0.0246, "step": 26560 }, { - "epoch": 0.29, - "learning_rate": 0.00025691444509307905, - "loss": 0.0232, + "epoch": 0.13, + "learning_rate": 0.00027989263966177457, + "loss": 0.0241, "step": 26570 }, { - "epoch": 0.29, - "learning_rate": 0.00025689822922747617, - "loss": 0.0275, + "epoch": 0.13, + "learning_rate": 0.00027988507196876055, + "loss": 0.0267, "step": 26580 }, { - "epoch": 0.29, - "learning_rate": 0.00025688201336187324, - "loss": 0.022, + "epoch": 0.13, + "learning_rate": 0.00027987750427574653, + "loss": 0.0271, "step": 26590 }, { - "epoch": 0.29, - "learning_rate": 0.0002568657974962703, - "loss": 0.0226, + "epoch": 0.13, + "learning_rate": 0.0002798699365827325, + "loss": 0.0289, "step": 26600 }, { - "epoch": 0.29, - "learning_rate": 0.0002568495816306674, - "loss": 0.022, + "epoch": 0.13, + "learning_rate": 0.0002798623688897185, + "loss": 0.0224, "step": 26610 }, { - "epoch": 0.29, - "learning_rate": 0.00025683336576506454, - "loss": 0.0205, + "epoch": 0.13, + "learning_rate": 0.00027985480119670453, + "loss": 0.0345, "step": 26620 }, { - "epoch": 0.29, - "learning_rate": 0.0002568171498994616, - "loss": 0.0238, + "epoch": 0.13, + "learning_rate": 0.0002798472335036905, + "loss": 0.0268, "step": 26630 }, { - "epoch": 0.29, - "learning_rate": 0.0002568009340338587, - "loss": 0.0247, + "epoch": 0.13, + "learning_rate": 0.0002798396658106765, + "loss": 0.0274, "step": 26640 }, { - "epoch": 0.29, - "learning_rate": 0.0002567847181682558, - "loss": 0.0244, + "epoch": 0.13, + "learning_rate": 0.0002798320981176625, + "loss": 0.0272, "step": 26650 }, { - "epoch": 0.29, - "learning_rate": 0.0002567685023026529, - "loss": 0.0237, + "epoch": 0.13, + "learning_rate": 0.00027982453042464845, + "loss": 0.0246, "step": 26660 }, { - "epoch": 0.29, - "learning_rate": 0.00025675228643705, - "loss": 0.0238, + "epoch": 0.13, + "learning_rate": 0.00027981696273163444, + "loss": 0.0257, "step": 26670 }, { - "epoch": 0.29, - "learning_rate": 0.00025673607057144705, - "loss": 0.0202, + "epoch": 0.13, + "learning_rate": 0.0002798093950386204, + "loss": 0.0251, "step": 26680 }, { - "epoch": 0.29, - "learning_rate": 0.00025671985470584417, - "loss": 0.021, + "epoch": 0.13, + "learning_rate": 0.00027980182734560645, + "loss": 0.0335, "step": 26690 }, { - "epoch": 0.29, - "learning_rate": 0.0002567036388402413, - "loss": 0.0244, + "epoch": 0.13, + "learning_rate": 0.00027979425965259243, + "loss": 0.0317, "step": 26700 }, { - "epoch": 0.29, - "learning_rate": 0.0002566874229746384, - "loss": 0.0269, + "epoch": 0.13, + "learning_rate": 0.0002797866919595784, + "loss": 0.029, "step": 26710 }, { - "epoch": 0.29, - "learning_rate": 0.00025667120710903547, - "loss": 0.0263, + "epoch": 0.13, + "learning_rate": 0.0002797791242665644, + "loss": 0.0285, "step": 26720 }, { - "epoch": 0.29, - "learning_rate": 0.00025665499124343254, - "loss": 0.0287, + "epoch": 0.13, + "learning_rate": 0.0002797715565735504, + "loss": 0.0266, "step": 26730 }, { - "epoch": 0.29, - "learning_rate": 0.00025663877537782966, - "loss": 0.0214, + "epoch": 0.13, + "learning_rate": 0.00027976398888053636, + "loss": 0.0233, "step": 26740 }, { - "epoch": 0.29, - "learning_rate": 0.0002566225595122268, - "loss": 0.0286, + "epoch": 0.13, + "learning_rate": 0.0002797564211875224, + "loss": 0.0269, "step": 26750 }, { - "epoch": 0.29, - "learning_rate": 0.00025660634364662384, - "loss": 0.0279, + "epoch": 0.14, + "learning_rate": 0.0002797488534945084, + "loss": 0.0241, "step": 26760 }, { - "epoch": 0.29, - "learning_rate": 0.0002565901277810209, - "loss": 0.0235, + "epoch": 0.14, + "learning_rate": 0.00027974128580149436, + "loss": 0.0285, "step": 26770 }, { - "epoch": 0.29, - "learning_rate": 0.000256573911915418, - "loss": 0.0215, + "epoch": 0.14, + "learning_rate": 0.00027973371810848034, + "loss": 0.0314, "step": 26780 }, { - "epoch": 0.29, - "learning_rate": 0.00025655769604981515, - "loss": 0.0342, + "epoch": 0.14, + "learning_rate": 0.0002797261504154663, + "loss": 0.0305, "step": 26790 }, { - "epoch": 0.29, - "learning_rate": 0.0002565414801842122, - "loss": 0.0287, + "epoch": 0.14, + "learning_rate": 0.0002797185827224523, + "loss": 0.0261, "step": 26800 }, { - "epoch": 0.29, - "learning_rate": 0.0002565252643186093, - "loss": 0.0253, + "epoch": 0.14, + "learning_rate": 0.00027971101502943834, + "loss": 0.0316, "step": 26810 }, { - "epoch": 0.29, - "learning_rate": 0.0002565090484530064, - "loss": 0.0221, + "epoch": 0.14, + "learning_rate": 0.0002797034473364243, + "loss": 0.0237, "step": 26820 }, { - "epoch": 0.29, - "learning_rate": 0.0002564928325874035, - "loss": 0.0242, + "epoch": 0.14, + "learning_rate": 0.0002796958796434103, + "loss": 0.0287, "step": 26830 }, { - "epoch": 0.29, - "learning_rate": 0.0002564766167218006, - "loss": 0.0248, + "epoch": 0.14, + "learning_rate": 0.0002796883119503963, + "loss": 0.024, "step": 26840 }, { - "epoch": 0.29, - "learning_rate": 0.0002564604008561977, - "loss": 0.0224, + "epoch": 0.14, + "learning_rate": 0.00027968074425738226, + "loss": 0.0314, "step": 26850 }, { - "epoch": 0.29, - "learning_rate": 0.00025644418499059477, - "loss": 0.0213, + "epoch": 0.14, + "learning_rate": 0.00027967317656436825, + "loss": 0.0315, "step": 26860 }, { - "epoch": 0.29, - "learning_rate": 0.0002564279691249919, - "loss": 0.0215, - "step": 26870 + "epoch": 0.14, + "learning_rate": 0.00027966560887135423, + "loss": 0.0268, + "step": 26870 }, { - "epoch": 0.29, - "learning_rate": 0.00025641175325938895, - "loss": 0.0267, + "epoch": 0.14, + "learning_rate": 0.00027965804117834026, + "loss": 0.0279, "step": 26880 }, { - "epoch": 0.29, - "learning_rate": 0.0002563955373937861, - "loss": 0.0316, + "epoch": 0.14, + "learning_rate": 0.00027965047348532624, + "loss": 0.0324, "step": 26890 }, { - "epoch": 0.29, - "learning_rate": 0.00025637932152818314, - "loss": 0.0238, + "epoch": 0.14, + "learning_rate": 0.0002796429057923122, + "loss": 0.0249, "step": 26900 }, { - "epoch": 0.29, - "learning_rate": 0.00025636310566258026, - "loss": 0.0269, + "epoch": 0.14, + "learning_rate": 0.0002796353380992982, + "loss": 0.0301, "step": 26910 }, { - "epoch": 0.29, - "learning_rate": 0.0002563468897969773, - "loss": 0.0244, + "epoch": 0.14, + "learning_rate": 0.0002796277704062842, + "loss": 0.0246, "step": 26920 }, { - "epoch": 0.29, - "learning_rate": 0.00025633067393137445, - "loss": 0.0217, + "epoch": 0.14, + "learning_rate": 0.00027962020271327017, + "loss": 0.0289, "step": 26930 }, { - "epoch": 0.29, - "learning_rate": 0.0002563144580657715, - "loss": 0.0233, + "epoch": 0.14, + "learning_rate": 0.0002796126350202562, + "loss": 0.0264, "step": 26940 }, { - "epoch": 0.29, - "learning_rate": 0.00025629824220016863, - "loss": 0.0256, + "epoch": 0.14, + "learning_rate": 0.0002796050673272422, + "loss": 0.0234, "step": 26950 }, { - "epoch": 0.29, - "learning_rate": 0.0002562820263345657, - "loss": 0.0215, + "epoch": 0.14, + "learning_rate": 0.00027959749963422817, + "loss": 0.0335, "step": 26960 }, { - "epoch": 0.29, - "learning_rate": 0.0002562658104689628, - "loss": 0.0255, + "epoch": 0.14, + "learning_rate": 0.00027958993194121415, + "loss": 0.0256, "step": 26970 }, { - "epoch": 0.29, - "learning_rate": 0.00025624959460335994, - "loss": 0.0216, + "epoch": 0.14, + "learning_rate": 0.00027958236424820013, + "loss": 0.0356, "step": 26980 }, { - "epoch": 0.29, - "learning_rate": 0.000256233378737757, - "loss": 0.0233, + "epoch": 0.14, + "learning_rate": 0.0002795747965551861, + "loss": 0.0252, "step": 26990 }, { - "epoch": 0.29, - "learning_rate": 0.00025621716287215407, - "loss": 0.0245, + "epoch": 0.14, + "learning_rate": 0.0002795672288621721, + "loss": 0.0255, "step": 27000 }, { - "epoch": 0.29, - "eval_cer": 0.9215590728184603, - "eval_loss": 0.017664359882473946, - "eval_runtime": 120.4378, - "eval_samples_per_second": 16.606, - "eval_steps_per_second": 4.152, + "epoch": 0.14, + "eval_cer": 0.9144469663961525, + "eval_loss": 0.020766137167811394, + "eval_runtime": 117.1709, + "eval_samples_per_second": 17.069, + "eval_steps_per_second": 4.267, "step": 27000 }, { - "epoch": 0.29, - "learning_rate": 0.0002562009470065512, - "loss": 0.0323, + "epoch": 0.14, + "learning_rate": 0.00027955966116915813, + "loss": 0.0269, "step": 27010 }, { - "epoch": 0.29, - "learning_rate": 0.0002561847311409483, - "loss": 0.0263, + "epoch": 0.14, + "learning_rate": 0.0002795520934761441, + "loss": 0.0345, "step": 27020 }, { - "epoch": 0.29, - "learning_rate": 0.00025616851527534537, - "loss": 0.0228, + "epoch": 0.14, + "learning_rate": 0.00027954452578313004, + "loss": 0.0293, "step": 27030 }, { - "epoch": 0.29, - "learning_rate": 0.00025615229940974244, - "loss": 0.0333, + "epoch": 0.14, + "learning_rate": 0.0002795369580901161, + "loss": 0.0293, "step": 27040 }, { - "epoch": 0.29, - "learning_rate": 0.00025613608354413956, - "loss": 0.0262, + "epoch": 0.14, + "learning_rate": 0.00027952939039710206, + "loss": 0.0265, "step": 27050 }, { - "epoch": 0.29, - "learning_rate": 0.0002561198676785367, - "loss": 0.0223, + "epoch": 0.14, + "learning_rate": 0.00027952182270408804, + "loss": 0.0272, "step": 27060 }, { - "epoch": 0.29, - "learning_rate": 0.00025610365181293374, - "loss": 0.0242, + "epoch": 0.14, + "learning_rate": 0.000279514255011074, + "loss": 0.0266, "step": 27070 }, { - "epoch": 0.29, - "learning_rate": 0.0002560874359473308, - "loss": 0.0293, + "epoch": 0.14, + "learning_rate": 0.00027950668731806, + "loss": 0.0241, "step": 27080 }, { - "epoch": 0.29, - "learning_rate": 0.00025607122008172793, - "loss": 0.0271, + "epoch": 0.14, + "learning_rate": 0.000279499119625046, + "loss": 0.0265, "step": 27090 }, { - "epoch": 0.29, - "learning_rate": 0.00025605500421612505, - "loss": 0.0202, + "epoch": 0.14, + "learning_rate": 0.00027949155193203196, + "loss": 0.0272, "step": 27100 }, { - "epoch": 0.29, - "learning_rate": 0.0002560387883505221, - "loss": 0.0247, + "epoch": 0.14, + "learning_rate": 0.000279483984239018, + "loss": 0.033, "step": 27110 }, { - "epoch": 0.29, - "learning_rate": 0.00025602257248491923, - "loss": 0.0321, + "epoch": 0.14, + "learning_rate": 0.000279476416546004, + "loss": 0.0283, "step": 27120 }, { - "epoch": 0.29, - "learning_rate": 0.0002560063566193163, - "loss": 0.0203, + "epoch": 0.14, + "learning_rate": 0.00027946884885298996, + "loss": 0.0311, "step": 27130 }, { - "epoch": 0.29, - "learning_rate": 0.0002559901407537134, - "loss": 0.0247, + "epoch": 0.14, + "learning_rate": 0.00027946128115997594, + "loss": 0.0304, "step": 27140 }, { - "epoch": 0.29, - "learning_rate": 0.00025597392488811054, - "loss": 0.0242, + "epoch": 0.14, + "learning_rate": 0.0002794537134669619, + "loss": 0.0269, "step": 27150 }, { - "epoch": 0.29, - "learning_rate": 0.0002559577090225076, - "loss": 0.027, + "epoch": 0.14, + "learning_rate": 0.0002794461457739479, + "loss": 0.0238, "step": 27160 }, { - "epoch": 0.29, - "learning_rate": 0.00025594149315690467, - "loss": 0.0283, + "epoch": 0.14, + "learning_rate": 0.00027943857808093394, + "loss": 0.0255, "step": 27170 }, { - "epoch": 0.29, - "learning_rate": 0.0002559252772913018, - "loss": 0.0251, + "epoch": 0.14, + "learning_rate": 0.0002794310103879199, + "loss": 0.0229, "step": 27180 }, { - "epoch": 0.29, - "learning_rate": 0.0002559090614256989, - "loss": 0.0242, + "epoch": 0.14, + "learning_rate": 0.0002794234426949059, + "loss": 0.026, "step": 27190 }, { - "epoch": 0.29, - "learning_rate": 0.000255892845560096, - "loss": 0.0212, + "epoch": 0.14, + "learning_rate": 0.0002794158750018919, + "loss": 0.0263, "step": 27200 }, { - "epoch": 0.29, - "learning_rate": 0.00025587662969449304, - "loss": 0.0241, + "epoch": 0.14, + "learning_rate": 0.00027940830730887787, + "loss": 0.0264, "step": 27210 }, { - "epoch": 0.29, - "learning_rate": 0.00025586041382889016, - "loss": 0.025, + "epoch": 0.14, + "learning_rate": 0.00027940073961586385, + "loss": 0.0274, "step": 27220 }, { - "epoch": 0.29, - "learning_rate": 0.0002558441979632873, + "epoch": 0.14, + "learning_rate": 0.00027939317192284983, "loss": 0.0254, "step": 27230 }, { - "epoch": 0.29, - "learning_rate": 0.00025582798209768435, - "loss": 0.0288, + "epoch": 0.14, + "learning_rate": 0.00027938560422983587, + "loss": 0.0266, "step": 27240 }, { - "epoch": 0.29, - "learning_rate": 0.0002558117662320814, - "loss": 0.0271, + "epoch": 0.14, + "learning_rate": 0.00027937803653682185, + "loss": 0.0252, "step": 27250 }, { - "epoch": 0.29, - "learning_rate": 0.00025579555036647853, - "loss": 0.0226, + "epoch": 0.14, + "learning_rate": 0.00027937046884380783, + "loss": 0.0275, "step": 27260 }, { - "epoch": 0.29, - "learning_rate": 0.00025577933450087565, - "loss": 0.026, + "epoch": 0.14, + "learning_rate": 0.0002793629011507938, + "loss": 0.023, "step": 27270 }, { - "epoch": 0.29, - "learning_rate": 0.0002557631186352727, - "loss": 0.0226, + "epoch": 0.14, + "learning_rate": 0.0002793553334577798, + "loss": 0.0264, "step": 27280 }, { - "epoch": 0.3, - "learning_rate": 0.00025574690276966984, - "loss": 0.0251, + "epoch": 0.14, + "learning_rate": 0.0002793477657647658, + "loss": 0.0249, "step": 27290 }, { - "epoch": 0.3, - "learning_rate": 0.0002557306869040669, - "loss": 0.0262, + "epoch": 0.14, + "learning_rate": 0.0002793401980717518, + "loss": 0.0292, "step": 27300 }, { - "epoch": 0.3, - "learning_rate": 0.000255714471038464, - "loss": 0.0222, + "epoch": 0.14, + "learning_rate": 0.0002793326303787378, + "loss": 0.0271, "step": 27310 }, { - "epoch": 0.3, - "learning_rate": 0.0002556982551728611, - "loss": 0.0232, + "epoch": 0.14, + "learning_rate": 0.00027932506268572377, + "loss": 0.0252, "step": 27320 }, { - "epoch": 0.3, - "learning_rate": 0.0002556820393072582, - "loss": 0.0246, + "epoch": 0.14, + "learning_rate": 0.00027931749499270975, + "loss": 0.0293, "step": 27330 }, { - "epoch": 0.3, - "learning_rate": 0.0002556658234416553, - "loss": 0.0257, + "epoch": 0.14, + "learning_rate": 0.00027930992729969573, + "loss": 0.027, "step": 27340 }, { - "epoch": 0.3, - "learning_rate": 0.0002556496075760524, - "loss": 0.0235, + "epoch": 0.14, + "learning_rate": 0.0002793023596066817, + "loss": 0.0279, "step": 27350 }, { - "epoch": 0.3, - "learning_rate": 0.0002556333917104495, - "loss": 0.0239, + "epoch": 0.14, + "learning_rate": 0.00027929479191366775, + "loss": 0.0275, "step": 27360 }, { - "epoch": 0.3, - "learning_rate": 0.0002556171758448466, - "loss": 0.0233, + "epoch": 0.14, + "learning_rate": 0.00027928722422065373, + "loss": 0.0384, "step": 27370 }, { - "epoch": 0.3, - "learning_rate": 0.00025560095997924365, - "loss": 0.0227, + "epoch": 0.14, + "learning_rate": 0.0002792796565276397, + "loss": 0.0245, "step": 27380 }, { - "epoch": 0.3, - "learning_rate": 0.00025558474411364077, - "loss": 0.0265, + "epoch": 0.14, + "learning_rate": 0.0002792720888346257, + "loss": 0.0309, "step": 27390 }, { - "epoch": 0.3, - "learning_rate": 0.0002555685282480379, - "loss": 0.0242, + "epoch": 0.14, + "learning_rate": 0.0002792645211416117, + "loss": 0.0259, "step": 27400 }, { - "epoch": 0.3, - "learning_rate": 0.00025555231238243495, - "loss": 0.0227, + "epoch": 0.14, + "learning_rate": 0.00027925695344859766, + "loss": 0.0272, "step": 27410 }, { - "epoch": 0.3, - "learning_rate": 0.00025553609651683207, - "loss": 0.0225, + "epoch": 0.14, + "learning_rate": 0.00027924938575558364, + "loss": 0.0263, "step": 27420 }, { - "epoch": 0.3, - "learning_rate": 0.00025551988065122914, - "loss": 0.0227, + "epoch": 0.14, + "learning_rate": 0.0002792418180625697, + "loss": 0.0229, "step": 27430 }, { - "epoch": 0.3, - "learning_rate": 0.00025550366478562626, - "loss": 0.0249, + "epoch": 0.14, + "learning_rate": 0.00027923425036955566, + "loss": 0.0285, "step": 27440 }, { - "epoch": 0.3, - "learning_rate": 0.0002554874489200233, - "loss": 0.0255, + "epoch": 0.14, + "learning_rate": 0.00027922668267654164, + "loss": 0.0271, "step": 27450 }, { - "epoch": 0.3, - "learning_rate": 0.00025547123305442044, - "loss": 0.0302, + "epoch": 0.14, + "learning_rate": 0.0002792191149835276, + "loss": 0.0283, "step": 27460 }, { - "epoch": 0.3, - "learning_rate": 0.0002554550171888175, - "loss": 0.024, + "epoch": 0.14, + "learning_rate": 0.0002792115472905136, + "loss": 0.0266, "step": 27470 }, { - "epoch": 0.3, - "learning_rate": 0.00025543880132321463, - "loss": 0.0228, + "epoch": 0.14, + "learning_rate": 0.0002792039795974996, + "loss": 0.0267, "step": 27480 }, { - "epoch": 0.3, - "learning_rate": 0.0002554225854576117, - "loss": 0.0266, + "epoch": 0.14, + "learning_rate": 0.0002791964119044856, + "loss": 0.0275, "step": 27490 }, { - "epoch": 0.3, - "learning_rate": 0.0002554063695920088, - "loss": 0.0254, + "epoch": 0.14, + "learning_rate": 0.0002791888442114716, + "loss": 0.0313, "step": 27500 }, { - "epoch": 0.3, - "learning_rate": 0.0002553901537264059, - "loss": 0.0244, + "epoch": 0.14, + "learning_rate": 0.0002791812765184576, + "loss": 0.0277, "step": 27510 }, { - "epoch": 0.3, - "learning_rate": 0.000255373937860803, - "loss": 0.0232, + "epoch": 0.14, + "learning_rate": 0.00027917370882544356, + "loss": 0.0307, "step": 27520 }, { - "epoch": 0.3, - "learning_rate": 0.00025535772199520006, - "loss": 0.029, + "epoch": 0.14, + "learning_rate": 0.00027916614113242954, + "loss": 0.0735, "step": 27530 }, { - "epoch": 0.3, - "learning_rate": 0.0002553415061295972, - "loss": 0.027, + "epoch": 0.14, + "learning_rate": 0.0002791585734394155, + "loss": 0.0338, "step": 27540 }, { - "epoch": 0.3, - "learning_rate": 0.00025532529026399425, - "loss": 0.0252, + "epoch": 0.14, + "learning_rate": 0.00027915100574640156, + "loss": 0.0304, "step": 27550 }, { - "epoch": 0.3, - "learning_rate": 0.00025530907439839137, - "loss": 0.0227, + "epoch": 0.14, + "learning_rate": 0.00027914343805338754, + "loss": 0.036, "step": 27560 }, { - "epoch": 0.3, - "learning_rate": 0.00025529285853278844, - "loss": 0.0267, + "epoch": 0.14, + "learning_rate": 0.0002791358703603735, + "loss": 0.0325, "step": 27570 }, { - "epoch": 0.3, - "learning_rate": 0.00025527664266718555, - "loss": 0.0244, + "epoch": 0.14, + "learning_rate": 0.0002791283026673595, + "loss": 0.0392, "step": 27580 }, { - "epoch": 0.3, - "learning_rate": 0.0002552604268015827, - "loss": 0.0238, + "epoch": 0.14, + "learning_rate": 0.0002791207349743455, + "loss": 0.0254, "step": 27590 }, { - "epoch": 0.3, - "learning_rate": 0.00025524421093597974, - "loss": 0.0246, + "epoch": 0.14, + "learning_rate": 0.00027911316728133147, + "loss": 0.0372, "step": 27600 }, { - "epoch": 0.3, - "learning_rate": 0.0002552279950703768, - "loss": 0.025, + "epoch": 0.14, + "learning_rate": 0.00027910559958831745, + "loss": 0.0293, "step": 27610 }, { - "epoch": 0.3, - "learning_rate": 0.0002552117792047739, - "loss": 0.0227, + "epoch": 0.14, + "learning_rate": 0.0002790980318953035, + "loss": 0.0353, "step": 27620 }, { - "epoch": 0.3, - "learning_rate": 0.00025519556333917105, - "loss": 0.0232, + "epoch": 0.14, + "learning_rate": 0.00027909046420228947, + "loss": 0.0362, "step": 27630 }, { - "epoch": 0.3, - "learning_rate": 0.0002551793474735681, - "loss": 0.0238, + "epoch": 0.14, + "learning_rate": 0.00027908289650927545, + "loss": 0.0291, "step": 27640 }, { - "epoch": 0.3, - "learning_rate": 0.0002551631316079652, - "loss": 0.0234, + "epoch": 0.14, + "learning_rate": 0.00027907532881626143, + "loss": 0.0336, "step": 27650 }, { - "epoch": 0.3, - "learning_rate": 0.0002551469157423623, - "loss": 0.0238, + "epoch": 0.14, + "learning_rate": 0.0002790677611232474, + "loss": 0.0239, "step": 27660 }, { - "epoch": 0.3, - "learning_rate": 0.0002551306998767594, - "loss": 0.024, + "epoch": 0.14, + "learning_rate": 0.0002790601934302334, + "loss": 0.0268, "step": 27670 }, { - "epoch": 0.3, - "learning_rate": 0.0002551144840111565, - "loss": 0.0281, + "epoch": 0.14, + "learning_rate": 0.00027905262573721943, + "loss": 0.026, "step": 27680 }, { - "epoch": 0.3, - "learning_rate": 0.00025509826814555355, - "loss": 0.0207, + "epoch": 0.14, + "learning_rate": 0.0002790450580442054, + "loss": 0.0304, "step": 27690 }, { - "epoch": 0.3, - "learning_rate": 0.00025508205227995067, - "loss": 0.0234, + "epoch": 0.14, + "learning_rate": 0.0002790374903511914, + "loss": 0.0298, "step": 27700 }, { - "epoch": 0.3, - "learning_rate": 0.0002550658364143478, - "loss": 0.0245, + "epoch": 0.14, + "learning_rate": 0.0002790299226581774, + "loss": 0.0302, "step": 27710 }, { - "epoch": 0.3, - "learning_rate": 0.0002550496205487449, - "loss": 0.0264, + "epoch": 0.14, + "learning_rate": 0.00027902235496516335, + "loss": 0.0229, "step": 27720 }, { - "epoch": 0.3, - "learning_rate": 0.000255033404683142, - "loss": 0.026, + "epoch": 0.14, + "learning_rate": 0.00027901478727214934, + "loss": 0.0303, "step": 27730 }, { - "epoch": 0.3, - "learning_rate": 0.00025501718881753904, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.0002790072195791353, + "loss": 0.0267, "step": 27740 }, { - "epoch": 0.3, - "learning_rate": 0.00025500097295193616, - "loss": 0.0187, + "epoch": 0.14, + "learning_rate": 0.00027899965188612135, + "loss": 0.0317, "step": 27750 }, { - "epoch": 0.3, - "learning_rate": 0.0002549847570863333, - "loss": 0.0244, + "epoch": 0.14, + "learning_rate": 0.00027899208419310733, + "loss": 0.028, "step": 27760 }, { - "epoch": 0.3, - "learning_rate": 0.00025496854122073034, - "loss": 0.0238, + "epoch": 0.14, + "learning_rate": 0.0002789845165000933, + "loss": 0.0281, "step": 27770 }, { - "epoch": 0.3, - "learning_rate": 0.0002549523253551274, - "loss": 0.0228, + "epoch": 0.14, + "learning_rate": 0.0002789769488070793, + "loss": 0.0298, "step": 27780 }, { - "epoch": 0.3, - "learning_rate": 0.00025493610948952453, - "loss": 0.022, + "epoch": 0.14, + "learning_rate": 0.0002789693811140653, + "loss": 0.0308, "step": 27790 }, { - "epoch": 0.3, - "learning_rate": 0.00025491989362392165, - "loss": 0.0254, + "epoch": 0.14, + "learning_rate": 0.00027896181342105126, + "loss": 0.0301, "step": 27800 }, { - "epoch": 0.3, - "learning_rate": 0.0002549036777583187, - "loss": 0.0215, + "epoch": 0.14, + "learning_rate": 0.0002789542457280373, + "loss": 0.0275, "step": 27810 }, { - "epoch": 0.3, - "learning_rate": 0.0002548874618927158, - "loss": 0.0284, + "epoch": 0.14, + "learning_rate": 0.0002789466780350233, + "loss": 0.0259, "step": 27820 }, { - "epoch": 0.3, - "learning_rate": 0.0002548712460271129, - "loss": 0.0236, + "epoch": 0.14, + "learning_rate": 0.00027893911034200926, + "loss": 0.0266, "step": 27830 }, { - "epoch": 0.3, - "learning_rate": 0.00025485503016151, - "loss": 0.0243, + "epoch": 0.14, + "learning_rate": 0.00027893154264899524, + "loss": 0.022, "step": 27840 }, { - "epoch": 0.3, - "learning_rate": 0.0002548388142959071, - "loss": 0.0248, + "epoch": 0.14, + "learning_rate": 0.0002789239749559812, + "loss": 0.0281, "step": 27850 }, { - "epoch": 0.3, - "learning_rate": 0.0002548225984303042, - "loss": 0.0246, + "epoch": 0.14, + "learning_rate": 0.0002789164072629672, + "loss": 0.0254, "step": 27860 }, { - "epoch": 0.3, - "learning_rate": 0.00025480638256470127, - "loss": 0.0272, + "epoch": 0.14, + "learning_rate": 0.00027890883956995324, + "loss": 0.0222, "step": 27870 }, { - "epoch": 0.3, - "learning_rate": 0.0002547901666990984, - "loss": 0.0238, + "epoch": 0.14, + "learning_rate": 0.0002789012718769392, + "loss": 0.0244, "step": 27880 }, { - "epoch": 0.3, - "learning_rate": 0.00025477395083349546, - "loss": 0.0222, + "epoch": 0.14, + "learning_rate": 0.0002788937041839252, + "loss": 0.023, "step": 27890 }, { - "epoch": 0.3, - "learning_rate": 0.0002547577349678926, - "loss": 0.0243, + "epoch": 0.14, + "learning_rate": 0.0002788861364909112, + "loss": 0.0324, "step": 27900 }, { - "epoch": 0.3, - "learning_rate": 0.00025474151910228964, - "loss": 0.0211, + "epoch": 0.14, + "learning_rate": 0.00027887856879789716, + "loss": 0.025, "step": 27910 }, { - "epoch": 0.3, - "learning_rate": 0.00025472530323668676, - "loss": 0.0344, + "epoch": 0.14, + "learning_rate": 0.00027887100110488315, + "loss": 0.0321, "step": 27920 }, { - "epoch": 0.3, - "learning_rate": 0.00025470908737108383, - "loss": 0.0302, + "epoch": 0.14, + "learning_rate": 0.00027886343341186913, + "loss": 0.0259, "step": 27930 }, { - "epoch": 0.3, - "learning_rate": 0.00025469287150548095, - "loss": 0.0305, + "epoch": 0.14, + "learning_rate": 0.00027885586571885516, + "loss": 0.0302, "step": 27940 }, { - "epoch": 0.3, - "learning_rate": 0.000254676655639878, - "loss": 0.0264, + "epoch": 0.14, + "learning_rate": 0.00027884829802584114, + "loss": 0.0277, "step": 27950 }, { - "epoch": 0.3, - "learning_rate": 0.00025466043977427513, - "loss": 0.0285, + "epoch": 0.14, + "learning_rate": 0.0002788407303328271, + "loss": 0.0261, "step": 27960 }, { - "epoch": 0.3, - "learning_rate": 0.0002546442239086722, - "loss": 0.027, + "epoch": 0.14, + "learning_rate": 0.0002788331626398131, + "loss": 0.0243, "step": 27970 }, { - "epoch": 0.3, - "learning_rate": 0.0002546280080430693, - "loss": 0.0242, + "epoch": 0.14, + "learning_rate": 0.0002788255949467991, + "loss": 0.0271, "step": 27980 }, { - "epoch": 0.3, - "learning_rate": 0.00025461179217746644, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.00027881802725378507, + "loss": 0.0277, "step": 27990 }, { - "epoch": 0.3, - "learning_rate": 0.0002545955763118635, - "loss": 0.0258, + "epoch": 0.14, + "learning_rate": 0.0002788104595607711, + "loss": 0.0278, "step": 28000 }, { - "epoch": 0.3, - "eval_cer": 0.9215990285544536, - "eval_loss": 0.01768692582845688, - "eval_runtime": 120.5374, - "eval_samples_per_second": 16.592, - "eval_steps_per_second": 4.148, + "epoch": 0.14, + "eval_cer": 0.9144489071884033, + "eval_loss": 0.019581960514187813, + "eval_runtime": 117.2391, + "eval_samples_per_second": 17.059, + "eval_steps_per_second": 4.265, "step": 28000 }, { - "epoch": 0.3, - "learning_rate": 0.00025457936044626057, - "loss": 0.0224, + "epoch": 0.14, + "learning_rate": 0.0002788028918677571, + "loss": 0.026, "step": 28010 }, { - "epoch": 0.3, - "learning_rate": 0.0002545631445806577, - "loss": 0.0234, + "epoch": 0.14, + "learning_rate": 0.00027879532417474307, + "loss": 0.0265, "step": 28020 }, { - "epoch": 0.3, - "learning_rate": 0.0002545469287150548, - "loss": 0.0229, + "epoch": 0.14, + "learning_rate": 0.00027878775648172905, + "loss": 0.0289, "step": 28030 }, { - "epoch": 0.3, - "learning_rate": 0.0002545307128494519, - "loss": 0.0302, + "epoch": 0.14, + "learning_rate": 0.00027878018878871503, + "loss": 0.0244, "step": 28040 }, { - "epoch": 0.3, - "learning_rate": 0.00025451449698384894, - "loss": 0.027, + "epoch": 0.14, + "learning_rate": 0.000278772621095701, + "loss": 0.026, "step": 28050 }, { - "epoch": 0.3, - "learning_rate": 0.00025449828111824606, - "loss": 0.0256, + "epoch": 0.14, + "learning_rate": 0.000278765053402687, + "loss": 0.0308, "step": 28060 }, { - "epoch": 0.3, - "learning_rate": 0.0002544820652526432, - "loss": 0.024, + "epoch": 0.14, + "learning_rate": 0.00027875748570967303, + "loss": 0.0273, "step": 28070 }, { - "epoch": 0.3, - "learning_rate": 0.00025446584938704025, - "loss": 0.0242, + "epoch": 0.14, + "learning_rate": 0.000278749918016659, + "loss": 0.0355, "step": 28080 }, { - "epoch": 0.3, - "learning_rate": 0.00025444963352143737, - "loss": 0.0275, + "epoch": 0.14, + "learning_rate": 0.000278742350323645, + "loss": 0.0232, "step": 28090 }, { - "epoch": 0.3, - "learning_rate": 0.00025443341765583443, - "loss": 0.0264, + "epoch": 0.14, + "learning_rate": 0.000278734782630631, + "loss": 0.0242, "step": 28100 }, { - "epoch": 0.3, - "learning_rate": 0.00025441720179023155, - "loss": 0.0206, + "epoch": 0.14, + "learning_rate": 0.00027872721493761696, + "loss": 0.024, "step": 28110 }, { - "epoch": 0.3, - "learning_rate": 0.0002544009859246286, - "loss": 0.0263, + "epoch": 0.14, + "learning_rate": 0.00027871964724460294, + "loss": 0.0248, "step": 28120 }, { - "epoch": 0.3, - "learning_rate": 0.00025438477005902574, - "loss": 0.0239, + "epoch": 0.14, + "learning_rate": 0.000278712079551589, + "loss": 0.0276, "step": 28130 }, { - "epoch": 0.3, - "learning_rate": 0.0002543685541934228, - "loss": 0.0221, + "epoch": 0.14, + "learning_rate": 0.00027870451185857495, + "loss": 0.0257, "step": 28140 }, { - "epoch": 0.3, - "learning_rate": 0.0002543523383278199, - "loss": 0.0245, + "epoch": 0.14, + "learning_rate": 0.00027869694416556094, + "loss": 0.0262, "step": 28150 }, { - "epoch": 0.3, - "learning_rate": 0.00025433612246221704, - "loss": 0.0232, + "epoch": 0.14, + "learning_rate": 0.0002786893764725469, + "loss": 0.0285, "step": 28160 }, { - "epoch": 0.3, - "learning_rate": 0.0002543199065966141, - "loss": 0.0194, + "epoch": 0.14, + "learning_rate": 0.0002786818087795329, + "loss": 0.0277, "step": 28170 }, { - "epoch": 0.3, - "learning_rate": 0.0002543036907310112, - "loss": 0.0218, + "epoch": 0.14, + "learning_rate": 0.0002786742410865189, + "loss": 0.0282, "step": 28180 }, { - "epoch": 0.3, - "learning_rate": 0.0002542874748654083, - "loss": 0.0199, + "epoch": 0.14, + "learning_rate": 0.0002786666733935049, + "loss": 0.0276, "step": 28190 }, { - "epoch": 0.3, - "learning_rate": 0.0002542712589998054, - "loss": 0.0292, + "epoch": 0.14, + "learning_rate": 0.0002786591057004909, + "loss": 0.0262, "step": 28200 }, { - "epoch": 0.3, - "learning_rate": 0.0002542550431342025, - "loss": 0.0257, + "epoch": 0.14, + "learning_rate": 0.0002786515380074769, + "loss": 0.0309, "step": 28210 }, { - "epoch": 0.31, - "learning_rate": 0.00025423882726859954, - "loss": 0.0268, + "epoch": 0.14, + "learning_rate": 0.00027864397031446286, + "loss": 0.027, "step": 28220 }, { - "epoch": 0.31, - "learning_rate": 0.00025422261140299666, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.00027863640262144884, + "loss": 0.028, "step": 28230 }, { - "epoch": 0.31, - "learning_rate": 0.0002542063955373938, - "loss": 0.022, + "epoch": 0.14, + "learning_rate": 0.0002786288349284348, + "loss": 0.0263, "step": 28240 }, { - "epoch": 0.31, - "learning_rate": 0.00025419017967179085, - "loss": 0.0302, + "epoch": 0.14, + "learning_rate": 0.0002786212672354208, + "loss": 0.0252, "step": 28250 }, { - "epoch": 0.31, - "learning_rate": 0.0002541739638061879, - "loss": 0.0251, + "epoch": 0.14, + "learning_rate": 0.00027861369954240684, + "loss": 0.0231, "step": 28260 }, { - "epoch": 0.31, - "learning_rate": 0.00025415774794058504, - "loss": 0.0253, + "epoch": 0.14, + "learning_rate": 0.0002786061318493928, + "loss": 0.0324, "step": 28270 }, { - "epoch": 0.31, - "learning_rate": 0.00025414153207498216, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.00027859856415637875, + "loss": 0.0271, "step": 28280 }, { - "epoch": 0.31, - "learning_rate": 0.0002541253162093793, - "loss": 0.0259, + "epoch": 0.14, + "learning_rate": 0.00027859099646336473, + "loss": 0.0323, "step": 28290 }, { - "epoch": 0.31, - "learning_rate": 0.00025410910034377634, - "loss": 0.0208, + "epoch": 0.14, + "learning_rate": 0.00027858342877035077, + "loss": 0.0298, "step": 28300 }, { - "epoch": 0.31, - "learning_rate": 0.0002540928844781734, - "loss": 0.0217, + "epoch": 0.14, + "learning_rate": 0.00027857586107733675, + "loss": 0.0259, "step": 28310 }, { - "epoch": 0.31, - "learning_rate": 0.0002540766686125705, - "loss": 0.0226, + "epoch": 0.14, + "learning_rate": 0.00027856829338432273, + "loss": 0.0275, "step": 28320 }, { - "epoch": 0.31, - "learning_rate": 0.00025406045274696765, - "loss": 0.0217, + "epoch": 0.14, + "learning_rate": 0.0002785607256913087, + "loss": 0.0289, "step": 28330 }, { - "epoch": 0.31, - "learning_rate": 0.0002540442368813647, - "loss": 0.0221, + "epoch": 0.14, + "learning_rate": 0.0002785531579982947, + "loss": 0.0295, "step": 28340 }, { - "epoch": 0.31, - "learning_rate": 0.0002540280210157618, - "loss": 0.0255, + "epoch": 0.14, + "learning_rate": 0.0002785455903052807, + "loss": 0.0278, "step": 28350 }, { - "epoch": 0.31, - "learning_rate": 0.0002540118051501589, - "loss": 0.0233, + "epoch": 0.14, + "learning_rate": 0.0002785380226122667, + "loss": 0.0243, "step": 28360 }, { - "epoch": 0.31, - "learning_rate": 0.000253995589284556, - "loss": 0.0213, + "epoch": 0.14, + "learning_rate": 0.0002785304549192527, + "loss": 0.0245, "step": 28370 }, { - "epoch": 0.31, - "learning_rate": 0.0002539793734189531, - "loss": 0.0238, + "epoch": 0.14, + "learning_rate": 0.00027852288722623867, + "loss": 0.0259, "step": 28380 }, { - "epoch": 0.31, - "learning_rate": 0.00025396315755335015, - "loss": 0.0194, + "epoch": 0.14, + "learning_rate": 0.00027851531953322465, + "loss": 0.0271, "step": 28390 }, { - "epoch": 0.31, - "learning_rate": 0.00025394694168774727, - "loss": 0.024, + "epoch": 0.14, + "learning_rate": 0.00027850775184021064, + "loss": 0.0339, "step": 28400 }, { - "epoch": 0.31, - "learning_rate": 0.0002539307258221444, - "loss": 0.0213, + "epoch": 0.14, + "learning_rate": 0.0002785001841471966, + "loss": 0.0302, "step": 28410 }, { - "epoch": 0.31, - "learning_rate": 0.00025391450995654145, - "loss": 0.0203, + "epoch": 0.14, + "learning_rate": 0.00027849261645418265, + "loss": 0.0254, "step": 28420 }, { - "epoch": 0.31, - "learning_rate": 0.0002538982940909386, - "loss": 0.0223, + "epoch": 0.14, + "learning_rate": 0.00027848504876116863, + "loss": 0.0304, "step": 28430 }, { - "epoch": 0.31, - "learning_rate": 0.00025388207822533564, - "loss": 0.019, + "epoch": 0.14, + "learning_rate": 0.0002784774810681546, + "loss": 0.0308, "step": 28440 }, { - "epoch": 0.31, - "learning_rate": 0.00025386586235973276, - "loss": 0.0208, + "epoch": 0.14, + "learning_rate": 0.0002784699133751406, + "loss": 0.0263, "step": 28450 }, { - "epoch": 0.31, - "learning_rate": 0.0002538496464941298, - "loss": 0.0228, + "epoch": 0.14, + "learning_rate": 0.0002784623456821266, + "loss": 0.0257, "step": 28460 }, { - "epoch": 0.31, - "learning_rate": 0.00025383343062852694, - "loss": 0.0227, + "epoch": 0.14, + "learning_rate": 0.00027845477798911256, + "loss": 0.0271, "step": 28470 }, { - "epoch": 0.31, - "learning_rate": 0.000253817214762924, - "loss": 0.0239, + "epoch": 0.14, + "learning_rate": 0.00027844721029609854, + "loss": 0.0242, "step": 28480 }, { - "epoch": 0.31, - "learning_rate": 0.00025380099889732113, - "loss": 0.0243, + "epoch": 0.14, + "learning_rate": 0.0002784396426030846, + "loss": 0.0299, "step": 28490 }, { - "epoch": 0.31, - "learning_rate": 0.0002537847830317182, - "loss": 0.0226, + "epoch": 0.14, + "learning_rate": 0.00027843207491007056, + "loss": 0.0269, "step": 28500 }, { - "epoch": 0.31, - "learning_rate": 0.0002537685671661153, - "loss": 0.0222, + "epoch": 0.14, + "learning_rate": 0.00027842450721705654, + "loss": 0.0218, "step": 28510 }, { - "epoch": 0.31, - "learning_rate": 0.0002537523513005124, - "loss": 0.021, + "epoch": 0.14, + "learning_rate": 0.0002784169395240425, + "loss": 0.0264, "step": 28520 }, { - "epoch": 0.31, - "learning_rate": 0.0002537361354349095, - "loss": 0.0228, + "epoch": 0.14, + "learning_rate": 0.0002784093718310285, + "loss": 0.0277, "step": 28530 }, { - "epoch": 0.31, - "learning_rate": 0.00025371991956930657, - "loss": 0.0229, + "epoch": 0.14, + "learning_rate": 0.0002784018041380145, + "loss": 0.022, "step": 28540 }, { - "epoch": 0.31, - "learning_rate": 0.0002537037037037037, - "loss": 0.0253, + "epoch": 0.14, + "learning_rate": 0.0002783942364450005, + "loss": 0.0259, "step": 28550 }, { - "epoch": 0.31, - "learning_rate": 0.00025368748783810075, - "loss": 0.0227, + "epoch": 0.14, + "learning_rate": 0.0002783866687519865, + "loss": 0.0247, "step": 28560 }, { - "epoch": 0.31, - "learning_rate": 0.00025367127197249787, - "loss": 0.025, + "epoch": 0.14, + "learning_rate": 0.0002783791010589725, + "loss": 0.0326, "step": 28570 }, { - "epoch": 0.31, - "learning_rate": 0.00025365505610689494, - "loss": 0.0224, + "epoch": 0.14, + "learning_rate": 0.00027837153336595846, + "loss": 0.0264, "step": 28580 }, { - "epoch": 0.31, - "learning_rate": 0.00025363884024129206, - "loss": 0.0257, + "epoch": 0.14, + "learning_rate": 0.00027836396567294445, + "loss": 0.0302, "step": 28590 }, { - "epoch": 0.31, - "learning_rate": 0.0002536226243756892, - "loss": 0.0244, + "epoch": 0.14, + "learning_rate": 0.0002783563979799304, + "loss": 0.0238, "step": 28600 }, { - "epoch": 0.31, - "learning_rate": 0.00025360640851008624, - "loss": 0.0219, + "epoch": 0.14, + "learning_rate": 0.00027834883028691646, + "loss": 0.0248, "step": 28610 }, { - "epoch": 0.31, - "learning_rate": 0.0002535901926444833, - "loss": 0.0239, + "epoch": 0.14, + "learning_rate": 0.00027834126259390244, + "loss": 0.0241, "step": 28620 }, { - "epoch": 0.31, - "learning_rate": 0.00025357397677888043, - "loss": 0.022, + "epoch": 0.14, + "learning_rate": 0.0002783336949008884, + "loss": 0.0256, "step": 28630 }, { - "epoch": 0.31, - "learning_rate": 0.00025355776091327755, - "loss": 0.0272, + "epoch": 0.14, + "learning_rate": 0.0002783261272078744, + "loss": 0.0241, "step": 28640 }, { - "epoch": 0.31, - "learning_rate": 0.0002535415450476746, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.0002783185595148604, + "loss": 0.0243, "step": 28650 }, { - "epoch": 0.31, - "learning_rate": 0.0002535253291820717, - "loss": 0.0249, + "epoch": 0.14, + "learning_rate": 0.00027831099182184637, + "loss": 0.0278, "step": 28660 }, { - "epoch": 0.31, - "learning_rate": 0.0002535091133164688, - "loss": 0.0235, + "epoch": 0.14, + "learning_rate": 0.00027830342412883235, + "loss": 0.0215, "step": 28670 }, { - "epoch": 0.31, - "learning_rate": 0.0002534928974508659, - "loss": 0.023, + "epoch": 0.14, + "learning_rate": 0.0002782958564358184, + "loss": 0.0272, "step": 28680 }, { - "epoch": 0.31, - "learning_rate": 0.000253476681585263, - "loss": 0.0306, + "epoch": 0.14, + "learning_rate": 0.00027828828874280437, + "loss": 0.0275, "step": 28690 }, { - "epoch": 0.31, - "learning_rate": 0.00025346046571966005, - "loss": 0.0278, + "epoch": 0.14, + "learning_rate": 0.00027828072104979035, + "loss": 0.0244, "step": 28700 }, { - "epoch": 0.31, - "learning_rate": 0.00025344424985405717, - "loss": 0.0238, + "epoch": 0.14, + "learning_rate": 0.00027827315335677633, + "loss": 0.0249, "step": 28710 }, { - "epoch": 0.31, - "learning_rate": 0.0002534280339884543, - "loss": 0.026, + "epoch": 0.14, + "learning_rate": 0.0002782655856637623, + "loss": 0.0267, "step": 28720 }, { - "epoch": 0.31, - "learning_rate": 0.0002534118181228514, - "loss": 0.0243, + "epoch": 0.14, + "learning_rate": 0.0002782580179707483, + "loss": 0.0328, "step": 28730 }, { - "epoch": 0.31, - "learning_rate": 0.0002533956022572485, - "loss": 0.0237, + "epoch": 0.14, + "learning_rate": 0.00027825045027773433, + "loss": 0.0308, "step": 28740 }, { - "epoch": 0.31, - "learning_rate": 0.00025337938639164554, - "loss": 0.029, + "epoch": 0.15, + "learning_rate": 0.0002782428825847203, + "loss": 0.0261, "step": 28750 }, { - "epoch": 0.31, - "learning_rate": 0.00025336317052604266, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.0002782353148917063, + "loss": 0.0326, "step": 28760 }, { - "epoch": 0.31, - "learning_rate": 0.0002533469546604398, - "loss": 0.0276, + "epoch": 0.15, + "learning_rate": 0.0002782277471986923, + "loss": 0.0281, "step": 28770 }, { - "epoch": 0.31, - "learning_rate": 0.00025333073879483685, - "loss": 0.0289, + "epoch": 0.15, + "learning_rate": 0.00027822017950567826, + "loss": 0.0258, "step": 28780 }, { - "epoch": 0.31, - "learning_rate": 0.0002533145229292339, - "loss": 0.0208, + "epoch": 0.15, + "learning_rate": 0.00027821261181266424, + "loss": 0.0279, "step": 28790 }, { - "epoch": 0.31, - "learning_rate": 0.00025329830706363103, - "loss": 0.0228, + "epoch": 0.15, + "learning_rate": 0.0002782050441196502, + "loss": 0.0553, "step": 28800 }, { - "epoch": 0.31, - "learning_rate": 0.00025328209119802815, - "loss": 0.0253, + "epoch": 0.15, + "learning_rate": 0.00027819747642663625, + "loss": 0.0291, "step": 28810 }, { - "epoch": 0.31, - "learning_rate": 0.0002532658753324252, - "loss": 0.02, + "epoch": 0.15, + "learning_rate": 0.00027818990873362224, + "loss": 0.0254, "step": 28820 }, { - "epoch": 0.31, - "learning_rate": 0.0002532496594668223, - "loss": 0.0223, + "epoch": 0.15, + "learning_rate": 0.0002781823410406082, + "loss": 0.0298, "step": 28830 }, { - "epoch": 0.31, - "learning_rate": 0.0002532334436012194, - "loss": 0.0265, + "epoch": 0.15, + "learning_rate": 0.0002781747733475942, + "loss": 0.0266, "step": 28840 }, { - "epoch": 0.31, - "learning_rate": 0.0002532172277356165, - "loss": 0.0283, + "epoch": 0.15, + "learning_rate": 0.0002781672056545802, + "loss": 0.025, "step": 28850 }, { - "epoch": 0.31, - "learning_rate": 0.0002532010118700136, - "loss": 0.0247, + "epoch": 0.15, + "learning_rate": 0.00027815963796156616, + "loss": 0.0223, "step": 28860 }, { - "epoch": 0.31, - "learning_rate": 0.0002531847960044107, - "loss": 0.0241, + "epoch": 0.15, + "learning_rate": 0.0002781520702685522, + "loss": 0.0274, "step": 28870 }, { - "epoch": 0.31, - "learning_rate": 0.0002531685801388078, - "loss": 0.024, + "epoch": 0.15, + "learning_rate": 0.0002781445025755382, + "loss": 0.0294, "step": 28880 }, { - "epoch": 0.31, - "learning_rate": 0.0002531523642732049, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.00027813693488252416, + "loss": 0.021, "step": 28890 }, { - "epoch": 0.31, - "learning_rate": 0.000253136148407602, - "loss": 0.0226, + "epoch": 0.15, + "learning_rate": 0.00027812936718951014, + "loss": 0.0343, "step": 28900 }, { - "epoch": 0.31, - "learning_rate": 0.0002531199325419991, - "loss": 0.0231, + "epoch": 0.15, + "learning_rate": 0.0002781217994964961, + "loss": 0.0349, "step": 28910 }, { - "epoch": 0.31, - "learning_rate": 0.00025310371667639615, - "loss": 0.0211, + "epoch": 0.15, + "learning_rate": 0.0002781142318034821, + "loss": 0.028, "step": 28920 }, { - "epoch": 0.31, - "learning_rate": 0.00025308750081079326, - "loss": 0.0226, + "epoch": 0.15, + "learning_rate": 0.00027810666411046814, + "loss": 0.0245, "step": 28930 }, { - "epoch": 0.31, - "learning_rate": 0.0002530712849451904, - "loss": 0.0237, + "epoch": 0.15, + "learning_rate": 0.0002780990964174541, + "loss": 0.0247, "step": 28940 }, { - "epoch": 0.31, - "learning_rate": 0.00025305506907958745, - "loss": 0.0249, + "epoch": 0.15, + "learning_rate": 0.0002780915287244401, + "loss": 0.0269, "step": 28950 }, { - "epoch": 0.31, - "learning_rate": 0.0002530388532139845, - "loss": 0.0279, + "epoch": 0.15, + "learning_rate": 0.0002780839610314261, + "loss": 0.0236, "step": 28960 }, { - "epoch": 0.31, - "learning_rate": 0.00025302263734838164, - "loss": 0.0246, + "epoch": 0.15, + "learning_rate": 0.00027807639333841207, + "loss": 0.0265, "step": 28970 }, { - "epoch": 0.31, - "learning_rate": 0.00025300642148277876, - "loss": 0.0193, + "epoch": 0.15, + "learning_rate": 0.00027806882564539805, + "loss": 0.0263, "step": 28980 }, { - "epoch": 0.31, - "learning_rate": 0.0002529902056171758, - "loss": 0.0246, + "epoch": 0.15, + "learning_rate": 0.00027806125795238403, + "loss": 0.0232, "step": 28990 }, { - "epoch": 0.31, - "learning_rate": 0.0002529739897515729, - "loss": 0.0235, + "epoch": 0.15, + "learning_rate": 0.00027805369025937006, + "loss": 0.0245, "step": 29000 }, { - "epoch": 0.31, - "eval_cer": 0.9215694960539368, - "eval_loss": 0.01686452515423298, - "eval_runtime": 121.6905, - "eval_samples_per_second": 16.435, - "eval_steps_per_second": 4.109, + "epoch": 0.15, + "eval_cer": 0.914481900656667, + "eval_loss": 0.019330712035298347, + "eval_runtime": 117.3753, + "eval_samples_per_second": 17.039, + "eval_steps_per_second": 4.26, "step": 29000 }, { - "epoch": 0.31, - "learning_rate": 0.00025295777388597, - "loss": 0.0236, + "epoch": 0.15, + "learning_rate": 0.00027804612256635605, + "loss": 0.0274, "step": 29010 }, { - "epoch": 0.31, - "learning_rate": 0.0002529415580203671, - "loss": 0.0204, + "epoch": 0.15, + "learning_rate": 0.000278038554873342, + "loss": 0.0276, "step": 29020 }, { - "epoch": 0.31, - "learning_rate": 0.0002529253421547642, - "loss": 0.024, + "epoch": 0.15, + "learning_rate": 0.000278030987180328, + "loss": 0.0246, "step": 29030 }, { - "epoch": 0.31, - "learning_rate": 0.0002529091262891613, - "loss": 0.0247, + "epoch": 0.15, + "learning_rate": 0.000278023419487314, + "loss": 0.0309, "step": 29040 }, { - "epoch": 0.31, - "learning_rate": 0.0002528929104235584, - "loss": 0.0236, + "epoch": 0.15, + "learning_rate": 0.00027801585179429997, + "loss": 0.0265, "step": 29050 }, { - "epoch": 0.31, - "learning_rate": 0.0002528766945579555, - "loss": 0.0209, + "epoch": 0.15, + "learning_rate": 0.000278008284101286, + "loss": 0.0284, "step": 29060 }, { - "epoch": 0.31, - "learning_rate": 0.00025286047869235256, - "loss": 0.023, + "epoch": 0.15, + "learning_rate": 0.000278000716408272, + "loss": 0.0239, "step": 29070 }, { - "epoch": 0.31, - "learning_rate": 0.0002528442628267497, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.00027799314871525797, + "loss": 0.0235, "step": 29080 }, { - "epoch": 0.31, - "learning_rate": 0.00025282804696114675, - "loss": 0.0197, + "epoch": 0.15, + "learning_rate": 0.00027798558102224395, + "loss": 0.0256, "step": 29090 }, { - "epoch": 0.31, - "learning_rate": 0.00025281183109554387, - "loss": 0.0234, + "epoch": 0.15, + "learning_rate": 0.00027797801332922993, + "loss": 0.0255, "step": 29100 }, { - "epoch": 0.31, - "learning_rate": 0.00025279561522994093, - "loss": 0.0227, + "epoch": 0.15, + "learning_rate": 0.0002779704456362159, + "loss": 0.0223, "step": 29110 }, { - "epoch": 0.31, - "learning_rate": 0.00025277939936433805, - "loss": 0.0204, + "epoch": 0.15, + "learning_rate": 0.00027796287794320195, + "loss": 0.025, "step": 29120 }, { - "epoch": 0.31, - "learning_rate": 0.0002527631834987351, - "loss": 0.024, + "epoch": 0.15, + "learning_rate": 0.00027795531025018793, + "loss": 0.027, "step": 29130 }, { - "epoch": 0.32, - "learning_rate": 0.00025274696763313224, - "loss": 0.0214, + "epoch": 0.15, + "learning_rate": 0.0002779477425571739, + "loss": 0.0279, "step": 29140 }, { - "epoch": 0.32, - "learning_rate": 0.0002527307517675293, - "loss": 0.0235, + "epoch": 0.15, + "learning_rate": 0.0002779401748641599, + "loss": 0.0236, "step": 29150 }, { - "epoch": 0.32, - "learning_rate": 0.0002527145359019264, - "loss": 0.0208, + "epoch": 0.15, + "learning_rate": 0.0002779326071711459, + "loss": 0.0221, "step": 29160 }, { - "epoch": 0.32, - "learning_rate": 0.00025269832003632355, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.00027792503947813186, + "loss": 0.0285, "step": 29170 }, { - "epoch": 0.32, - "learning_rate": 0.0002526821041707206, - "loss": 0.0262, + "epoch": 0.15, + "learning_rate": 0.00027791747178511784, + "loss": 0.0282, "step": 29180 }, { - "epoch": 0.32, - "learning_rate": 0.0002526658883051177, - "loss": 0.0243, + "epoch": 0.15, + "learning_rate": 0.0002779099040921039, + "loss": 0.0262, "step": 29190 }, { - "epoch": 0.32, - "learning_rate": 0.0002526496724395148, - "loss": 0.021, + "epoch": 0.15, + "learning_rate": 0.00027790233639908986, + "loss": 0.0262, "step": 29200 }, { - "epoch": 0.32, - "learning_rate": 0.0002526334565739119, - "loss": 0.0209, + "epoch": 0.15, + "learning_rate": 0.00027789476870607584, + "loss": 0.0211, "step": 29210 }, { - "epoch": 0.32, - "learning_rate": 0.000252617240708309, - "loss": 0.0252, + "epoch": 0.15, + "learning_rate": 0.0002778872010130618, + "loss": 0.0244, "step": 29220 }, { - "epoch": 0.32, - "learning_rate": 0.00025260102484270605, - "loss": 0.0231, + "epoch": 0.15, + "learning_rate": 0.0002778796333200478, + "loss": 0.0257, "step": 29230 }, { - "epoch": 0.32, - "learning_rate": 0.00025258480897710317, - "loss": 0.0228, + "epoch": 0.15, + "learning_rate": 0.0002778720656270338, + "loss": 0.0246, "step": 29240 }, { - "epoch": 0.32, - "learning_rate": 0.0002525685931115003, - "loss": 0.0241, + "epoch": 0.15, + "learning_rate": 0.0002778644979340198, + "loss": 0.026, "step": 29250 }, { - "epoch": 0.32, - "learning_rate": 0.00025255237724589735, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.0002778569302410058, + "loss": 0.0239, "step": 29260 }, { - "epoch": 0.32, - "learning_rate": 0.0002525361613802944, - "loss": 0.0234, + "epoch": 0.15, + "learning_rate": 0.0002778493625479918, + "loss": 0.0322, "step": 29270 }, { - "epoch": 0.32, - "learning_rate": 0.00025251994551469154, - "loss": 0.022, + "epoch": 0.15, + "learning_rate": 0.00027784179485497776, + "loss": 0.0275, "step": 29280 }, { - "epoch": 0.32, - "learning_rate": 0.00025250372964908866, - "loss": 0.0234, + "epoch": 0.15, + "learning_rate": 0.00027783422716196374, + "loss": 0.038, "step": 29290 }, { - "epoch": 0.32, - "learning_rate": 0.0002524875137834858, - "loss": 0.0225, + "epoch": 0.15, + "learning_rate": 0.0002778266594689497, + "loss": 0.0285, "step": 29300 }, { - "epoch": 0.32, - "learning_rate": 0.00025247129791788284, - "loss": 0.0217, + "epoch": 0.15, + "learning_rate": 0.0002778190917759357, + "loss": 0.0286, "step": 29310 }, { - "epoch": 0.32, - "learning_rate": 0.0002524550820522799, - "loss": 0.0253, + "epoch": 0.15, + "learning_rate": 0.00027781152408292174, + "loss": 0.0296, "step": 29320 }, { - "epoch": 0.32, - "learning_rate": 0.00025243886618667703, - "loss": 0.0198, + "epoch": 0.15, + "learning_rate": 0.0002778039563899077, + "loss": 0.0242, "step": 29330 }, { - "epoch": 0.32, - "learning_rate": 0.00025242265032107415, - "loss": 0.0283, + "epoch": 0.15, + "learning_rate": 0.0002777963886968937, + "loss": 0.0275, "step": 29340 }, { - "epoch": 0.32, - "learning_rate": 0.0002524064344554712, - "loss": 0.0262, + "epoch": 0.15, + "learning_rate": 0.0002777888210038797, + "loss": 0.0258, "step": 29350 }, { - "epoch": 0.32, - "learning_rate": 0.0002523902185898683, - "loss": 0.0259, + "epoch": 0.15, + "learning_rate": 0.00027778125331086567, + "loss": 0.025, "step": 29360 }, { - "epoch": 0.32, - "learning_rate": 0.0002523740027242654, - "loss": 0.0261, + "epoch": 0.15, + "learning_rate": 0.00027777368561785165, + "loss": 0.0303, "step": 29370 }, { - "epoch": 0.32, - "learning_rate": 0.0002523577868586625, - "loss": 0.0219, + "epoch": 0.15, + "learning_rate": 0.0002777661179248377, + "loss": 0.0265, "step": 29380 }, { - "epoch": 0.32, - "learning_rate": 0.0002523415709930596, - "loss": 0.0257, + "epoch": 0.15, + "learning_rate": 0.00027775855023182367, + "loss": 0.0271, "step": 29390 }, { - "epoch": 0.32, - "learning_rate": 0.00025232535512745665, - "loss": 0.0225, + "epoch": 0.15, + "learning_rate": 0.00027775098253880965, + "loss": 0.0256, "step": 29400 }, { - "epoch": 0.32, - "learning_rate": 0.00025230913926185377, - "loss": 0.0264, + "epoch": 0.15, + "learning_rate": 0.00027774341484579563, + "loss": 0.0277, "step": 29410 }, { - "epoch": 0.32, - "learning_rate": 0.0002522929233962509, - "loss": 0.0252, + "epoch": 0.15, + "learning_rate": 0.0002777358471527816, + "loss": 0.023, "step": 29420 }, { - "epoch": 0.32, - "learning_rate": 0.00025227670753064796, - "loss": 0.0259, + "epoch": 0.15, + "learning_rate": 0.0002777282794597676, + "loss": 0.0252, "step": 29430 }, { - "epoch": 0.32, - "learning_rate": 0.0002522604916650451, - "loss": 0.0263, + "epoch": 0.15, + "learning_rate": 0.0002777207117667536, + "loss": 0.027, "step": 29440 }, { - "epoch": 0.32, - "learning_rate": 0.00025224427579944214, - "loss": 0.0268, + "epoch": 0.15, + "learning_rate": 0.0002777131440737396, + "loss": 0.027, "step": 29450 }, { - "epoch": 0.32, - "learning_rate": 0.00025222805993383926, - "loss": 0.0236, + "epoch": 0.15, + "learning_rate": 0.0002777055763807256, + "loss": 0.0269, "step": 29460 }, { - "epoch": 0.32, - "learning_rate": 0.00025221184406823633, - "loss": 0.0212, + "epoch": 0.15, + "learning_rate": 0.00027769800868771157, + "loss": 0.0234, "step": 29470 }, { - "epoch": 0.32, - "learning_rate": 0.00025219562820263345, - "loss": 0.0223, + "epoch": 0.15, + "learning_rate": 0.00027769044099469755, + "loss": 0.0261, "step": 29480 }, { - "epoch": 0.32, - "learning_rate": 0.0002521794123370305, - "loss": 0.0262, + "epoch": 0.15, + "learning_rate": 0.00027768287330168353, + "loss": 0.026, "step": 29490 }, { - "epoch": 0.32, - "learning_rate": 0.00025216319647142763, - "loss": 0.0242, + "epoch": 0.15, + "learning_rate": 0.0002776753056086695, + "loss": 0.0213, "step": 29500 }, { - "epoch": 0.32, - "learning_rate": 0.00025214698060582475, - "loss": 0.0245, + "epoch": 0.15, + "learning_rate": 0.00027766773791565555, + "loss": 0.0267, "step": 29510 }, { - "epoch": 0.32, - "learning_rate": 0.0002521307647402218, - "loss": 0.0253, + "epoch": 0.15, + "learning_rate": 0.00027766017022264153, + "loss": 0.0263, "step": 29520 }, { - "epoch": 0.32, - "learning_rate": 0.0002521145488746189, - "loss": 0.0236, + "epoch": 0.15, + "learning_rate": 0.0002776526025296275, + "loss": 0.026, "step": 29530 }, { - "epoch": 0.32, - "learning_rate": 0.000252098333009016, - "loss": 0.0266, + "epoch": 0.15, + "learning_rate": 0.00027764503483661344, + "loss": 0.0273, "step": 29540 }, { - "epoch": 0.32, - "learning_rate": 0.0002520821171434131, - "loss": 0.0239, + "epoch": 0.15, + "learning_rate": 0.0002776374671435995, + "loss": 0.0258, "step": 29550 }, { - "epoch": 0.32, - "learning_rate": 0.0002520659012778102, - "loss": 0.02, + "epoch": 0.15, + "learning_rate": 0.00027762989945058546, + "loss": 0.0249, "step": 29560 }, { - "epoch": 0.32, - "learning_rate": 0.00025204968541220725, - "loss": 0.0233, + "epoch": 0.15, + "learning_rate": 0.00027762233175757144, + "loss": 0.0302, "step": 29570 }, { - "epoch": 0.32, - "learning_rate": 0.0002520334695466044, - "loss": 0.0213, + "epoch": 0.15, + "learning_rate": 0.0002776147640645574, + "loss": 0.034, "step": 29580 }, { - "epoch": 0.32, - "learning_rate": 0.0002520172536810015, - "loss": 0.021, + "epoch": 0.15, + "learning_rate": 0.0002776071963715434, + "loss": 0.0244, "step": 29590 }, { - "epoch": 0.32, - "learning_rate": 0.00025200103781539856, - "loss": 0.0247, + "epoch": 0.15, + "learning_rate": 0.0002775996286785294, + "loss": 0.0234, "step": 29600 }, { - "epoch": 0.32, - "learning_rate": 0.0002519848219497957, - "loss": 0.0248, + "epoch": 0.15, + "learning_rate": 0.0002775920609855154, + "loss": 0.0261, "step": 29610 }, { - "epoch": 0.32, - "learning_rate": 0.00025196860608419275, - "loss": 0.0241, + "epoch": 0.15, + "learning_rate": 0.0002775844932925014, + "loss": 0.0279, "step": 29620 }, { - "epoch": 0.32, - "learning_rate": 0.00025195239021858987, - "loss": 0.0205, + "epoch": 0.15, + "learning_rate": 0.0002775769255994874, + "loss": 0.0277, "step": 29630 }, { - "epoch": 0.32, - "learning_rate": 0.00025193617435298693, - "loss": 0.0197, + "epoch": 0.15, + "learning_rate": 0.00027756935790647336, + "loss": 0.0304, "step": 29640 }, { - "epoch": 0.32, - "learning_rate": 0.00025191995848738405, - "loss": 0.0233, + "epoch": 0.15, + "learning_rate": 0.00027756179021345935, + "loss": 0.0272, "step": 29650 }, { - "epoch": 0.32, - "learning_rate": 0.0002519037426217811, - "loss": 0.0241, + "epoch": 0.15, + "learning_rate": 0.0002775542225204453, + "loss": 0.0267, "step": 29660 }, { - "epoch": 0.32, - "learning_rate": 0.00025188752675617824, - "loss": 0.0192, + "epoch": 0.15, + "learning_rate": 0.00027754665482743136, + "loss": 0.0304, "step": 29670 }, { - "epoch": 0.32, - "learning_rate": 0.0002518713108905753, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.00027753908713441734, + "loss": 0.024, "step": 29680 }, { - "epoch": 0.32, - "learning_rate": 0.0002518550950249724, - "loss": 0.0285, + "epoch": 0.15, + "learning_rate": 0.0002775315194414033, + "loss": 0.0297, "step": 29690 }, { - "epoch": 0.32, - "learning_rate": 0.0002518388791593695, - "loss": 0.023, + "epoch": 0.15, + "learning_rate": 0.0002775239517483893, + "loss": 0.0217, "step": 29700 }, { - "epoch": 0.32, - "learning_rate": 0.0002518226632937666, - "loss": 0.0237, + "epoch": 0.15, + "learning_rate": 0.0002775163840553753, + "loss": 0.0248, "step": 29710 }, { - "epoch": 0.32, - "learning_rate": 0.0002518064474281637, - "loss": 0.0265, + "epoch": 0.15, + "learning_rate": 0.00027750881636236127, + "loss": 0.0237, "step": 29720 }, { - "epoch": 0.32, - "learning_rate": 0.0002517902315625608, - "loss": 0.0227, + "epoch": 0.15, + "learning_rate": 0.00027750124866934725, + "loss": 0.0281, "step": 29730 }, { - "epoch": 0.32, - "learning_rate": 0.0002517740156969579, - "loss": 0.0285, + "epoch": 0.15, + "learning_rate": 0.0002774936809763333, + "loss": 0.0284, "step": 29740 }, { - "epoch": 0.32, - "learning_rate": 0.000251757799831355, - "loss": 0.0209, + "epoch": 0.15, + "learning_rate": 0.00027748611328331927, + "loss": 0.0239, "step": 29750 }, { - "epoch": 0.32, - "learning_rate": 0.00025174158396575204, - "loss": 0.022, + "epoch": 0.15, + "learning_rate": 0.00027747854559030525, + "loss": 0.0253, "step": 29760 }, { - "epoch": 0.32, - "learning_rate": 0.00025172536810014916, - "loss": 0.0222, + "epoch": 0.15, + "learning_rate": 0.00027747097789729123, + "loss": 0.026, "step": 29770 }, { - "epoch": 0.32, - "learning_rate": 0.0002517091522345463, - "loss": 0.0248, + "epoch": 0.15, + "learning_rate": 0.0002774634102042772, + "loss": 0.0258, "step": 29780 }, { - "epoch": 0.32, - "learning_rate": 0.00025169293636894335, - "loss": 0.0295, + "epoch": 0.15, + "learning_rate": 0.0002774558425112632, + "loss": 0.0239, "step": 29790 }, { - "epoch": 0.32, - "learning_rate": 0.0002516767205033404, - "loss": 0.0279, + "epoch": 0.15, + "learning_rate": 0.00027744827481824923, + "loss": 0.0196, "step": 29800 }, { - "epoch": 0.32, - "learning_rate": 0.00025166050463773753, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.0002774407071252352, + "loss": 0.0255, "step": 29810 }, { - "epoch": 0.32, - "learning_rate": 0.00025164428877213465, - "loss": 0.0222, + "epoch": 0.15, + "learning_rate": 0.0002774331394322212, + "loss": 0.0267, "step": 29820 }, { - "epoch": 0.32, - "learning_rate": 0.0002516280729065317, - "loss": 0.0251, + "epoch": 0.15, + "learning_rate": 0.0002774255717392072, + "loss": 0.0261, "step": 29830 }, { - "epoch": 0.32, - "learning_rate": 0.0002516118570409288, - "loss": 0.0237, + "epoch": 0.15, + "learning_rate": 0.00027741800404619316, + "loss": 0.0263, "step": 29840 }, { - "epoch": 0.32, - "learning_rate": 0.0002515956411753259, - "loss": 0.0264, + "epoch": 0.15, + "learning_rate": 0.00027741043635317914, + "loss": 0.0293, "step": 29850 }, { - "epoch": 0.32, - "learning_rate": 0.000251579425309723, - "loss": 0.0267, + "epoch": 0.15, + "learning_rate": 0.0002774028686601651, + "loss": 0.0241, "step": 29860 }, { - "epoch": 0.32, - "learning_rate": 0.0002515632094441201, - "loss": 0.0249, + "epoch": 0.15, + "learning_rate": 0.00027739530096715115, + "loss": 0.0231, "step": 29870 }, { - "epoch": 0.32, - "learning_rate": 0.0002515469935785172, - "loss": 0.0235, + "epoch": 0.15, + "learning_rate": 0.00027738773327413714, + "loss": 0.0228, "step": 29880 }, { - "epoch": 0.32, - "learning_rate": 0.0002515307777129143, - "loss": 0.0236, + "epoch": 0.15, + "learning_rate": 0.0002773801655811231, + "loss": 0.026, "step": 29890 }, { - "epoch": 0.32, - "learning_rate": 0.0002515145618473114, - "loss": 0.0239, + "epoch": 0.15, + "learning_rate": 0.0002773725978881091, + "loss": 0.027, "step": 29900 }, { - "epoch": 0.32, - "learning_rate": 0.0002514983459817085, - "loss": 0.023, + "epoch": 0.15, + "learning_rate": 0.0002773650301950951, + "loss": 0.0249, "step": 29910 }, { - "epoch": 0.32, - "learning_rate": 0.0002514821301161056, - "loss": 0.0282, + "epoch": 0.15, + "learning_rate": 0.00027735746250208106, + "loss": 0.0291, "step": 29920 }, { - "epoch": 0.32, - "learning_rate": 0.00025146591425050265, - "loss": 0.0281, + "epoch": 0.15, + "learning_rate": 0.0002773498948090671, + "loss": 0.0242, "step": 29930 }, { - "epoch": 0.32, - "learning_rate": 0.00025144969838489977, - "loss": 0.0252, + "epoch": 0.15, + "learning_rate": 0.0002773423271160531, + "loss": 0.0272, "step": 29940 }, { - "epoch": 0.32, - "learning_rate": 0.0002514334825192969, - "loss": 0.0278, + "epoch": 0.15, + "learning_rate": 0.00027733475942303906, + "loss": 0.0286, "step": 29950 }, { - "epoch": 0.32, - "learning_rate": 0.00025141726665369395, - "loss": 0.0237, + "epoch": 0.15, + "learning_rate": 0.00027732719173002504, + "loss": 0.0244, "step": 29960 }, { - "epoch": 0.32, - "learning_rate": 0.000251401050788091, - "loss": 0.0241, + "epoch": 0.15, + "learning_rate": 0.000277319624037011, + "loss": 0.0281, "step": 29970 }, { - "epoch": 0.32, - "learning_rate": 0.00025138483492248814, - "loss": 0.0267, + "epoch": 0.15, + "learning_rate": 0.000277312056343997, + "loss": 0.0295, "step": 29980 }, { - "epoch": 0.32, - "learning_rate": 0.00025136861905688526, - "loss": 0.0225, + "epoch": 0.15, + "learning_rate": 0.00027730448865098304, + "loss": 0.0313, "step": 29990 }, { - "epoch": 0.32, - "learning_rate": 0.0002513524031912823, - "loss": 0.0235, + "epoch": 0.15, + "learning_rate": 0.000277296920957969, + "loss": 0.0226, "step": 30000 }, { - "epoch": 0.32, - "eval_cer": 0.921567758848024, - "eval_loss": 0.017599964514374733, - "eval_runtime": 121.9748, - "eval_samples_per_second": 16.397, - "eval_steps_per_second": 4.099, + "epoch": 0.15, + "eval_cer": 0.9144518183767796, + "eval_loss": 0.019204232841730118, + "eval_runtime": 117.3422, + "eval_samples_per_second": 17.044, + "eval_steps_per_second": 4.261, "step": 30000 }, { - "epoch": 0.32, - "learning_rate": 0.0002513361873256794, - "loss": 0.0246, + "epoch": 0.15, + "learning_rate": 0.000277289353264955, + "loss": 0.0214, "step": 30010 }, { - "epoch": 0.32, - "learning_rate": 0.0002513199714600765, - "loss": 0.0224, + "epoch": 0.15, + "learning_rate": 0.000277281785571941, + "loss": 0.0318, "step": 30020 }, { - "epoch": 0.32, - "learning_rate": 0.00025130375559447363, - "loss": 0.02, + "epoch": 0.15, + "learning_rate": 0.00027727421787892697, + "loss": 0.0273, "step": 30030 }, { - "epoch": 0.32, - "learning_rate": 0.0002512875397288707, - "loss": 0.0216, + "epoch": 0.15, + "learning_rate": 0.00027726665018591295, + "loss": 0.025, "step": 30040 }, { - "epoch": 0.32, - "learning_rate": 0.0002512713238632678, - "loss": 0.0285, + "epoch": 0.15, + "learning_rate": 0.00027725908249289893, + "loss": 0.0252, "step": 30050 }, { - "epoch": 0.32, - "learning_rate": 0.0002512551079976649, - "loss": 0.021, + "epoch": 0.15, + "learning_rate": 0.00027725151479988496, + "loss": 0.0308, "step": 30060 }, { - "epoch": 0.33, - "learning_rate": 0.000251238892132062, - "loss": 0.019, + "epoch": 0.15, + "learning_rate": 0.00027724394710687095, + "loss": 0.0281, "step": 30070 }, { - "epoch": 0.33, - "learning_rate": 0.00025122267626645907, - "loss": 0.0263, + "epoch": 0.15, + "learning_rate": 0.0002772363794138569, + "loss": 0.0299, "step": 30080 }, { - "epoch": 0.33, - "learning_rate": 0.0002512064604008562, - "loss": 0.0234, + "epoch": 0.15, + "learning_rate": 0.0002772288117208429, + "loss": 0.03, "step": 30090 }, { - "epoch": 0.33, - "learning_rate": 0.00025119024453525325, - "loss": 0.0274, + "epoch": 0.15, + "learning_rate": 0.0002772212440278289, + "loss": 0.0269, "step": 30100 }, { - "epoch": 0.33, - "learning_rate": 0.00025117402866965037, - "loss": 0.0233, + "epoch": 0.15, + "learning_rate": 0.00027721367633481487, + "loss": 0.0316, "step": 30110 }, { - "epoch": 0.33, - "learning_rate": 0.00025115781280404744, - "loss": 0.0223, + "epoch": 0.15, + "learning_rate": 0.0002772061086418009, + "loss": 0.0249, "step": 30120 }, { - "epoch": 0.33, - "learning_rate": 0.00025114159693844456, - "loss": 0.0236, + "epoch": 0.15, + "learning_rate": 0.0002771985409487869, + "loss": 0.0273, "step": 30130 }, { - "epoch": 0.33, - "learning_rate": 0.0002511253810728416, - "loss": 0.0221, + "epoch": 0.15, + "learning_rate": 0.00027719097325577287, + "loss": 0.0247, "step": 30140 }, { - "epoch": 0.33, - "learning_rate": 0.00025110916520723874, - "loss": 0.0243, + "epoch": 0.15, + "learning_rate": 0.00027718340556275885, + "loss": 0.0259, "step": 30150 }, { - "epoch": 0.33, - "learning_rate": 0.0002510929493416358, - "loss": 0.0211, + "epoch": 0.15, + "learning_rate": 0.00027717583786974483, + "loss": 0.0293, "step": 30160 }, { - "epoch": 0.33, - "learning_rate": 0.00025107673347603293, - "loss": 0.0277, + "epoch": 0.15, + "learning_rate": 0.0002771682701767308, + "loss": 0.0249, "step": 30170 }, { - "epoch": 0.33, - "learning_rate": 0.00025106051761043005, - "loss": 0.0247, + "epoch": 0.15, + "learning_rate": 0.00027716070248371685, + "loss": 0.0281, "step": 30180 }, { - "epoch": 0.33, - "learning_rate": 0.0002510443017448271, - "loss": 0.0238, + "epoch": 0.15, + "learning_rate": 0.00027715313479070283, + "loss": 0.0224, "step": 30190 }, { - "epoch": 0.33, - "learning_rate": 0.0002510280858792242, - "loss": 0.0274, + "epoch": 0.15, + "learning_rate": 0.0002771455670976888, + "loss": 0.0264, "step": 30200 }, { - "epoch": 0.33, - "learning_rate": 0.0002510118700136213, - "loss": 0.024, + "epoch": 0.15, + "learning_rate": 0.0002771379994046748, + "loss": 0.0284, "step": 30210 }, { - "epoch": 0.33, - "learning_rate": 0.0002509956541480184, - "loss": 0.0216, + "epoch": 0.15, + "learning_rate": 0.0002771304317116608, + "loss": 0.0267, "step": 30220 }, { - "epoch": 0.33, - "learning_rate": 0.0002509794382824155, - "loss": 0.0233, + "epoch": 0.15, + "learning_rate": 0.00027712286401864676, + "loss": 0.0297, "step": 30230 }, { - "epoch": 0.33, - "learning_rate": 0.0002509632224168126, - "loss": 0.0279, + "epoch": 0.15, + "learning_rate": 0.00027711529632563274, + "loss": 0.0244, "step": 30240 }, { - "epoch": 0.33, - "learning_rate": 0.00025094700655120967, - "loss": 0.0213, + "epoch": 0.15, + "learning_rate": 0.0002771077286326188, + "loss": 0.0247, "step": 30250 }, { - "epoch": 0.33, - "learning_rate": 0.0002509307906856068, - "loss": 0.0215, + "epoch": 0.15, + "learning_rate": 0.00027710016093960476, + "loss": 0.026, "step": 30260 }, { - "epoch": 0.33, - "learning_rate": 0.00025091457482000386, - "loss": 0.0249, + "epoch": 0.15, + "learning_rate": 0.00027709259324659074, + "loss": 0.0262, "step": 30270 }, { - "epoch": 0.33, - "learning_rate": 0.000250898358954401, - "loss": 0.0257, + "epoch": 0.15, + "learning_rate": 0.0002770850255535767, + "loss": 0.0253, "step": 30280 }, { - "epoch": 0.33, - "learning_rate": 0.00025088214308879804, - "loss": 0.0213, + "epoch": 0.15, + "learning_rate": 0.0002770774578605627, + "loss": 0.0328, "step": 30290 }, { - "epoch": 0.33, - "learning_rate": 0.00025086592722319516, - "loss": 0.0271, + "epoch": 0.15, + "learning_rate": 0.0002770698901675487, + "loss": 0.0283, "step": 30300 }, { - "epoch": 0.33, - "learning_rate": 0.0002508497113575923, - "loss": 0.0262, + "epoch": 0.15, + "learning_rate": 0.0002770623224745347, + "loss": 0.0256, "step": 30310 }, { - "epoch": 0.33, - "learning_rate": 0.00025083349549198935, - "loss": 0.0265, + "epoch": 0.15, + "learning_rate": 0.0002770547547815207, + "loss": 0.0247, "step": 30320 }, { - "epoch": 0.33, - "learning_rate": 0.0002508172796263864, - "loss": 0.022, + "epoch": 0.15, + "learning_rate": 0.0002770471870885067, + "loss": 0.0259, "step": 30330 }, { - "epoch": 0.33, - "learning_rate": 0.00025080106376078353, - "loss": 0.0211, + "epoch": 0.15, + "learning_rate": 0.00027703961939549266, + "loss": 0.0289, "step": 30340 }, { - "epoch": 0.33, - "learning_rate": 0.00025078484789518065, - "loss": 0.0256, + "epoch": 0.15, + "learning_rate": 0.00027703205170247864, + "loss": 0.0257, "step": 30350 }, { - "epoch": 0.33, - "learning_rate": 0.0002507686320295777, - "loss": 0.0234, + "epoch": 0.15, + "learning_rate": 0.0002770244840094646, + "loss": 0.031, "step": 30360 }, { - "epoch": 0.33, - "learning_rate": 0.0002507524161639748, - "loss": 0.0211, + "epoch": 0.15, + "learning_rate": 0.0002770169163164506, + "loss": 0.0309, "step": 30370 }, { - "epoch": 0.33, - "learning_rate": 0.0002507362002983719, - "loss": 0.0249, + "epoch": 0.15, + "learning_rate": 0.00027700934862343664, + "loss": 0.0271, "step": 30380 }, { - "epoch": 0.33, - "learning_rate": 0.000250719984432769, - "loss": 0.0239, + "epoch": 0.15, + "learning_rate": 0.0002770017809304226, + "loss": 0.0275, "step": 30390 }, { - "epoch": 0.33, - "learning_rate": 0.0002507037685671661, - "loss": 0.0248, + "epoch": 0.15, + "learning_rate": 0.0002769942132374086, + "loss": 0.0253, "step": 30400 }, { - "epoch": 0.33, - "learning_rate": 0.00025068755270156315, - "loss": 0.0215, + "epoch": 0.15, + "learning_rate": 0.0002769866455443946, + "loss": 0.0263, "step": 30410 }, { - "epoch": 0.33, - "learning_rate": 0.0002506713368359603, - "loss": 0.0217, + "epoch": 0.15, + "learning_rate": 0.00027697907785138057, + "loss": 0.0239, "step": 30420 }, { - "epoch": 0.33, - "learning_rate": 0.0002506551209703574, - "loss": 0.0238, + "epoch": 0.15, + "learning_rate": 0.00027697151015836655, + "loss": 0.039, "step": 30430 }, { - "epoch": 0.33, - "learning_rate": 0.00025063890510475446, - "loss": 0.0232, + "epoch": 0.15, + "learning_rate": 0.0002769639424653526, + "loss": 0.0278, "step": 30440 }, { - "epoch": 0.33, - "learning_rate": 0.0002506226892391516, - "loss": 0.0223, + "epoch": 0.15, + "learning_rate": 0.00027695637477233857, + "loss": 0.0306, "step": 30450 }, { - "epoch": 0.33, - "learning_rate": 0.00025060647337354864, - "loss": 0.0228, + "epoch": 0.15, + "learning_rate": 0.00027694880707932455, + "loss": 0.0284, "step": 30460 }, { - "epoch": 0.33, - "learning_rate": 0.00025059025750794576, - "loss": 0.0248, + "epoch": 0.15, + "learning_rate": 0.00027694123938631053, + "loss": 0.0228, "step": 30470 }, { - "epoch": 0.33, - "learning_rate": 0.0002505740416423429, - "loss": 0.0241, + "epoch": 0.15, + "learning_rate": 0.0002769336716932965, + "loss": 0.0214, "step": 30480 }, { - "epoch": 0.33, - "learning_rate": 0.00025055782577673995, - "loss": 0.0263, + "epoch": 0.15, + "learning_rate": 0.0002769261040002825, + "loss": 0.0261, "step": 30490 }, { - "epoch": 0.33, - "learning_rate": 0.000250541609911137, - "loss": 0.0217, + "epoch": 0.15, + "learning_rate": 0.0002769185363072685, + "loss": 0.0256, "step": 30500 }, { - "epoch": 0.33, - "learning_rate": 0.00025052539404553414, - "loss": 0.0247, + "epoch": 0.15, + "learning_rate": 0.0002769109686142545, + "loss": 0.0233, "step": 30510 }, { - "epoch": 0.33, - "learning_rate": 0.00025050917817993126, - "loss": 0.02, + "epoch": 0.15, + "learning_rate": 0.0002769034009212405, + "loss": 0.027, "step": 30520 }, { - "epoch": 0.33, - "learning_rate": 0.0002504929623143283, - "loss": 0.0244, + "epoch": 0.15, + "learning_rate": 0.00027689583322822647, + "loss": 0.0232, "step": 30530 }, { - "epoch": 0.33, - "learning_rate": 0.0002504767464487254, - "loss": 0.0248, + "epoch": 0.15, + "learning_rate": 0.00027688826553521245, + "loss": 0.0211, "step": 30540 }, { - "epoch": 0.33, - "learning_rate": 0.0002504605305831225, - "loss": 0.0241, + "epoch": 0.15, + "learning_rate": 0.00027688069784219843, + "loss": 0.0259, "step": 30550 }, { - "epoch": 0.33, - "learning_rate": 0.0002504443147175196, - "loss": 0.0223, + "epoch": 0.15, + "learning_rate": 0.0002768731301491844, + "loss": 0.0233, "step": 30560 }, { - "epoch": 0.33, - "learning_rate": 0.0002504280988519167, - "loss": 0.0235, + "epoch": 0.15, + "learning_rate": 0.00027686556245617045, + "loss": 0.0195, "step": 30570 }, { - "epoch": 0.33, - "learning_rate": 0.00025041188298631376, - "loss": 0.0203, + "epoch": 0.15, + "learning_rate": 0.00027685799476315643, + "loss": 0.0276, "step": 30580 }, { - "epoch": 0.33, - "learning_rate": 0.0002503956671207109, - "loss": 0.0212, + "epoch": 0.15, + "learning_rate": 0.0002768504270701424, + "loss": 0.0213, "step": 30590 }, { - "epoch": 0.33, - "learning_rate": 0.000250379451255108, - "loss": 0.0244, + "epoch": 0.15, + "learning_rate": 0.0002768428593771284, + "loss": 0.0234, "step": 30600 }, { - "epoch": 0.33, - "learning_rate": 0.00025036323538950506, - "loss": 0.0225, + "epoch": 0.15, + "learning_rate": 0.0002768352916841144, + "loss": 0.0259, "step": 30610 }, { - "epoch": 0.33, - "learning_rate": 0.0002503470195239022, - "loss": 0.023, + "epoch": 0.15, + "learning_rate": 0.00027682772399110036, + "loss": 0.0246, "step": 30620 }, { - "epoch": 0.33, - "learning_rate": 0.00025033080365829925, - "loss": 0.0247, + "epoch": 0.15, + "learning_rate": 0.0002768201562980864, + "loss": 0.0295, "step": 30630 }, { - "epoch": 0.33, - "learning_rate": 0.00025031458779269637, - "loss": 0.0249, + "epoch": 0.15, + "learning_rate": 0.0002768125886050724, + "loss": 0.0258, "step": 30640 }, { - "epoch": 0.33, - "learning_rate": 0.00025029837192709343, - "loss": 0.0289, + "epoch": 0.15, + "learning_rate": 0.00027680502091205836, + "loss": 0.0265, "step": 30650 }, { - "epoch": 0.33, - "learning_rate": 0.00025028215606149055, - "loss": 0.0242, + "epoch": 0.15, + "learning_rate": 0.00027679745321904434, + "loss": 0.0241, "step": 30660 }, { - "epoch": 0.33, - "learning_rate": 0.0002502659401958876, - "loss": 0.0245, + "epoch": 0.15, + "learning_rate": 0.0002767898855260303, + "loss": 0.0441, "step": 30670 }, { - "epoch": 0.33, - "learning_rate": 0.00025024972433028474, - "loss": 0.0249, + "epoch": 0.15, + "learning_rate": 0.0002767823178330163, + "loss": 0.0257, "step": 30680 }, { - "epoch": 0.33, - "learning_rate": 0.0002502335084646818, - "loss": 0.0184, + "epoch": 0.15, + "learning_rate": 0.00027677475014000234, + "loss": 0.029, "step": 30690 }, { - "epoch": 0.33, - "learning_rate": 0.0002502172925990789, - "loss": 0.0227, + "epoch": 0.15, + "learning_rate": 0.0002767671824469883, + "loss": 0.0312, "step": 30700 }, { - "epoch": 0.33, - "learning_rate": 0.000250201076733476, - "loss": 0.0228, + "epoch": 0.15, + "learning_rate": 0.0002767596147539743, + "loss": 0.0256, "step": 30710 }, { - "epoch": 0.33, - "learning_rate": 0.0002501848608678731, - "loss": 0.0262, + "epoch": 0.15, + "learning_rate": 0.0002767520470609603, + "loss": 0.0256, "step": 30720 }, { - "epoch": 0.33, - "learning_rate": 0.0002501686450022702, - "loss": 0.0207, + "epoch": 0.16, + "learning_rate": 0.00027674447936794626, + "loss": 0.0235, "step": 30730 }, { - "epoch": 0.33, - "learning_rate": 0.0002501524291366673, - "loss": 0.0201, + "epoch": 0.16, + "learning_rate": 0.00027673691167493224, + "loss": 0.0247, "step": 30740 }, { - "epoch": 0.33, - "learning_rate": 0.0002501362132710644, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.0002767293439819182, + "loss": 0.0266, "step": 30750 }, { - "epoch": 0.33, - "learning_rate": 0.0002501199974054615, - "loss": 0.0337, + "epoch": 0.16, + "learning_rate": 0.00027672177628890426, + "loss": 0.0233, "step": 30760 }, { - "epoch": 0.33, - "learning_rate": 0.00025010378153985855, - "loss": 0.0294, + "epoch": 0.16, + "learning_rate": 0.00027671420859589024, + "loss": 0.0232, "step": 30770 }, { - "epoch": 0.33, - "learning_rate": 0.00025008756567425567, - "loss": 0.0249, + "epoch": 0.16, + "learning_rate": 0.0002767066409028762, + "loss": 0.0239, "step": 30780 }, { - "epoch": 0.33, - "learning_rate": 0.0002500713498086528, - "loss": 0.0222, + "epoch": 0.16, + "learning_rate": 0.0002766990732098622, + "loss": 0.0255, "step": 30790 }, { - "epoch": 0.33, - "learning_rate": 0.00025005513394304985, - "loss": 0.0223, + "epoch": 0.16, + "learning_rate": 0.0002766915055168482, + "loss": 0.0253, "step": 30800 }, { - "epoch": 0.33, - "learning_rate": 0.0002500389180774469, - "loss": 0.0232, + "epoch": 0.16, + "learning_rate": 0.00027668393782383417, + "loss": 0.0265, "step": 30810 }, { - "epoch": 0.33, - "learning_rate": 0.00025002270221184404, - "loss": 0.0246, + "epoch": 0.16, + "learning_rate": 0.00027667637013082015, + "loss": 0.0232, "step": 30820 }, { - "epoch": 0.33, - "learning_rate": 0.00025000648634624116, - "loss": 0.0284, + "epoch": 0.16, + "learning_rate": 0.00027666880243780613, + "loss": 0.0303, "step": 30830 }, { - "epoch": 0.33, - "learning_rate": 0.0002499902704806382, - "loss": 0.0254, + "epoch": 0.16, + "learning_rate": 0.0002766612347447921, + "loss": 0.0239, "step": 30840 }, { - "epoch": 0.33, - "learning_rate": 0.0002499740546150353, - "loss": 0.0212, + "epoch": 0.16, + "learning_rate": 0.0002766536670517781, + "loss": 0.0263, "step": 30850 }, { - "epoch": 0.33, - "learning_rate": 0.0002499578387494324, - "loss": 0.0261, + "epoch": 0.16, + "learning_rate": 0.00027664609935876413, + "loss": 0.0243, "step": 30860 }, { - "epoch": 0.33, - "learning_rate": 0.00024994162288382953, - "loss": 0.0294, + "epoch": 0.16, + "learning_rate": 0.0002766385316657501, + "loss": 0.0242, "step": 30870 }, { - "epoch": 0.33, - "learning_rate": 0.0002499254070182266, - "loss": 0.0207, + "epoch": 0.16, + "learning_rate": 0.0002766309639727361, + "loss": 0.0213, "step": 30880 }, { - "epoch": 0.33, - "learning_rate": 0.0002499091911526237, + "epoch": 0.16, + "learning_rate": 0.0002766233962797221, "loss": 0.0252, "step": 30890 }, { - "epoch": 0.33, - "learning_rate": 0.0002498929752870208, - "loss": 0.0237, + "epoch": 0.16, + "learning_rate": 0.00027661582858670806, + "loss": 0.0249, "step": 30900 }, { - "epoch": 0.33, - "learning_rate": 0.0002498767594214179, - "loss": 0.0234, + "epoch": 0.16, + "learning_rate": 0.00027660826089369404, + "loss": 0.0239, "step": 30910 }, { - "epoch": 0.33, - "learning_rate": 0.000249860543555815, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.00027660069320068007, + "loss": 0.0233, "step": 30920 }, { - "epoch": 0.33, - "learning_rate": 0.0002498443276902121, - "loss": 0.0234, + "epoch": 0.16, + "learning_rate": 0.00027659312550766605, + "loss": 0.0233, "step": 30930 }, { - "epoch": 0.33, - "learning_rate": 0.00024982811182460915, - "loss": 0.0235, + "epoch": 0.16, + "learning_rate": 0.00027658555781465204, + "loss": 0.0249, "step": 30940 }, { - "epoch": 0.33, - "learning_rate": 0.00024981189595900627, - "loss": 0.0232, + "epoch": 0.16, + "learning_rate": 0.000276577990121638, + "loss": 0.0231, "step": 30950 }, { - "epoch": 0.33, - "learning_rate": 0.0002497956800934034, - "loss": 0.0235, + "epoch": 0.16, + "learning_rate": 0.000276570422428624, + "loss": 0.0243, "step": 30960 }, { - "epoch": 0.33, - "learning_rate": 0.00024977946422780046, - "loss": 0.0239, + "epoch": 0.16, + "learning_rate": 0.00027656285473561, + "loss": 0.032, "step": 30970 }, { - "epoch": 0.33, - "learning_rate": 0.0002497632483621975, - "loss": 0.0221, + "epoch": 0.16, + "learning_rate": 0.00027655528704259596, + "loss": 0.0222, "step": 30980 }, { - "epoch": 0.34, - "learning_rate": 0.00024974703249659464, - "loss": 0.0241, + "epoch": 0.16, + "learning_rate": 0.000276547719349582, + "loss": 0.0229, "step": 30990 }, { - "epoch": 0.34, - "learning_rate": 0.00024973081663099176, - "loss": 0.0223, + "epoch": 0.16, + "learning_rate": 0.000276540151656568, + "loss": 0.0259, "step": 31000 }, { - "epoch": 0.34, - "eval_cer": 0.92159989715741, - "eval_loss": 0.01651957258582115, - "eval_runtime": 121.4844, - "eval_samples_per_second": 16.463, - "eval_steps_per_second": 4.116, + "epoch": 0.16, + "eval_cer": 0.914447936792278, + "eval_loss": 0.018999282270669937, + "eval_runtime": 117.1152, + "eval_samples_per_second": 17.077, + "eval_steps_per_second": 4.269, "step": 31000 }, { - "epoch": 0.34, - "learning_rate": 0.0002497146007653888, - "loss": 0.0224, + "epoch": 0.16, + "learning_rate": 0.00027653258396355396, + "loss": 0.0254, "step": 31010 }, { - "epoch": 0.34, - "learning_rate": 0.0002496983848997859, - "loss": 0.0207, + "epoch": 0.16, + "learning_rate": 0.00027652501627053994, + "loss": 0.0239, "step": 31020 }, { - "epoch": 0.34, - "learning_rate": 0.000249682169034183, - "loss": 0.0226, + "epoch": 0.16, + "learning_rate": 0.0002765174485775259, + "loss": 0.0342, "step": 31030 }, { - "epoch": 0.34, - "learning_rate": 0.00024966595316858013, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.0002765098808845119, + "loss": 0.0252, "step": 31040 }, { - "epoch": 0.34, - "learning_rate": 0.00024964973730297725, - "loss": 0.0226, + "epoch": 0.16, + "learning_rate": 0.00027650231319149794, + "loss": 0.0225, "step": 31050 }, { - "epoch": 0.34, - "learning_rate": 0.0002496335214373743, - "loss": 0.0221, + "epoch": 0.16, + "learning_rate": 0.0002764947454984839, + "loss": 0.0251, "step": 31060 }, { - "epoch": 0.34, - "learning_rate": 0.0002496173055717714, - "loss": 0.0184, + "epoch": 0.16, + "learning_rate": 0.0002764871778054699, + "loss": 0.0287, "step": 31070 }, { - "epoch": 0.34, - "learning_rate": 0.0002496010897061685, - "loss": 0.0215, + "epoch": 0.16, + "learning_rate": 0.0002764796101124559, + "loss": 0.0304, "step": 31080 }, { - "epoch": 0.34, - "learning_rate": 0.0002495848738405656, - "loss": 0.0216, + "epoch": 0.16, + "learning_rate": 0.00027647204241944187, + "loss": 0.0259, "step": 31090 }, { - "epoch": 0.34, - "learning_rate": 0.0002495686579749627, - "loss": 0.0281, + "epoch": 0.16, + "learning_rate": 0.00027646447472642785, + "loss": 0.0233, "step": 31100 }, { - "epoch": 0.34, - "learning_rate": 0.00024955244210935975, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.00027645690703341383, + "loss": 0.0262, "step": 31110 }, { - "epoch": 0.34, - "learning_rate": 0.0002495362262437569, - "loss": 0.0261, + "epoch": 0.16, + "learning_rate": 0.00027644933934039986, + "loss": 0.0269, "step": 31120 }, { - "epoch": 0.34, - "learning_rate": 0.000249520010378154, - "loss": 0.0255, + "epoch": 0.16, + "learning_rate": 0.00027644177164738585, + "loss": 0.0222, "step": 31130 }, { - "epoch": 0.34, - "learning_rate": 0.00024950379451255106, - "loss": 0.0264, + "epoch": 0.16, + "learning_rate": 0.0002764342039543718, + "loss": 0.0196, "step": 31140 }, { - "epoch": 0.34, - "learning_rate": 0.0002494875786469481, - "loss": 0.0247, + "epoch": 0.16, + "learning_rate": 0.0002764266362613578, + "loss": 0.0283, "step": 31150 }, { - "epoch": 0.34, - "learning_rate": 0.00024947136278134524, - "loss": 0.0248, + "epoch": 0.16, + "learning_rate": 0.0002764190685683438, + "loss": 0.024, "step": 31160 }, { - "epoch": 0.34, - "learning_rate": 0.00024945514691574236, - "loss": 0.0321, + "epoch": 0.16, + "learning_rate": 0.00027641150087532977, + "loss": 0.0239, "step": 31170 }, { - "epoch": 0.34, - "learning_rate": 0.00024943893105013943, - "loss": 0.0244, + "epoch": 0.16, + "learning_rate": 0.0002764039331823158, + "loss": 0.0208, "step": 31180 }, { - "epoch": 0.34, - "learning_rate": 0.00024942271518453655, - "loss": 0.0266, + "epoch": 0.16, + "learning_rate": 0.0002763963654893018, + "loss": 0.024, "step": 31190 }, { - "epoch": 0.34, - "learning_rate": 0.0002494064993189336, - "loss": 0.023, + "epoch": 0.16, + "learning_rate": 0.00027638879779628777, + "loss": 0.0275, "step": 31200 }, { - "epoch": 0.34, - "learning_rate": 0.00024939028345333074, - "loss": 0.0238, + "epoch": 0.16, + "learning_rate": 0.00027638123010327375, + "loss": 0.0274, "step": 31210 }, { - "epoch": 0.34, - "learning_rate": 0.0002493740675877278, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.00027637366241025973, + "loss": 0.0258, "step": 31220 }, { - "epoch": 0.34, - "learning_rate": 0.0002493578517221249, - "loss": 0.02, + "epoch": 0.16, + "learning_rate": 0.0002763660947172457, + "loss": 0.0258, "step": 31230 }, { - "epoch": 0.34, - "learning_rate": 0.000249341635856522, - "loss": 0.0227, + "epoch": 0.16, + "learning_rate": 0.00027635852702423175, + "loss": 0.0236, "step": 31240 }, { - "epoch": 0.34, - "learning_rate": 0.0002493254199909191, - "loss": 0.0253, + "epoch": 0.16, + "learning_rate": 0.00027635095933121773, + "loss": 0.0244, "step": 31250 }, { - "epoch": 0.34, - "learning_rate": 0.00024930920412531617, - "loss": 0.0218, + "epoch": 0.16, + "learning_rate": 0.0002763433916382037, + "loss": 0.0262, "step": 31260 }, { - "epoch": 0.34, - "learning_rate": 0.0002492929882597133, + "epoch": 0.16, + "learning_rate": 0.0002763358239451897, "loss": 0.0266, "step": 31270 }, { - "epoch": 0.34, - "learning_rate": 0.00024927677239411036, - "loss": 0.0227, + "epoch": 0.16, + "learning_rate": 0.0002763282562521757, + "loss": 0.0286, "step": 31280 }, { - "epoch": 0.34, - "learning_rate": 0.0002492605565285075, - "loss": 0.0262, + "epoch": 0.16, + "learning_rate": 0.00027632068855916166, + "loss": 0.0289, "step": 31290 }, { - "epoch": 0.34, - "learning_rate": 0.00024924434066290454, - "loss": 0.0231, + "epoch": 0.16, + "learning_rate": 0.00027631312086614764, + "loss": 0.0289, "step": 31300 }, { - "epoch": 0.34, - "learning_rate": 0.00024922812479730166, - "loss": 0.0232, + "epoch": 0.16, + "learning_rate": 0.0002763055531731337, + "loss": 0.0294, "step": 31310 }, { - "epoch": 0.34, - "learning_rate": 0.0002492119089316988, - "loss": 0.0218, + "epoch": 0.16, + "learning_rate": 0.00027629798548011966, + "loss": 0.0253, "step": 31320 }, { - "epoch": 0.34, - "learning_rate": 0.00024919569306609585, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.00027629041778710564, + "loss": 0.0262, "step": 31330 }, { - "epoch": 0.34, - "learning_rate": 0.0002491794772004929, - "loss": 0.0277, + "epoch": 0.16, + "learning_rate": 0.0002762828500940916, + "loss": 0.0199, "step": 31340 }, { - "epoch": 0.34, - "learning_rate": 0.00024916326133489003, - "loss": 0.0198, + "epoch": 0.16, + "learning_rate": 0.0002762752824010776, + "loss": 0.024, "step": 31350 }, { - "epoch": 0.34, - "learning_rate": 0.00024914704546928715, - "loss": 0.0209, + "epoch": 0.16, + "learning_rate": 0.0002762677147080636, + "loss": 0.0228, "step": 31360 }, { - "epoch": 0.34, - "learning_rate": 0.0002491308296036842, - "loss": 0.0188, + "epoch": 0.16, + "learning_rate": 0.0002762601470150496, + "loss": 0.0392, "step": 31370 }, { - "epoch": 0.34, - "learning_rate": 0.0002491146137380813, - "loss": 0.0211, + "epoch": 0.16, + "learning_rate": 0.0002762525793220356, + "loss": 0.0231, "step": 31380 }, { - "epoch": 0.34, - "learning_rate": 0.0002490983978724784, - "loss": 0.0255, + "epoch": 0.16, + "learning_rate": 0.0002762450116290216, + "loss": 0.0297, "step": 31390 }, { - "epoch": 0.34, - "learning_rate": 0.0002490821820068755, - "loss": 0.0222, + "epoch": 0.16, + "learning_rate": 0.00027623744393600756, + "loss": 0.0354, "step": 31400 }, { - "epoch": 0.34, - "learning_rate": 0.0002490659661412726, - "loss": 0.0262, + "epoch": 0.16, + "learning_rate": 0.00027622987624299354, + "loss": 0.0284, "step": 31410 }, { - "epoch": 0.34, - "learning_rate": 0.00024904975027566966, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.0002762223085499795, + "loss": 0.0366, "step": 31420 }, { - "epoch": 0.34, - "learning_rate": 0.0002490335344100668, - "loss": 0.0213, + "epoch": 0.16, + "learning_rate": 0.00027621474085696556, + "loss": 0.0256, "step": 31430 }, { - "epoch": 0.34, - "learning_rate": 0.0002490173185444639, - "loss": 0.0221, + "epoch": 0.16, + "learning_rate": 0.00027620717316395154, + "loss": 0.0294, "step": 31440 }, { - "epoch": 0.34, - "learning_rate": 0.00024900110267886096, - "loss": 0.0435, + "epoch": 0.16, + "learning_rate": 0.0002761996054709375, + "loss": 0.0249, "step": 31450 }, { - "epoch": 0.34, - "learning_rate": 0.0002489848868132581, - "loss": 0.0214, + "epoch": 0.16, + "learning_rate": 0.0002761920377779235, + "loss": 0.0317, "step": 31460 }, { - "epoch": 0.34, - "learning_rate": 0.00024896867094765515, - "loss": 0.0214, + "epoch": 0.16, + "learning_rate": 0.0002761844700849095, + "loss": 0.0279, "step": 31470 }, { - "epoch": 0.34, - "learning_rate": 0.00024895245508205227, - "loss": 0.0237, + "epoch": 0.16, + "learning_rate": 0.00027617690239189547, + "loss": 0.0217, "step": 31480 }, { - "epoch": 0.34, - "learning_rate": 0.0002489362392164494, - "loss": 0.0207, + "epoch": 0.16, + "learning_rate": 0.00027616933469888145, + "loss": 0.0259, "step": 31490 }, { - "epoch": 0.34, - "learning_rate": 0.00024892002335084645, - "loss": 0.0238, + "epoch": 0.16, + "learning_rate": 0.0002761617670058675, + "loss": 0.0209, "step": 31500 }, { - "epoch": 0.34, - "learning_rate": 0.0002489038074852435, - "loss": 0.0212, + "epoch": 0.16, + "learning_rate": 0.00027615419931285347, + "loss": 0.0255, "step": 31510 }, { - "epoch": 0.34, - "learning_rate": 0.00024888759161964064, - "loss": 0.0211, + "epoch": 0.16, + "learning_rate": 0.00027614663161983945, + "loss": 0.0325, "step": 31520 }, { - "epoch": 0.34, - "learning_rate": 0.00024887137575403776, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.00027613906392682543, + "loss": 0.0311, "step": 31530 }, { - "epoch": 0.34, - "learning_rate": 0.0002488551598884348, - "loss": 0.0257, + "epoch": 0.16, + "learning_rate": 0.0002761314962338114, + "loss": 0.0289, "step": 31540 }, { - "epoch": 0.34, - "learning_rate": 0.0002488389440228319, - "loss": 0.0266, + "epoch": 0.16, + "learning_rate": 0.0002761239285407974, + "loss": 0.0283, "step": 31550 }, { - "epoch": 0.34, - "learning_rate": 0.000248822728157229, - "loss": 0.0196, + "epoch": 0.16, + "learning_rate": 0.00027611636084778343, + "loss": 0.0269, "step": 31560 }, { - "epoch": 0.34, - "learning_rate": 0.00024880651229162613, - "loss": 0.0201, + "epoch": 0.16, + "learning_rate": 0.0002761087931547694, + "loss": 0.027, "step": 31570 }, { - "epoch": 0.34, - "learning_rate": 0.0002487902964260232, - "loss": 0.0218, + "epoch": 0.16, + "learning_rate": 0.0002761012254617554, + "loss": 0.0232, "step": 31580 }, { - "epoch": 0.34, - "learning_rate": 0.00024877408056042026, - "loss": 0.0222, + "epoch": 0.16, + "learning_rate": 0.00027609365776874137, + "loss": 0.025, "step": 31590 }, { - "epoch": 0.34, - "learning_rate": 0.0002487578646948174, - "loss": 0.0189, + "epoch": 0.16, + "learning_rate": 0.00027608609007572735, + "loss": 0.025, "step": 31600 }, { - "epoch": 0.34, - "learning_rate": 0.0002487416488292145, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.00027607852238271333, + "loss": 0.0265, "step": 31610 }, { - "epoch": 0.34, - "learning_rate": 0.00024872543296361157, - "loss": 0.0231, + "epoch": 0.16, + "learning_rate": 0.0002760709546896993, + "loss": 0.0258, "step": 31620 }, { - "epoch": 0.34, - "learning_rate": 0.0002487092170980087, - "loss": 0.0233, + "epoch": 0.16, + "learning_rate": 0.00027606338699668535, + "loss": 0.0225, "step": 31630 }, { - "epoch": 0.34, - "learning_rate": 0.00024869300123240575, - "loss": 0.022, + "epoch": 0.16, + "learning_rate": 0.00027605581930367133, + "loss": 0.0229, "step": 31640 }, { - "epoch": 0.34, - "learning_rate": 0.00024867678536680287, - "loss": 0.021, + "epoch": 0.16, + "learning_rate": 0.0002760482516106573, + "loss": 0.0274, "step": 31650 }, { - "epoch": 0.34, - "learning_rate": 0.0002486605695012, - "loss": 0.0196, + "epoch": 0.16, + "learning_rate": 0.0002760406839176433, + "loss": 0.0216, "step": 31660 }, { - "epoch": 0.34, - "learning_rate": 0.00024864435363559706, - "loss": 0.0187, + "epoch": 0.16, + "learning_rate": 0.0002760331162246293, + "loss": 0.0267, "step": 31670 }, { - "epoch": 0.34, - "learning_rate": 0.0002486281377699941, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.00027602554853161526, + "loss": 0.0232, "step": 31680 }, { - "epoch": 0.34, - "learning_rate": 0.00024861192190439124, - "loss": 0.0213, + "epoch": 0.16, + "learning_rate": 0.0002760179808386013, + "loss": 0.0241, "step": 31690 }, { - "epoch": 0.34, - "learning_rate": 0.00024859570603878836, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.0002760104131455873, + "loss": 0.0282, "step": 31700 }, { - "epoch": 0.34, - "learning_rate": 0.00024857949017318543, - "loss": 0.0196, + "epoch": 0.16, + "learning_rate": 0.00027600284545257326, + "loss": 0.0242, "step": 31710 }, { - "epoch": 0.34, - "learning_rate": 0.0002485632743075825, - "loss": 0.025, + "epoch": 0.16, + "learning_rate": 0.00027599527775955924, + "loss": 0.0243, "step": 31720 }, { - "epoch": 0.34, - "learning_rate": 0.0002485470584419796, - "loss": 0.0241, + "epoch": 0.16, + "learning_rate": 0.0002759877100665452, + "loss": 0.027, "step": 31730 }, { - "epoch": 0.34, - "learning_rate": 0.00024853084257637673, - "loss": 0.0192, + "epoch": 0.16, + "learning_rate": 0.0002759801423735312, + "loss": 0.0262, "step": 31740 }, { - "epoch": 0.34, - "learning_rate": 0.0002485146267107738, - "loss": 0.0225, + "epoch": 0.16, + "learning_rate": 0.00027597257468051724, + "loss": 0.0339, "step": 31750 }, { - "epoch": 0.34, - "learning_rate": 0.0002484984108451709, - "loss": 0.0199, + "epoch": 0.16, + "learning_rate": 0.0002759650069875032, + "loss": 0.0257, "step": 31760 }, { - "epoch": 0.34, - "learning_rate": 0.000248482194979568, - "loss": 0.0225, + "epoch": 0.16, + "learning_rate": 0.0002759574392944892, + "loss": 0.0305, "step": 31770 }, { - "epoch": 0.34, - "learning_rate": 0.0002484659791139651, - "loss": 0.0256, + "epoch": 0.16, + "learning_rate": 0.0002759498716014752, + "loss": 0.0229, "step": 31780 }, { - "epoch": 0.34, - "learning_rate": 0.00024844976324836217, - "loss": 0.0233, + "epoch": 0.16, + "learning_rate": 0.00027594230390846116, + "loss": 0.0226, "step": 31790 }, { - "epoch": 0.34, - "learning_rate": 0.0002484335473827593, - "loss": 0.0433, + "epoch": 0.16, + "learning_rate": 0.00027593473621544714, + "loss": 0.0289, "step": 31800 }, { - "epoch": 0.34, - "learning_rate": 0.00024841733151715635, - "loss": 0.0341, + "epoch": 0.16, + "learning_rate": 0.0002759271685224331, + "loss": 0.0262, "step": 31810 }, { - "epoch": 0.34, - "learning_rate": 0.0002484011156515535, - "loss": 0.0204, + "epoch": 0.16, + "learning_rate": 0.00027591960082941916, + "loss": 0.0232, "step": 31820 }, { - "epoch": 0.34, - "learning_rate": 0.00024838489978595054, - "loss": 0.0215, + "epoch": 0.16, + "learning_rate": 0.00027591203313640514, + "loss": 0.0242, "step": 31830 }, { - "epoch": 0.34, - "learning_rate": 0.00024836868392034766, - "loss": 0.0257, + "epoch": 0.16, + "learning_rate": 0.0002759044654433911, + "loss": 0.0299, "step": 31840 }, { - "epoch": 0.34, - "learning_rate": 0.0002483524680547447, - "loss": 0.0258, + "epoch": 0.16, + "learning_rate": 0.0002758968977503771, + "loss": 0.0288, "step": 31850 }, { - "epoch": 0.34, - "learning_rate": 0.00024833625218914185, - "loss": 0.0263, + "epoch": 0.16, + "learning_rate": 0.0002758893300573631, + "loss": 0.0235, "step": 31860 }, { - "epoch": 0.34, - "learning_rate": 0.0002483200363235389, - "loss": 0.025, + "epoch": 0.16, + "learning_rate": 0.00027588176236434907, + "loss": 0.0263, "step": 31870 }, { - "epoch": 0.34, - "learning_rate": 0.00024830382045793603, - "loss": 0.026, + "epoch": 0.16, + "learning_rate": 0.0002758741946713351, + "loss": 0.0336, "step": 31880 }, { - "epoch": 0.34, - "learning_rate": 0.0002482876045923331, - "loss": 0.0276, + "epoch": 0.16, + "learning_rate": 0.0002758666269783211, + "loss": 0.0238, "step": 31890 }, { - "epoch": 0.34, - "learning_rate": 0.0002482713887267302, - "loss": 0.0263, + "epoch": 0.16, + "learning_rate": 0.00027585905928530707, + "loss": 0.0272, "step": 31900 }, { - "epoch": 0.34, - "learning_rate": 0.0002482551728611273, - "loss": 0.0322, + "epoch": 0.16, + "learning_rate": 0.00027585149159229305, + "loss": 0.0237, "step": 31910 }, { - "epoch": 0.35, - "learning_rate": 0.0002482389569955244, - "loss": 0.0224, + "epoch": 0.16, + "learning_rate": 0.00027584392389927903, + "loss": 0.0236, "step": 31920 }, { - "epoch": 0.35, - "learning_rate": 0.0002482227411299215, - "loss": 0.0223, + "epoch": 0.16, + "learning_rate": 0.000275836356206265, + "loss": 0.0247, "step": 31930 }, { - "epoch": 0.35, - "learning_rate": 0.0002482065252643186, - "loss": 0.0247, + "epoch": 0.16, + "learning_rate": 0.000275828788513251, + "loss": 0.0271, "step": 31940 }, { - "epoch": 0.35, - "learning_rate": 0.00024819030939871565, - "loss": 0.0209, + "epoch": 0.16, + "learning_rate": 0.00027582122082023703, + "loss": 0.0268, "step": 31950 }, { - "epoch": 0.35, - "learning_rate": 0.00024817409353311277, - "loss": 0.0237, + "epoch": 0.16, + "learning_rate": 0.000275813653127223, + "loss": 0.0238, "step": 31960 }, { - "epoch": 0.35, - "learning_rate": 0.0002481578776675099, - "loss": 0.0257, + "epoch": 0.16, + "learning_rate": 0.000275806085434209, + "loss": 0.0258, "step": 31970 }, { - "epoch": 0.35, - "learning_rate": 0.00024814166180190696, - "loss": 0.0233, + "epoch": 0.16, + "learning_rate": 0.000275798517741195, + "loss": 0.0256, "step": 31980 }, { - "epoch": 0.35, - "learning_rate": 0.000248125445936304, - "loss": 0.0204, + "epoch": 0.16, + "learning_rate": 0.00027579095004818095, + "loss": 0.0247, "step": 31990 }, { - "epoch": 0.35, - "learning_rate": 0.00024810923007070114, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.00027578338235516694, + "loss": 0.0273, "step": 32000 }, { - "epoch": 0.35, - "eval_cer": 0.9215825250982824, - "eval_loss": 0.016736265271902084, - "eval_runtime": 121.554, - "eval_samples_per_second": 16.454, - "eval_steps_per_second": 4.113, + "epoch": 0.16, + "eval_cer": 0.9144896638256703, + "eval_loss": 0.017893997952342033, + "eval_runtime": 117.1916, + "eval_samples_per_second": 17.066, + "eval_steps_per_second": 4.267, "step": 32000 }, { - "epoch": 0.35, - "learning_rate": 0.00024809301420509826, - "loss": 0.0264, + "epoch": 0.16, + "learning_rate": 0.00027577581466215297, + "loss": 0.0236, "step": 32010 }, { - "epoch": 0.35, - "learning_rate": 0.00024807679833949533, - "loss": 0.025, + "epoch": 0.16, + "learning_rate": 0.00027576824696913895, + "loss": 0.0283, "step": 32020 }, { - "epoch": 0.35, - "learning_rate": 0.0002480605824738924, - "loss": 0.022, + "epoch": 0.16, + "learning_rate": 0.00027576067927612493, + "loss": 0.025, "step": 32030 }, { - "epoch": 0.35, - "learning_rate": 0.0002480443666082895, - "loss": 0.0244, + "epoch": 0.16, + "learning_rate": 0.0002757531115831109, + "loss": 0.0208, "step": 32040 }, { - "epoch": 0.35, - "learning_rate": 0.00024802815074268663, - "loss": 0.0212, + "epoch": 0.16, + "learning_rate": 0.0002757455438900969, + "loss": 0.025, "step": 32050 }, { - "epoch": 0.35, - "learning_rate": 0.00024801193487708375, - "loss": 0.0234, + "epoch": 0.16, + "learning_rate": 0.0002757379761970829, + "loss": 0.023, "step": 32060 }, { - "epoch": 0.35, - "learning_rate": 0.0002479957190114808, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.00027573040850406886, + "loss": 0.0272, "step": 32070 }, { - "epoch": 0.35, - "learning_rate": 0.0002479795031458779, - "loss": 0.0227, + "epoch": 0.16, + "learning_rate": 0.00027572284081105484, + "loss": 0.0225, "step": 32080 }, { - "epoch": 0.35, - "learning_rate": 0.000247963287280275, - "loss": 0.0266, + "epoch": 0.16, + "learning_rate": 0.0002757152731180408, + "loss": 0.0277, "step": 32090 }, { - "epoch": 0.35, - "learning_rate": 0.0002479470714146721, - "loss": 0.0215, + "epoch": 0.16, + "learning_rate": 0.0002757077054250268, + "loss": 0.0251, "step": 32100 }, { - "epoch": 0.35, - "learning_rate": 0.0002479308555490692, - "loss": 0.0217, + "epoch": 0.16, + "learning_rate": 0.00027570013773201284, + "loss": 0.0266, "step": 32110 }, { - "epoch": 0.35, - "learning_rate": 0.00024791463968346626, - "loss": 0.0221, + "epoch": 0.16, + "learning_rate": 0.0002756925700389988, + "loss": 0.0257, "step": 32120 }, { - "epoch": 0.35, - "learning_rate": 0.0002478984238178634, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.0002756850023459848, + "loss": 0.0245, "step": 32130 }, { - "epoch": 0.35, - "learning_rate": 0.0002478822079522605, - "loss": 0.0239, + "epoch": 0.16, + "learning_rate": 0.0002756774346529708, + "loss": 0.0266, "step": 32140 }, { - "epoch": 0.35, - "learning_rate": 0.00024786599208665756, - "loss": 0.023, + "epoch": 0.16, + "learning_rate": 0.00027566986695995677, + "loss": 0.0264, "step": 32150 }, { - "epoch": 0.35, - "learning_rate": 0.00024784977622105463, - "loss": 0.02, + "epoch": 0.16, + "learning_rate": 0.00027566229926694275, + "loss": 0.0255, "step": 32160 }, { - "epoch": 0.35, - "learning_rate": 0.00024783356035545175, - "loss": 0.0223, + "epoch": 0.16, + "learning_rate": 0.00027565473157392873, + "loss": 0.0344, "step": 32170 }, { - "epoch": 0.35, - "learning_rate": 0.00024781734448984887, - "loss": 0.0236, + "epoch": 0.16, + "learning_rate": 0.00027564716388091476, + "loss": 0.0269, "step": 32180 }, { - "epoch": 0.35, - "learning_rate": 0.00024780112862424593, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.00027563959618790075, + "loss": 0.0241, "step": 32190 }, { - "epoch": 0.35, - "learning_rate": 0.00024778491275864305, - "loss": 0.0211, + "epoch": 0.16, + "learning_rate": 0.00027563202849488673, + "loss": 0.0234, "step": 32200 }, { - "epoch": 0.35, - "learning_rate": 0.0002477686968930401, - "loss": 0.023, + "epoch": 0.16, + "learning_rate": 0.0002756244608018727, + "loss": 0.028, "step": 32210 }, { - "epoch": 0.35, - "learning_rate": 0.00024775248102743724, - "loss": 0.022, + "epoch": 0.16, + "learning_rate": 0.0002756168931088587, + "loss": 0.0252, "step": 32220 }, { - "epoch": 0.35, - "learning_rate": 0.0002477362651618343, - "loss": 0.0231, + "epoch": 0.16, + "learning_rate": 0.00027560932541584467, + "loss": 0.0261, "step": 32230 }, { - "epoch": 0.35, - "learning_rate": 0.0002477200492962314, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.0002756017577228307, + "loss": 0.0281, "step": 32240 }, { - "epoch": 0.35, - "learning_rate": 0.0002477038334306285, - "loss": 0.0245, + "epoch": 0.16, + "learning_rate": 0.0002755941900298167, + "loss": 0.0255, "step": 32250 }, { - "epoch": 0.35, - "learning_rate": 0.0002476876175650256, - "loss": 0.021, + "epoch": 0.16, + "learning_rate": 0.00027558662233680267, + "loss": 0.0309, "step": 32260 }, { - "epoch": 0.35, - "learning_rate": 0.0002476714016994227, - "loss": 0.0243, + "epoch": 0.16, + "learning_rate": 0.00027557905464378865, + "loss": 0.0308, "step": 32270 }, { - "epoch": 0.35, - "learning_rate": 0.0002476551858338198, - "loss": 0.0252, + "epoch": 0.16, + "learning_rate": 0.00027557148695077463, + "loss": 0.0274, "step": 32280 }, { - "epoch": 0.35, - "learning_rate": 0.00024763896996821686, - "loss": 0.0268, + "epoch": 0.16, + "learning_rate": 0.0002755639192577606, + "loss": 0.0283, "step": 32290 }, { - "epoch": 0.35, - "learning_rate": 0.000247622754102614, - "loss": 0.0233, + "epoch": 0.16, + "learning_rate": 0.00027555635156474665, + "loss": 0.0241, "step": 32300 }, { - "epoch": 0.35, - "learning_rate": 0.00024760653823701105, - "loss": 0.0227, + "epoch": 0.16, + "learning_rate": 0.00027554878387173263, + "loss": 0.0299, "step": 32310 }, { - "epoch": 0.35, - "learning_rate": 0.00024759032237140817, - "loss": 0.0217, + "epoch": 0.16, + "learning_rate": 0.0002755412161787186, + "loss": 0.0252, "step": 32320 }, { - "epoch": 0.35, - "learning_rate": 0.0002475741065058053, - "loss": 0.0239, + "epoch": 0.16, + "learning_rate": 0.0002755336484857046, + "loss": 0.0258, "step": 32330 }, { - "epoch": 0.35, - "learning_rate": 0.00024755789064020235, - "loss": 0.0288, + "epoch": 0.16, + "learning_rate": 0.0002755260807926906, + "loss": 0.0216, "step": 32340 }, { - "epoch": 0.35, - "learning_rate": 0.0002475416747745994, - "loss": 0.0281, + "epoch": 0.16, + "learning_rate": 0.00027551851309967656, + "loss": 0.0266, "step": 32350 }, { - "epoch": 0.35, - "learning_rate": 0.00024752545890899654, - "loss": 0.0226, + "epoch": 0.16, + "learning_rate": 0.00027551094540666254, + "loss": 0.0251, "step": 32360 }, { - "epoch": 0.35, - "learning_rate": 0.00024750924304339366, - "loss": 0.0199, + "epoch": 0.16, + "learning_rate": 0.0002755033777136486, + "loss": 0.0318, "step": 32370 }, { - "epoch": 0.35, - "learning_rate": 0.0002474930271777907, - "loss": 0.0186, + "epoch": 0.16, + "learning_rate": 0.00027549581002063456, + "loss": 0.0237, "step": 32380 }, { - "epoch": 0.35, - "learning_rate": 0.00024747681131218784, - "loss": 0.0227, + "epoch": 0.16, + "learning_rate": 0.00027548824232762054, + "loss": 0.0221, "step": 32390 }, { - "epoch": 0.35, - "learning_rate": 0.0002474605954465849, - "loss": 0.0255, + "epoch": 0.16, + "learning_rate": 0.0002754806746346065, + "loss": 0.0226, "step": 32400 }, { - "epoch": 0.35, - "learning_rate": 0.00024744437958098203, - "loss": 0.0244, + "epoch": 0.16, + "learning_rate": 0.0002754731069415925, + "loss": 0.0262, "step": 32410 }, { - "epoch": 0.35, - "learning_rate": 0.0002474281637153791, - "loss": 0.0227, + "epoch": 0.16, + "learning_rate": 0.0002754655392485785, + "loss": 0.0233, "step": 32420 }, { - "epoch": 0.35, - "learning_rate": 0.0002474119478497762, - "loss": 0.0263, + "epoch": 0.16, + "learning_rate": 0.0002754579715555645, + "loss": 0.0227, "step": 32430 }, { - "epoch": 0.35, - "learning_rate": 0.0002473957319841733, - "loss": 0.0265, + "epoch": 0.16, + "learning_rate": 0.0002754504038625505, + "loss": 0.0267, "step": 32440 }, { - "epoch": 0.35, - "learning_rate": 0.0002473795161185704, - "loss": 0.0231, + "epoch": 0.16, + "learning_rate": 0.0002754428361695365, + "loss": 0.0282, "step": 32450 }, { - "epoch": 0.35, - "learning_rate": 0.00024736330025296746, - "loss": 0.0217, + "epoch": 0.16, + "learning_rate": 0.00027543526847652246, + "loss": 0.0243, "step": 32460 }, { - "epoch": 0.35, - "learning_rate": 0.0002473470843873646, - "loss": 0.0209, + "epoch": 0.16, + "learning_rate": 0.00027542770078350844, + "loss": 0.0223, "step": 32470 }, { - "epoch": 0.35, - "learning_rate": 0.00024733086852176165, - "loss": 0.0222, + "epoch": 0.16, + "learning_rate": 0.0002754201330904944, + "loss": 0.0243, "step": 32480 }, { - "epoch": 0.35, - "learning_rate": 0.00024731465265615877, - "loss": 0.0239, + "epoch": 0.16, + "learning_rate": 0.00027541256539748046, + "loss": 0.0246, "step": 32490 }, { - "epoch": 0.35, - "learning_rate": 0.0002472984367905559, - "loss": 0.025, + "epoch": 0.16, + "learning_rate": 0.00027540499770446644, + "loss": 0.0247, "step": 32500 }, { - "epoch": 0.35, - "learning_rate": 0.00024728222092495296, - "loss": 0.0268, + "epoch": 0.16, + "learning_rate": 0.0002753974300114524, + "loss": 0.0245, "step": 32510 }, { - "epoch": 0.35, - "learning_rate": 0.00024726600505935, - "loss": 0.027, + "epoch": 0.16, + "learning_rate": 0.0002753898623184384, + "loss": 0.0256, "step": 32520 }, { - "epoch": 0.35, - "learning_rate": 0.00024724978919374714, - "loss": 0.0247, + "epoch": 0.16, + "learning_rate": 0.0002753822946254244, + "loss": 0.0232, "step": 32530 }, { - "epoch": 0.35, - "learning_rate": 0.00024723357332814426, - "loss": 0.022, + "epoch": 0.16, + "learning_rate": 0.00027537472693241037, + "loss": 0.0264, "step": 32540 }, { - "epoch": 0.35, - "learning_rate": 0.0002472173574625413, - "loss": 0.0203, + "epoch": 0.16, + "learning_rate": 0.00027536715923939635, + "loss": 0.024, "step": 32550 }, { - "epoch": 0.35, - "learning_rate": 0.0002472011415969384, - "loss": 0.023, + "epoch": 0.16, + "learning_rate": 0.0002753595915463824, + "loss": 0.026, "step": 32560 }, { - "epoch": 0.35, - "learning_rate": 0.0002471849257313355, - "loss": 0.025, + "epoch": 0.16, + "learning_rate": 0.00027535202385336837, + "loss": 0.0236, "step": 32570 }, { - "epoch": 0.35, - "learning_rate": 0.00024716870986573263, - "loss": 0.025, + "epoch": 0.16, + "learning_rate": 0.00027534445616035435, + "loss": 0.0233, "step": 32580 }, { - "epoch": 0.35, - "learning_rate": 0.0002471524940001297, - "loss": 0.0239, + "epoch": 0.16, + "learning_rate": 0.00027533688846734033, + "loss": 0.0288, "step": 32590 }, { - "epoch": 0.35, - "learning_rate": 0.00024713627813452676, - "loss": 0.0221, + "epoch": 0.16, + "learning_rate": 0.0002753293207743263, + "loss": 0.026, "step": 32600 }, { - "epoch": 0.35, - "learning_rate": 0.0002471200622689239, - "loss": 0.0199, + "epoch": 0.16, + "learning_rate": 0.0002753217530813123, + "loss": 0.0255, "step": 32610 }, { - "epoch": 0.35, - "learning_rate": 0.000247103846403321, - "loss": 0.0224, + "epoch": 0.16, + "learning_rate": 0.00027531418538829833, + "loss": 0.0266, "step": 32620 }, { - "epoch": 0.35, - "learning_rate": 0.0002470876305377181, - "loss": 0.0226, + "epoch": 0.16, + "learning_rate": 0.0002753066176952843, + "loss": 0.0249, "step": 32630 }, { - "epoch": 0.35, - "learning_rate": 0.0002470714146721152, - "loss": 0.0228, + "epoch": 0.16, + "learning_rate": 0.0002752990500022703, + "loss": 0.0277, "step": 32640 }, { - "epoch": 0.35, - "learning_rate": 0.00024705519880651225, - "loss": 0.0234, + "epoch": 0.16, + "learning_rate": 0.00027529148230925627, + "loss": 0.0321, "step": 32650 }, { - "epoch": 0.35, - "learning_rate": 0.0002470389829409094, - "loss": 0.0255, + "epoch": 0.16, + "learning_rate": 0.00027528391461624225, + "loss": 0.026, "step": 32660 }, { - "epoch": 0.35, - "learning_rate": 0.0002470227670753065, - "loss": 0.0197, + "epoch": 0.16, + "learning_rate": 0.00027527634692322823, + "loss": 0.0227, "step": 32670 }, { - "epoch": 0.35, - "learning_rate": 0.00024700655120970356, - "loss": 0.0172, + "epoch": 0.16, + "learning_rate": 0.0002752687792302142, + "loss": 0.0266, "step": 32680 }, { - "epoch": 0.35, - "learning_rate": 0.0002469903353441006, - "loss": 0.0221, + "epoch": 0.16, + "learning_rate": 0.00027526121153720025, + "loss": 0.0263, "step": 32690 }, { - "epoch": 0.35, - "learning_rate": 0.00024697411947849774, - "loss": 0.0247, + "epoch": 0.16, + "learning_rate": 0.00027525364384418623, + "loss": 0.0239, "step": 32700 }, { - "epoch": 0.35, - "learning_rate": 0.00024695790361289486, - "loss": 0.0195, + "epoch": 0.17, + "learning_rate": 0.0002752460761511722, + "loss": 0.0281, "step": 32710 }, { - "epoch": 0.35, - "learning_rate": 0.00024694168774729193, - "loss": 0.0215, + "epoch": 0.17, + "learning_rate": 0.0002752385084581582, + "loss": 0.0254, "step": 32720 }, { - "epoch": 0.35, - "learning_rate": 0.000246925471881689, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.0002752309407651442, + "loss": 0.0253, "step": 32730 }, { - "epoch": 0.35, - "learning_rate": 0.0002469092560160861, - "loss": 0.0235, + "epoch": 0.17, + "learning_rate": 0.00027522337307213016, + "loss": 0.0253, "step": 32740 }, { - "epoch": 0.35, - "learning_rate": 0.00024689304015048324, - "loss": 0.0225, + "epoch": 0.17, + "learning_rate": 0.0002752158053791162, + "loss": 0.0266, "step": 32750 }, { - "epoch": 0.35, - "learning_rate": 0.0002468768242848803, - "loss": 0.0223, + "epoch": 0.17, + "learning_rate": 0.0002752082376861022, + "loss": 0.028, "step": 32760 }, { - "epoch": 0.35, - "learning_rate": 0.0002468606084192774, - "loss": 0.0231, + "epoch": 0.17, + "learning_rate": 0.00027520066999308816, + "loss": 0.0268, "step": 32770 }, { - "epoch": 0.35, - "learning_rate": 0.0002468443925536745, - "loss": 0.0212, + "epoch": 0.17, + "learning_rate": 0.00027519310230007414, + "loss": 0.0232, "step": 32780 }, { - "epoch": 0.35, - "learning_rate": 0.0002468281766880716, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.0002751855346070601, + "loss": 0.0297, "step": 32790 }, { - "epoch": 0.35, - "learning_rate": 0.00024681196082246867, - "loss": 0.0197, + "epoch": 0.17, + "learning_rate": 0.0002751779669140461, + "loss": 0.0244, "step": 32800 }, { - "epoch": 0.35, - "learning_rate": 0.0002467957449568658, - "loss": 0.0218, + "epoch": 0.17, + "learning_rate": 0.00027517039922103214, + "loss": 0.0301, "step": 32810 }, { - "epoch": 0.35, - "learning_rate": 0.00024677952909126286, - "loss": 0.0214, + "epoch": 0.17, + "learning_rate": 0.0002751628315280181, + "loss": 0.03, "step": 32820 }, { - "epoch": 0.35, - "learning_rate": 0.00024676331322566, - "loss": 0.0213, + "epoch": 0.17, + "learning_rate": 0.0002751552638350041, + "loss": 0.0269, "step": 32830 }, { - "epoch": 0.36, - "learning_rate": 0.00024674709736005704, - "loss": 0.0215, + "epoch": 0.17, + "learning_rate": 0.0002751476961419901, + "loss": 0.0339, "step": 32840 }, { - "epoch": 0.36, - "learning_rate": 0.00024673088149445416, - "loss": 0.0225, + "epoch": 0.17, + "learning_rate": 0.00027514012844897606, + "loss": 0.0306, "step": 32850 }, { - "epoch": 0.36, - "learning_rate": 0.00024671466562885123, - "loss": 0.0259, + "epoch": 0.17, + "learning_rate": 0.00027513256075596204, + "loss": 0.0241, "step": 32860 }, { - "epoch": 0.36, - "learning_rate": 0.00024669844976324835, + "epoch": 0.17, + "learning_rate": 0.000275124993062948, "loss": 0.0235, "step": 32870 }, { - "epoch": 0.36, - "learning_rate": 0.0002466822338976454, - "loss": 0.0214, + "epoch": 0.17, + "learning_rate": 0.00027511742536993406, + "loss": 0.0263, "step": 32880 }, { - "epoch": 0.36, - "learning_rate": 0.00024666601803204253, - "loss": 0.0238, + "epoch": 0.17, + "learning_rate": 0.00027510985767692004, + "loss": 0.023, "step": 32890 }, { - "epoch": 0.36, - "learning_rate": 0.0002466498021664396, - "loss": 0.0237, + "epoch": 0.17, + "learning_rate": 0.000275102289983906, + "loss": 0.0251, "step": 32900 }, { - "epoch": 0.36, - "learning_rate": 0.0002466335863008367, - "loss": 0.0228, + "epoch": 0.17, + "learning_rate": 0.000275094722290892, + "loss": 0.0289, "step": 32910 }, { - "epoch": 0.36, - "learning_rate": 0.0002466173704352338, - "loss": 0.0249, + "epoch": 0.17, + "learning_rate": 0.000275087154597878, + "loss": 0.0268, "step": 32920 }, { - "epoch": 0.36, - "learning_rate": 0.0002466011545696309, - "loss": 0.0236, + "epoch": 0.17, + "learning_rate": 0.00027507958690486397, + "loss": 0.0261, "step": 32930 }, { - "epoch": 0.36, - "learning_rate": 0.000246584938704028, - "loss": 0.02, + "epoch": 0.17, + "learning_rate": 0.00027507201921185, + "loss": 0.0416, "step": 32940 }, { - "epoch": 0.36, - "learning_rate": 0.0002465687228384251, - "loss": 0.0225, + "epoch": 0.17, + "learning_rate": 0.000275064451518836, + "loss": 0.0258, "step": 32950 }, { - "epoch": 0.36, - "learning_rate": 0.00024655250697282216, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.00027505688382582197, + "loss": 0.0251, "step": 32960 }, { - "epoch": 0.36, - "learning_rate": 0.0002465362911072193, - "loss": 0.0203, + "epoch": 0.17, + "learning_rate": 0.00027504931613280795, + "loss": 0.0262, "step": 32970 }, { - "epoch": 0.36, - "learning_rate": 0.0002465200752416164, - "loss": 0.0202, + "epoch": 0.17, + "learning_rate": 0.00027504174843979393, + "loss": 0.0235, "step": 32980 }, { - "epoch": 0.36, - "learning_rate": 0.00024650385937601346, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.0002750341807467799, + "loss": 0.023, "step": 32990 }, { - "epoch": 0.36, - "learning_rate": 0.0002464876435104105, - "loss": 0.0214, + "epoch": 0.17, + "learning_rate": 0.00027502661305376595, + "loss": 0.0284, "step": 33000 }, { - "epoch": 0.36, - "eval_cer": 0.921567758848024, - "eval_loss": 0.01648101769387722, - "eval_runtime": 121.6437, - "eval_samples_per_second": 16.441, - "eval_steps_per_second": 4.11, + "epoch": 0.17, + "eval_cer": 0.9144838414489178, + "eval_loss": 0.018402038142085075, + "eval_runtime": 117.2116, + "eval_samples_per_second": 17.063, + "eval_steps_per_second": 4.266, "step": 33000 }, { - "epoch": 0.36, - "learning_rate": 0.00024647142764480765, - "loss": 0.0208, + "epoch": 0.17, + "learning_rate": 0.00027501904536075193, + "loss": 0.0259, "step": 33010 }, { - "epoch": 0.36, - "learning_rate": 0.00024645521177920477, - "loss": 0.0232, + "epoch": 0.17, + "learning_rate": 0.0002750114776677379, + "loss": 0.0246, "step": 33020 }, { - "epoch": 0.36, - "learning_rate": 0.00024643899591360183, - "loss": 0.0187, + "epoch": 0.17, + "learning_rate": 0.0002750039099747239, + "loss": 0.0264, "step": 33030 }, { - "epoch": 0.36, - "learning_rate": 0.0002464227800479989, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.0002749963422817099, + "loss": 0.0245, "step": 33040 }, { - "epoch": 0.36, - "learning_rate": 0.000246406564182396, - "loss": 0.0227, + "epoch": 0.17, + "learning_rate": 0.00027498877458869585, + "loss": 0.0211, "step": 33050 }, { - "epoch": 0.36, - "learning_rate": 0.00024639034831679314, - "loss": 0.0225, + "epoch": 0.17, + "learning_rate": 0.00027498120689568184, + "loss": 0.021, "step": 33060 }, { - "epoch": 0.36, - "learning_rate": 0.00024637413245119026, - "loss": 0.0233, + "epoch": 0.17, + "learning_rate": 0.00027497363920266787, + "loss": 0.0223, "step": 33070 }, { - "epoch": 0.36, - "learning_rate": 0.0002463579165855873, - "loss": 0.0241, + "epoch": 0.17, + "learning_rate": 0.00027496607150965385, + "loss": 0.0232, "step": 33080 }, { - "epoch": 0.36, - "learning_rate": 0.0002463417007199844, - "loss": 0.0267, + "epoch": 0.17, + "learning_rate": 0.00027495850381663983, + "loss": 0.0241, "step": 33090 }, { - "epoch": 0.36, - "learning_rate": 0.0002463254848543815, - "loss": 0.0251, + "epoch": 0.17, + "learning_rate": 0.0002749509361236258, + "loss": 0.0265, "step": 33100 }, { - "epoch": 0.36, - "learning_rate": 0.00024630926898877863, - "loss": 0.0314, + "epoch": 0.17, + "learning_rate": 0.0002749433684306118, + "loss": 0.0264, "step": 33110 }, { - "epoch": 0.36, - "learning_rate": 0.0002462930531231757, - "loss": 0.0331, + "epoch": 0.17, + "learning_rate": 0.0002749358007375978, + "loss": 0.026, "step": 33120 }, { - "epoch": 0.36, - "learning_rate": 0.00024627683725757276, - "loss": 0.0293, + "epoch": 0.17, + "learning_rate": 0.0002749282330445838, + "loss": 0.0317, "step": 33130 }, { - "epoch": 0.36, - "learning_rate": 0.0002462606213919699, - "loss": 0.027, + "epoch": 0.17, + "learning_rate": 0.0002749206653515698, + "loss": 0.0236, "step": 33140 }, { - "epoch": 0.36, - "learning_rate": 0.000246244405526367, - "loss": 0.0267, + "epoch": 0.17, + "learning_rate": 0.0002749130976585558, + "loss": 0.0231, "step": 33150 }, { - "epoch": 0.36, - "learning_rate": 0.00024622818966076406, - "loss": 0.023, + "epoch": 0.17, + "learning_rate": 0.00027490552996554176, + "loss": 0.0312, "step": 33160 }, { - "epoch": 0.36, - "learning_rate": 0.00024621197379516113, - "loss": 0.0235, + "epoch": 0.17, + "learning_rate": 0.00027489796227252774, + "loss": 0.026, "step": 33170 }, { - "epoch": 0.36, - "learning_rate": 0.00024619575792955825, - "loss": 0.0216, + "epoch": 0.17, + "learning_rate": 0.0002748903945795137, + "loss": 0.0219, "step": 33180 }, { - "epoch": 0.36, - "learning_rate": 0.00024617954206395537, - "loss": 0.0209, + "epoch": 0.17, + "learning_rate": 0.0002748828268864997, + "loss": 0.023, "step": 33190 }, { - "epoch": 0.36, - "learning_rate": 0.00024616332619835244, - "loss": 0.0245, + "epoch": 0.17, + "learning_rate": 0.00027487525919348574, + "loss": 0.0482, "step": 33200 }, { - "epoch": 0.36, - "learning_rate": 0.00024614711033274956, - "loss": 0.0205, + "epoch": 0.17, + "learning_rate": 0.0002748676915004717, + "loss": 0.0344, "step": 33210 }, { - "epoch": 0.36, - "learning_rate": 0.0002461308944671466, - "loss": 0.0226, + "epoch": 0.17, + "learning_rate": 0.0002748601238074577, + "loss": 0.0282, "step": 33220 }, { - "epoch": 0.36, - "learning_rate": 0.00024611467860154374, - "loss": 0.0222, + "epoch": 0.17, + "learning_rate": 0.0002748525561144437, + "loss": 0.0291, "step": 33230 }, { - "epoch": 0.36, - "learning_rate": 0.00024609846273594086, - "loss": 0.023, + "epoch": 0.17, + "learning_rate": 0.00027484498842142966, + "loss": 0.0255, "step": 33240 }, { - "epoch": 0.36, - "learning_rate": 0.0002460822468703379, - "loss": 0.022, + "epoch": 0.17, + "learning_rate": 0.00027483742072841565, + "loss": 0.0249, "step": 33250 }, { - "epoch": 0.36, - "learning_rate": 0.000246066031004735, - "loss": 0.0208, + "epoch": 0.17, + "learning_rate": 0.0002748298530354017, + "loss": 0.0304, "step": 33260 }, { - "epoch": 0.36, - "learning_rate": 0.0002460498151391321, - "loss": 0.0223, + "epoch": 0.17, + "learning_rate": 0.00027482228534238766, + "loss": 0.0233, "step": 33270 }, { - "epoch": 0.36, - "learning_rate": 0.00024603359927352923, - "loss": 0.0233, + "epoch": 0.17, + "learning_rate": 0.00027481471764937364, + "loss": 0.0265, "step": 33280 }, { - "epoch": 0.36, - "learning_rate": 0.0002460173834079263, - "loss": 0.0245, + "epoch": 0.17, + "learning_rate": 0.0002748071499563596, + "loss": 0.0249, "step": 33290 }, { - "epoch": 0.36, - "learning_rate": 0.00024600116754232336, - "loss": 0.0195, + "epoch": 0.17, + "learning_rate": 0.0002747995822633456, + "loss": 0.024, "step": 33300 }, { - "epoch": 0.36, - "learning_rate": 0.0002459849516767205, - "loss": 0.022, + "epoch": 0.17, + "learning_rate": 0.0002747920145703316, + "loss": 0.0461, "step": 33310 }, { - "epoch": 0.36, - "learning_rate": 0.0002459687358111176, - "loss": 0.0249, + "epoch": 0.17, + "learning_rate": 0.00027478444687731757, + "loss": 0.0418, "step": 33320 }, { - "epoch": 0.36, - "learning_rate": 0.00024595251994551467, - "loss": 0.0244, + "epoch": 0.17, + "learning_rate": 0.00027477687918430355, + "loss": 0.024, "step": 33330 }, { - "epoch": 0.36, - "learning_rate": 0.0002459363040799118, - "loss": 0.0245, + "epoch": 0.17, + "learning_rate": 0.00027476931149128953, + "loss": 0.0279, "step": 33340 }, { - "epoch": 0.36, - "learning_rate": 0.00024592008821430885, - "loss": 0.0218, + "epoch": 0.17, + "learning_rate": 0.0002747617437982755, + "loss": 0.0224, "step": 33350 }, { - "epoch": 0.36, - "learning_rate": 0.000245903872348706, - "loss": 0.0227, + "epoch": 0.17, + "learning_rate": 0.00027475417610526155, + "loss": 0.0258, "step": 33360 }, { - "epoch": 0.36, - "learning_rate": 0.00024588765648310304, - "loss": 0.023, + "epoch": 0.17, + "learning_rate": 0.00027474660841224753, + "loss": 0.0233, "step": 33370 }, { - "epoch": 0.36, - "learning_rate": 0.00024587144061750016, - "loss": 0.0224, + "epoch": 0.17, + "learning_rate": 0.0002747390407192335, + "loss": 0.0235, "step": 33380 }, { - "epoch": 0.36, - "learning_rate": 0.0002458552247518972, - "loss": 0.019, + "epoch": 0.17, + "learning_rate": 0.0002747314730262195, + "loss": 0.0258, "step": 33390 }, { - "epoch": 0.36, - "learning_rate": 0.00024583900888629434, - "loss": 0.0236, + "epoch": 0.17, + "learning_rate": 0.0002747239053332055, + "loss": 0.0259, "step": 33400 }, { - "epoch": 0.36, - "learning_rate": 0.0002458227930206914, - "loss": 0.0245, + "epoch": 0.17, + "learning_rate": 0.00027471633764019146, + "loss": 0.0227, "step": 33410 }, { - "epoch": 0.36, - "learning_rate": 0.00024580657715508853, - "loss": 0.0221, + "epoch": 0.17, + "learning_rate": 0.00027470876994717744, + "loss": 0.0265, "step": 33420 }, { - "epoch": 0.36, - "learning_rate": 0.0002457903612894856, - "loss": 0.0277, + "epoch": 0.17, + "learning_rate": 0.0002747012022541635, + "loss": 0.0227, "step": 33430 }, { - "epoch": 0.36, - "learning_rate": 0.0002457741454238827, - "loss": 0.029, + "epoch": 0.17, + "learning_rate": 0.00027469363456114946, + "loss": 0.026, "step": 33440 }, { - "epoch": 0.36, - "learning_rate": 0.0002457579295582798, - "loss": 0.025, + "epoch": 0.17, + "learning_rate": 0.00027468606686813544, + "loss": 0.031, "step": 33450 }, { - "epoch": 0.36, - "learning_rate": 0.0002457417136926769, - "loss": 0.0217, + "epoch": 0.17, + "learning_rate": 0.0002746784991751214, + "loss": 0.0264, "step": 33460 }, { - "epoch": 0.36, - "learning_rate": 0.00024572549782707397, - "loss": 0.0232, + "epoch": 0.17, + "learning_rate": 0.0002746709314821074, + "loss": 0.0224, "step": 33470 }, { - "epoch": 0.36, - "learning_rate": 0.0002457092819614711, - "loss": 0.0231, + "epoch": 0.17, + "learning_rate": 0.0002746633637890934, + "loss": 0.0261, "step": 33480 }, { - "epoch": 0.36, - "learning_rate": 0.00024569306609586815, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.0002746557960960794, + "loss": 0.026, "step": 33490 }, { - "epoch": 0.36, - "learning_rate": 0.00024567685023026527, - "loss": 0.0235, + "epoch": 0.17, + "learning_rate": 0.0002746482284030654, + "loss": 0.0263, "step": 33500 }, { - "epoch": 0.36, - "learning_rate": 0.0002456606343646624, - "loss": 0.0239, + "epoch": 0.17, + "learning_rate": 0.0002746406607100514, + "loss": 0.0246, "step": 33510 }, { - "epoch": 0.36, - "learning_rate": 0.00024564441849905946, - "loss": 0.0211, + "epoch": 0.17, + "learning_rate": 0.00027463309301703736, + "loss": 0.0218, "step": 33520 }, { - "epoch": 0.36, - "learning_rate": 0.0002456282026334565, - "loss": 0.0218, + "epoch": 0.17, + "learning_rate": 0.00027462552532402334, + "loss": 0.0232, "step": 33530 }, { - "epoch": 0.36, - "learning_rate": 0.00024561198676785364, - "loss": 0.0244, + "epoch": 0.17, + "learning_rate": 0.0002746179576310093, + "loss": 0.0267, "step": 33540 }, { - "epoch": 0.36, - "learning_rate": 0.00024559577090225076, - "loss": 0.0229, + "epoch": 0.17, + "learning_rate": 0.00027461038993799536, + "loss": 0.0298, "step": 33550 }, { - "epoch": 0.36, - "learning_rate": 0.00024557955503664783, - "loss": 0.0207, + "epoch": 0.17, + "learning_rate": 0.00027460282224498134, + "loss": 0.0277, "step": 33560 }, { - "epoch": 0.36, - "learning_rate": 0.0002455633391710449, - "loss": 0.0234, + "epoch": 0.17, + "learning_rate": 0.0002745952545519673, + "loss": 0.0324, "step": 33570 }, { - "epoch": 0.36, - "learning_rate": 0.000245547123305442, - "loss": 0.0225, + "epoch": 0.17, + "learning_rate": 0.0002745876868589533, + "loss": 0.0339, "step": 33580 }, { - "epoch": 0.36, - "learning_rate": 0.00024553090743983913, - "loss": 0.02, + "epoch": 0.17, + "learning_rate": 0.0002745801191659393, + "loss": 0.0385, "step": 33590 }, { - "epoch": 0.36, - "learning_rate": 0.0002455146915742362, - "loss": 0.0215, + "epoch": 0.17, + "learning_rate": 0.00027457255147292527, + "loss": 0.0297, "step": 33600 }, { - "epoch": 0.36, - "learning_rate": 0.00024549847570863327, - "loss": 0.019, + "epoch": 0.17, + "learning_rate": 0.00027456498377991125, + "loss": 0.0355, "step": 33610 }, { - "epoch": 0.36, - "learning_rate": 0.0002454822598430304, - "loss": 0.0201, + "epoch": 0.17, + "learning_rate": 0.0002745574160868973, + "loss": 0.0277, "step": 33620 }, { - "epoch": 0.36, - "learning_rate": 0.0002454660439774275, - "loss": 0.0231, + "epoch": 0.17, + "learning_rate": 0.00027454984839388327, + "loss": 0.0244, "step": 33630 }, { - "epoch": 0.36, - "learning_rate": 0.0002454498281118246, - "loss": 0.0218, + "epoch": 0.17, + "learning_rate": 0.00027454228070086925, + "loss": 0.0249, "step": 33640 }, { - "epoch": 0.36, - "learning_rate": 0.0002454336122462217, - "loss": 0.0271, + "epoch": 0.17, + "learning_rate": 0.00027453471300785523, + "loss": 0.0265, "step": 33650 }, { - "epoch": 0.36, - "learning_rate": 0.00024541739638061876, - "loss": 0.0204, + "epoch": 0.17, + "learning_rate": 0.0002745271453148412, + "loss": 0.0274, "step": 33660 }, { - "epoch": 0.36, - "learning_rate": 0.0002454011805150159, - "loss": 0.0236, + "epoch": 0.17, + "learning_rate": 0.0002745195776218272, + "loss": 0.0221, "step": 33670 }, { - "epoch": 0.36, - "learning_rate": 0.000245384964649413, - "loss": 0.0204, + "epoch": 0.17, + "learning_rate": 0.00027451200992881323, + "loss": 0.0293, "step": 33680 }, { - "epoch": 0.36, - "learning_rate": 0.00024536874878381006, - "loss": 0.0221, + "epoch": 0.17, + "learning_rate": 0.0002745044422357992, + "loss": 0.031, "step": 33690 }, { - "epoch": 0.36, - "learning_rate": 0.0002453525329182071, - "loss": 0.0236, + "epoch": 0.17, + "learning_rate": 0.0002744968745427852, + "loss": 0.0247, "step": 33700 }, { - "epoch": 0.36, - "learning_rate": 0.00024533631705260425, - "loss": 0.0248, + "epoch": 0.17, + "learning_rate": 0.00027448930684977117, + "loss": 0.0258, "step": 33710 }, { - "epoch": 0.36, - "learning_rate": 0.00024532010118700137, - "loss": 0.0207, + "epoch": 0.17, + "learning_rate": 0.00027448173915675715, + "loss": 0.0284, "step": 33720 }, { - "epoch": 0.36, - "learning_rate": 0.00024530388532139843, - "loss": 0.022, + "epoch": 0.17, + "learning_rate": 0.00027447417146374313, + "loss": 0.0239, "step": 33730 }, { - "epoch": 0.36, - "learning_rate": 0.0002452876694557955, - "loss": 0.0228, + "epoch": 0.17, + "learning_rate": 0.0002744666037707291, + "loss": 0.0254, "step": 33740 }, { - "epoch": 0.36, - "learning_rate": 0.0002452714535901926, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.00027445903607771515, + "loss": 0.0232, "step": 33750 }, { - "epoch": 0.36, - "learning_rate": 0.00024525523772458974, - "loss": 0.0209, + "epoch": 0.17, + "learning_rate": 0.00027445146838470113, + "loss": 0.0246, "step": 33760 }, { - "epoch": 0.37, - "learning_rate": 0.0002452390218589868, - "loss": 0.0213, + "epoch": 0.17, + "learning_rate": 0.0002744439006916871, + "loss": 0.0247, "step": 33770 }, { - "epoch": 0.37, - "learning_rate": 0.0002452228059933839, - "loss": 0.0237, + "epoch": 0.17, + "learning_rate": 0.0002744363329986731, + "loss": 0.0282, "step": 33780 }, { - "epoch": 0.37, - "learning_rate": 0.000245206590127781, - "loss": 0.0203, + "epoch": 0.17, + "learning_rate": 0.0002744287653056591, + "loss": 0.021, "step": 33790 }, { - "epoch": 0.37, - "learning_rate": 0.0002451903742621781, - "loss": 0.0231, + "epoch": 0.17, + "learning_rate": 0.00027442119761264506, + "loss": 0.0207, "step": 33800 }, { - "epoch": 0.37, - "learning_rate": 0.00024517415839657523, - "loss": 0.0237, + "epoch": 0.17, + "learning_rate": 0.0002744136299196311, + "loss": 0.0308, "step": 33810 }, { - "epoch": 0.37, - "learning_rate": 0.0002451579425309723, - "loss": 0.0204, + "epoch": 0.17, + "learning_rate": 0.0002744060622266171, + "loss": 0.0278, "step": 33820 }, { - "epoch": 0.37, - "learning_rate": 0.00024514172666536936, - "loss": 0.0226, + "epoch": 0.17, + "learning_rate": 0.00027439849453360306, + "loss": 0.0252, "step": 33830 }, { - "epoch": 0.37, - "learning_rate": 0.0002451255107997665, - "loss": 0.0191, + "epoch": 0.17, + "learning_rate": 0.00027439092684058904, + "loss": 0.025, "step": 33840 }, { - "epoch": 0.37, - "learning_rate": 0.0002451092949341636, - "loss": 0.0222, + "epoch": 0.17, + "learning_rate": 0.000274383359147575, + "loss": 0.0246, "step": 33850 }, { - "epoch": 0.37, - "learning_rate": 0.00024509307906856067, - "loss": 0.0215, + "epoch": 0.17, + "learning_rate": 0.000274375791454561, + "loss": 0.0229, "step": 33860 }, { - "epoch": 0.37, - "learning_rate": 0.00024507686320295773, - "loss": 0.0226, + "epoch": 0.17, + "learning_rate": 0.00027436822376154704, + "loss": 0.027, "step": 33870 }, { - "epoch": 0.37, - "learning_rate": 0.00024506064733735485, - "loss": 0.0274, + "epoch": 0.17, + "learning_rate": 0.000274360656068533, + "loss": 0.028, "step": 33880 }, { - "epoch": 0.37, - "learning_rate": 0.00024504443147175197, - "loss": 0.019, + "epoch": 0.17, + "learning_rate": 0.000274353088375519, + "loss": 0.0222, "step": 33890 }, { - "epoch": 0.37, - "learning_rate": 0.00024502821560614904, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.000274345520682505, + "loss": 0.0245, "step": 33900 }, { - "epoch": 0.37, - "learning_rate": 0.0002450119997405461, - "loss": 0.0213, + "epoch": 0.17, + "learning_rate": 0.00027433795298949096, + "loss": 0.029, "step": 33910 }, { - "epoch": 0.37, - "learning_rate": 0.0002449957838749432, - "loss": 0.0254, + "epoch": 0.17, + "learning_rate": 0.00027433038529647694, + "loss": 0.0274, "step": 33920 }, { - "epoch": 0.37, - "learning_rate": 0.00024497956800934034, - "loss": 0.0207, + "epoch": 0.17, + "learning_rate": 0.0002743228176034629, + "loss": 0.0244, "step": 33930 }, { - "epoch": 0.37, - "learning_rate": 0.0002449633521437374, - "loss": 0.0261, + "epoch": 0.17, + "learning_rate": 0.00027431524991044896, + "loss": 0.0235, "step": 33940 }, { - "epoch": 0.37, - "learning_rate": 0.0002449471362781345, - "loss": 0.0251, + "epoch": 0.17, + "learning_rate": 0.00027430768221743494, + "loss": 0.0224, "step": 33950 }, { - "epoch": 0.37, - "learning_rate": 0.0002449309204125316, - "loss": 0.0273, + "epoch": 0.17, + "learning_rate": 0.0002743001145244209, + "loss": 0.0215, "step": 33960 }, { - "epoch": 0.37, - "learning_rate": 0.0002449147045469287, - "loss": 0.0271, + "epoch": 0.17, + "learning_rate": 0.0002742925468314069, + "loss": 0.0234, "step": 33970 }, { - "epoch": 0.37, - "learning_rate": 0.0002448984886813258, - "loss": 0.0224, + "epoch": 0.17, + "learning_rate": 0.0002742849791383929, + "loss": 0.021, "step": 33980 }, { - "epoch": 0.37, - "learning_rate": 0.0002448822728157229, - "loss": 0.0223, + "epoch": 0.17, + "learning_rate": 0.00027427741144537887, + "loss": 0.0245, "step": 33990 }, { - "epoch": 0.37, - "learning_rate": 0.00024486605695011996, - "loss": 0.0232, + "epoch": 0.17, + "learning_rate": 0.0002742698437523649, + "loss": 0.0264, "step": 34000 }, { - "epoch": 0.37, - "eval_cer": 0.9215582042155038, - "eval_loss": 0.016336919739842415, - "eval_runtime": 121.6996, - "eval_samples_per_second": 16.434, - "eval_steps_per_second": 4.108, + "epoch": 0.17, + "eval_cer": 0.9144916046179211, + "eval_loss": 0.017292475327849388, + "eval_runtime": 117.3012, + "eval_samples_per_second": 17.05, + "eval_steps_per_second": 4.263, "step": 34000 }, { - "epoch": 0.37, - "learning_rate": 0.0002448498410845171, - "loss": 0.0247, + "epoch": 0.17, + "learning_rate": 0.0002742622760593509, + "loss": 0.0221, "step": 34010 }, { - "epoch": 0.37, - "learning_rate": 0.00024483362521891415, - "loss": 0.0189, + "epoch": 0.17, + "learning_rate": 0.00027425470836633687, + "loss": 0.0193, "step": 34020 }, { - "epoch": 0.37, - "learning_rate": 0.00024481740935331127, - "loss": 0.0205, + "epoch": 0.17, + "learning_rate": 0.00027424714067332285, + "loss": 0.0214, "step": 34030 }, { - "epoch": 0.37, - "learning_rate": 0.00024480119348770833, - "loss": 0.0254, + "epoch": 0.17, + "learning_rate": 0.00027423957298030883, + "loss": 0.0213, "step": 34040 }, { - "epoch": 0.37, - "learning_rate": 0.00024478497762210545, - "loss": 0.024, + "epoch": 0.17, + "learning_rate": 0.0002742320052872948, + "loss": 0.026, "step": 34050 }, { - "epoch": 0.37, - "learning_rate": 0.0002447687617565025, - "loss": 0.0241, + "epoch": 0.17, + "learning_rate": 0.00027422443759428085, + "loss": 0.0271, "step": 34060 }, { - "epoch": 0.37, - "learning_rate": 0.00024475254589089964, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.00027421686990126683, + "loss": 0.0249, "step": 34070 }, { - "epoch": 0.37, - "learning_rate": 0.00024473633002529676, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.0002742093022082528, + "loss": 0.0263, "step": 34080 }, { - "epoch": 0.37, - "learning_rate": 0.0002447201141596938, - "loss": 0.0209, + "epoch": 0.17, + "learning_rate": 0.0002742017345152388, + "loss": 0.0283, "step": 34090 }, { - "epoch": 0.37, - "learning_rate": 0.0002447038982940909, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.0002741941668222248, + "loss": 0.0274, "step": 34100 }, { - "epoch": 0.37, - "learning_rate": 0.000244687682428488, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.00027418659912921075, + "loss": 0.0246, "step": 34110 }, { - "epoch": 0.37, - "learning_rate": 0.00024467146656288513, - "loss": 0.0199, + "epoch": 0.17, + "learning_rate": 0.00027417903143619674, + "loss": 0.032, "step": 34120 }, { - "epoch": 0.37, - "learning_rate": 0.0002446552506972822, - "loss": 0.0188, + "epoch": 0.17, + "learning_rate": 0.00027417146374318277, + "loss": 0.0216, "step": 34130 }, { - "epoch": 0.37, - "learning_rate": 0.00024463903483167926, - "loss": 0.0246, + "epoch": 0.17, + "learning_rate": 0.00027416389605016875, + "loss": 0.0195, "step": 34140 }, { - "epoch": 0.37, - "learning_rate": 0.0002446228189660764, - "loss": 0.0212, + "epoch": 0.17, + "learning_rate": 0.00027415632835715473, + "loss": 0.0229, "step": 34150 }, { - "epoch": 0.37, - "learning_rate": 0.0002446066031004735, - "loss": 0.0198, + "epoch": 0.17, + "learning_rate": 0.0002741487606641407, + "loss": 0.023, "step": 34160 }, { - "epoch": 0.37, - "learning_rate": 0.00024459038723487057, - "loss": 0.0176, + "epoch": 0.17, + "learning_rate": 0.0002741411929711267, + "loss": 0.0224, "step": 34170 }, { - "epoch": 0.37, - "learning_rate": 0.00024457417136926763, - "loss": 0.0194, + "epoch": 0.17, + "learning_rate": 0.0002741336252781127, + "loss": 0.0255, "step": 34180 }, { - "epoch": 0.37, - "learning_rate": 0.00024455795550366475, - "loss": 0.0216, + "epoch": 0.17, + "learning_rate": 0.0002741260575850987, + "loss": 0.0225, "step": 34190 }, { - "epoch": 0.37, - "learning_rate": 0.00024454173963806187, - "loss": 0.0252, + "epoch": 0.17, + "learning_rate": 0.0002741184898920847, + "loss": 0.0278, "step": 34200 }, { - "epoch": 0.37, - "learning_rate": 0.00024452552377245894, - "loss": 0.022, + "epoch": 0.17, + "learning_rate": 0.0002741109221990707, + "loss": 0.024, "step": 34210 }, { - "epoch": 0.37, - "learning_rate": 0.00024450930790685606, - "loss": 0.0257, + "epoch": 0.17, + "learning_rate": 0.00027410335450605666, + "loss": 0.0245, "step": 34220 }, { - "epoch": 0.37, - "learning_rate": 0.0002444930920412531, - "loss": 0.0218, + "epoch": 0.17, + "learning_rate": 0.00027409578681304264, + "loss": 0.0246, "step": 34230 }, { - "epoch": 0.37, - "learning_rate": 0.00024447687617565024, - "loss": 0.0237, + "epoch": 0.17, + "learning_rate": 0.0002740882191200286, + "loss": 0.0223, "step": 34240 }, { - "epoch": 0.37, - "learning_rate": 0.00024446066031004736, - "loss": 0.0218, + "epoch": 0.17, + "learning_rate": 0.0002740806514270146, + "loss": 0.0229, "step": 34250 }, { - "epoch": 0.37, - "learning_rate": 0.00024444444444444443, - "loss": 0.025, + "epoch": 0.17, + "learning_rate": 0.00027407308373400064, + "loss": 0.0231, "step": 34260 }, { - "epoch": 0.37, - "learning_rate": 0.0002444282285788415, - "loss": 0.0198, + "epoch": 0.17, + "learning_rate": 0.0002740655160409866, + "loss": 0.0233, "step": 34270 }, { - "epoch": 0.37, - "learning_rate": 0.0002444120127132386, - "loss": 0.0203, + "epoch": 0.17, + "learning_rate": 0.0002740579483479726, + "loss": 0.0288, "step": 34280 }, { - "epoch": 0.37, - "learning_rate": 0.00024439579684763573, - "loss": 0.0237, + "epoch": 0.17, + "learning_rate": 0.0002740503806549586, + "loss": 0.0272, "step": 34290 }, { - "epoch": 0.37, - "learning_rate": 0.0002443795809820328, - "loss": 0.0275, + "epoch": 0.17, + "learning_rate": 0.00027404281296194457, + "loss": 0.0274, "step": 34300 }, { - "epoch": 0.37, - "learning_rate": 0.00024436336511642987, - "loss": 0.0194, + "epoch": 0.17, + "learning_rate": 0.00027403524526893055, + "loss": 0.0286, "step": 34310 }, { - "epoch": 0.37, - "learning_rate": 0.000244347149250827, - "loss": 0.0226, + "epoch": 0.17, + "learning_rate": 0.0002740276775759166, + "loss": 0.0246, "step": 34320 }, { - "epoch": 0.37, - "learning_rate": 0.0002443309333852241, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.00027402010988290256, + "loss": 0.0235, "step": 34330 }, { - "epoch": 0.37, - "learning_rate": 0.00024431471751962117, - "loss": 0.0231, + "epoch": 0.17, + "learning_rate": 0.00027401254218988854, + "loss": 0.0323, "step": 34340 }, { - "epoch": 0.37, - "learning_rate": 0.0002442985016540183, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.0002740049744968745, + "loss": 0.0235, "step": 34350 }, { - "epoch": 0.37, - "learning_rate": 0.00024428228578841536, - "loss": 0.0188, + "epoch": 0.17, + "learning_rate": 0.0002739974068038605, + "loss": 0.0277, "step": 34360 }, { - "epoch": 0.37, - "learning_rate": 0.0002442660699228125, - "loss": 0.0204, + "epoch": 0.17, + "learning_rate": 0.0002739898391108465, + "loss": 0.0265, "step": 34370 }, { - "epoch": 0.37, - "learning_rate": 0.00024424985405720954, - "loss": 0.0218, + "epoch": 0.17, + "learning_rate": 0.0002739822714178325, + "loss": 0.025, "step": 34380 }, { - "epoch": 0.37, - "learning_rate": 0.00024423363819160666, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.0002739747037248185, + "loss": 0.025, "step": 34390 }, { - "epoch": 0.37, - "learning_rate": 0.00024421742232600373, - "loss": 0.0226, + "epoch": 0.17, + "learning_rate": 0.0002739671360318045, + "loss": 0.0258, "step": 34400 }, { - "epoch": 0.37, - "learning_rate": 0.00024420120646040085, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.00027395956833879047, + "loss": 0.0213, "step": 34410 }, { - "epoch": 0.37, - "learning_rate": 0.0002441849905947979, - "loss": 0.0198, + "epoch": 0.17, + "learning_rate": 0.00027395200064577645, + "loss": 0.0279, "step": 34420 }, { - "epoch": 0.37, - "learning_rate": 0.00024416877472919503, - "loss": 0.0204, + "epoch": 0.17, + "learning_rate": 0.00027394443295276243, + "loss": 0.0225, "step": 34430 }, { - "epoch": 0.37, - "learning_rate": 0.0002441525588635921, - "loss": 0.0226, + "epoch": 0.17, + "learning_rate": 0.0002739368652597484, + "loss": 0.0276, "step": 34440 }, { - "epoch": 0.37, - "learning_rate": 0.00024413634299798922, - "loss": 0.0204, + "epoch": 0.17, + "learning_rate": 0.00027392929756673445, + "loss": 0.0242, "step": 34450 }, { - "epoch": 0.37, - "learning_rate": 0.00024412012713238628, - "loss": 0.0243, + "epoch": 0.17, + "learning_rate": 0.00027392172987372043, + "loss": 0.0296, "step": 34460 }, { - "epoch": 0.37, - "learning_rate": 0.0002441039112667834, - "loss": 0.0209, + "epoch": 0.17, + "learning_rate": 0.0002739141621807064, + "loss": 0.0247, "step": 34470 }, { - "epoch": 0.37, - "learning_rate": 0.0002440876954011805, - "loss": 0.0235, + "epoch": 0.17, + "learning_rate": 0.0002739065944876924, + "loss": 0.0257, "step": 34480 }, { - "epoch": 0.37, - "learning_rate": 0.0002440714795355776, - "loss": 0.0199, + "epoch": 0.17, + "learning_rate": 0.0002738990267946784, + "loss": 0.0237, "step": 34490 }, { - "epoch": 0.37, - "learning_rate": 0.00024405526366997465, - "loss": 0.0259, + "epoch": 0.17, + "learning_rate": 0.00027389145910166436, + "loss": 0.0226, "step": 34500 }, { - "epoch": 0.37, - "learning_rate": 0.00024403904780437177, - "loss": 0.0215, + "epoch": 0.17, + "learning_rate": 0.0002738838914086504, + "loss": 0.0243, "step": 34510 }, { - "epoch": 0.37, - "learning_rate": 0.00024402283193876887, - "loss": 0.0254, + "epoch": 0.17, + "learning_rate": 0.0002738763237156364, + "loss": 0.0301, "step": 34520 }, { - "epoch": 0.37, - "learning_rate": 0.00024400661607316596, - "loss": 0.0204, + "epoch": 0.17, + "learning_rate": 0.00027386875602262236, + "loss": 0.0272, "step": 34530 }, { - "epoch": 0.37, - "learning_rate": 0.00024399040020756308, - "loss": 0.0234, + "epoch": 0.17, + "learning_rate": 0.00027386118832960834, + "loss": 0.0241, "step": 34540 }, { - "epoch": 0.37, - "learning_rate": 0.00024397418434196015, - "loss": 0.0275, + "epoch": 0.17, + "learning_rate": 0.0002738536206365943, + "loss": 0.0273, "step": 34550 }, { - "epoch": 0.37, - "learning_rate": 0.00024395796847635724, - "loss": 0.0195, + "epoch": 0.17, + "learning_rate": 0.0002738460529435803, + "loss": 0.0228, "step": 34560 }, { - "epoch": 0.37, - "learning_rate": 0.00024394175261075436, - "loss": 0.0204, + "epoch": 0.17, + "learning_rate": 0.0002738384852505663, + "loss": 0.0235, "step": 34570 }, { - "epoch": 0.37, - "learning_rate": 0.00024392553674515145, - "loss": 0.0225, + "epoch": 0.17, + "learning_rate": 0.00027383091755755226, + "loss": 0.0268, "step": 34580 }, { - "epoch": 0.37, - "learning_rate": 0.00024390932087954852, - "loss": 0.0221, + "epoch": 0.17, + "learning_rate": 0.00027382334986453824, + "loss": 0.0245, "step": 34590 }, { - "epoch": 0.37, - "learning_rate": 0.0002438931050139456, - "loss": 0.0224, + "epoch": 0.17, + "learning_rate": 0.0002738157821715242, + "loss": 0.0313, "step": 34600 }, { - "epoch": 0.37, - "learning_rate": 0.00024387688914834273, - "loss": 0.025, + "epoch": 0.17, + "learning_rate": 0.00027380821447851026, + "loss": 0.0229, "step": 34610 }, { - "epoch": 0.37, - "learning_rate": 0.00024386067328273982, - "loss": 0.0232, + "epoch": 0.17, + "learning_rate": 0.00027380064678549624, + "loss": 0.0182, "step": 34620 }, { - "epoch": 0.37, - "learning_rate": 0.0002438444574171369, - "loss": 0.0199, + "epoch": 0.17, + "learning_rate": 0.0002737930790924822, + "loss": 0.0224, "step": 34630 }, { - "epoch": 0.37, - "learning_rate": 0.000243828241551534, - "loss": 0.0214, + "epoch": 0.17, + "learning_rate": 0.0002737855113994682, + "loss": 0.026, "step": 34640 }, { - "epoch": 0.37, - "learning_rate": 0.0002438120256859311, - "loss": 0.0239, + "epoch": 0.17, + "learning_rate": 0.0002737779437064542, + "loss": 0.0218, "step": 34650 }, { - "epoch": 0.37, - "learning_rate": 0.0002437958098203282, - "loss": 0.022, + "epoch": 0.17, + "learning_rate": 0.00027377037601344017, + "loss": 0.024, "step": 34660 }, { - "epoch": 0.37, - "learning_rate": 0.00024377959395472526, - "loss": 0.0216, + "epoch": 0.17, + "learning_rate": 0.00027376280832042615, + "loss": 0.0258, "step": 34670 }, { - "epoch": 0.37, - "learning_rate": 0.00024376337808912238, - "loss": 0.0231, + "epoch": 0.17, + "learning_rate": 0.0002737552406274122, + "loss": 0.0192, "step": 34680 }, { - "epoch": 0.38, - "learning_rate": 0.00024374716222351947, - "loss": 0.0237, + "epoch": 0.18, + "learning_rate": 0.00027374767293439817, + "loss": 0.0239, "step": 34690 }, { - "epoch": 0.38, - "learning_rate": 0.0002437309463579166, - "loss": 0.024, + "epoch": 0.18, + "learning_rate": 0.00027374010524138415, + "loss": 0.0198, "step": 34700 }, { - "epoch": 0.38, - "learning_rate": 0.00024371473049231366, - "loss": 0.0233, + "epoch": 0.18, + "learning_rate": 0.00027373253754837013, + "loss": 0.0267, "step": 34710 }, { - "epoch": 0.38, - "learning_rate": 0.00024369851462671075, - "loss": 0.0228, + "epoch": 0.18, + "learning_rate": 0.0002737249698553561, + "loss": 0.0285, "step": 34720 }, { - "epoch": 0.38, - "learning_rate": 0.00024368229876110784, - "loss": 0.0226, + "epoch": 0.18, + "learning_rate": 0.0002737174021623421, + "loss": 0.0223, "step": 34730 }, { - "epoch": 0.38, - "learning_rate": 0.00024366608289550496, - "loss": 0.0182, + "epoch": 0.18, + "learning_rate": 0.00027370983446932813, + "loss": 0.0228, "step": 34740 }, { - "epoch": 0.38, - "learning_rate": 0.00024364986702990203, - "loss": 0.0249, + "epoch": 0.18, + "learning_rate": 0.0002737022667763141, + "loss": 0.0204, "step": 34750 }, { - "epoch": 0.38, - "learning_rate": 0.00024363365116429912, - "loss": 0.0238, + "epoch": 0.18, + "learning_rate": 0.0002736946990833001, + "loss": 0.0211, "step": 34760 }, { - "epoch": 0.38, - "learning_rate": 0.00024361743529869624, - "loss": 0.0241, + "epoch": 0.18, + "learning_rate": 0.00027368713139028607, + "loss": 0.0231, "step": 34770 }, { - "epoch": 0.38, - "learning_rate": 0.00024360121943309333, - "loss": 0.0197, + "epoch": 0.18, + "learning_rate": 0.00027367956369727205, + "loss": 0.0251, "step": 34780 }, { - "epoch": 0.38, - "learning_rate": 0.0002435850035674904, - "loss": 0.0245, + "epoch": 0.18, + "learning_rate": 0.00027367199600425804, + "loss": 0.0243, "step": 34790 }, { - "epoch": 0.38, - "learning_rate": 0.0002435687877018875, - "loss": 0.0224, + "epoch": 0.18, + "learning_rate": 0.00027366442831124407, + "loss": 0.0338, "step": 34800 }, { - "epoch": 0.38, - "learning_rate": 0.0002435525718362846, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.00027365686061823005, + "loss": 0.026, "step": 34810 }, { - "epoch": 0.38, - "learning_rate": 0.0002435363559706817, - "loss": 0.0234, + "epoch": 0.18, + "learning_rate": 0.00027364929292521603, + "loss": 0.0304, "step": 34820 }, { - "epoch": 0.38, - "learning_rate": 0.00024352014010507877, - "loss": 0.0224, + "epoch": 0.18, + "learning_rate": 0.000273641725232202, + "loss": 0.0239, "step": 34830 }, { - "epoch": 0.38, - "learning_rate": 0.0002435039242394759, - "loss": 0.021, + "epoch": 0.18, + "learning_rate": 0.000273634157539188, + "loss": 0.0232, "step": 34840 }, { - "epoch": 0.38, - "learning_rate": 0.00024348770837387298, - "loss": 0.0211, + "epoch": 0.18, + "learning_rate": 0.000273626589846174, + "loss": 0.0273, "step": 34850 }, { - "epoch": 0.38, - "learning_rate": 0.00024347149250827007, - "loss": 0.0233, + "epoch": 0.18, + "learning_rate": 0.00027361902215315996, + "loss": 0.0241, "step": 34860 }, { - "epoch": 0.38, - "learning_rate": 0.00024345527664266714, - "loss": 0.0259, + "epoch": 0.18, + "learning_rate": 0.000273611454460146, + "loss": 0.0213, "step": 34870 }, { - "epoch": 0.38, - "learning_rate": 0.00024343906077706426, - "loss": 0.0265, + "epoch": 0.18, + "learning_rate": 0.000273603886767132, + "loss": 0.0225, "step": 34880 }, { - "epoch": 0.38, - "learning_rate": 0.00024342284491146135, - "loss": 0.0223, + "epoch": 0.18, + "learning_rate": 0.00027359631907411796, + "loss": 0.0259, "step": 34890 }, { - "epoch": 0.38, - "learning_rate": 0.00024340662904585845, - "loss": 0.0221, + "epoch": 0.18, + "learning_rate": 0.00027358875138110394, + "loss": 0.0226, "step": 34900 }, { - "epoch": 0.38, - "learning_rate": 0.00024339041318025554, - "loss": 0.0217, + "epoch": 0.18, + "learning_rate": 0.0002735811836880899, + "loss": 0.0247, "step": 34910 }, { - "epoch": 0.38, - "learning_rate": 0.00024337419731465263, - "loss": 0.022, + "epoch": 0.18, + "learning_rate": 0.0002735736159950759, + "loss": 0.0255, "step": 34920 }, { - "epoch": 0.38, - "learning_rate": 0.00024335798144904972, - "loss": 0.0228, + "epoch": 0.18, + "learning_rate": 0.00027356604830206194, + "loss": 0.0268, "step": 34930 }, { - "epoch": 0.38, - "learning_rate": 0.00024334176558344684, - "loss": 0.0257, + "epoch": 0.18, + "learning_rate": 0.0002735584806090479, + "loss": 0.0275, "step": 34940 }, { - "epoch": 0.38, - "learning_rate": 0.0002433255497178439, - "loss": 0.0234, + "epoch": 0.18, + "learning_rate": 0.0002735509129160339, + "loss": 0.0252, "step": 34950 }, { - "epoch": 0.38, - "learning_rate": 0.000243309333852241, - "loss": 0.0201, + "epoch": 0.18, + "learning_rate": 0.0002735433452230199, + "loss": 0.0232, "step": 34960 }, { - "epoch": 0.38, - "learning_rate": 0.0002432931179866381, - "loss": 0.02, + "epoch": 0.18, + "learning_rate": 0.00027353577753000586, + "loss": 0.0231, "step": 34970 }, { - "epoch": 0.38, - "learning_rate": 0.00024327690212103522, - "loss": 0.0248, + "epoch": 0.18, + "learning_rate": 0.00027352820983699185, + "loss": 0.0299, "step": 34980 }, { - "epoch": 0.38, - "learning_rate": 0.00024326068625543228, - "loss": 0.0249, + "epoch": 0.18, + "learning_rate": 0.0002735206421439778, + "loss": 0.0257, "step": 34990 }, { - "epoch": 0.38, - "learning_rate": 0.00024324447038982937, - "loss": 0.0192, + "epoch": 0.18, + "learning_rate": 0.00027351307445096386, + "loss": 0.0209, "step": 35000 }, { - "epoch": 0.38, - "eval_cer": 0.9215729704657623, - "eval_loss": 0.016215071082115173, - "eval_runtime": 121.5329, - "eval_samples_per_second": 16.456, - "eval_steps_per_second": 4.114, + "epoch": 0.18, + "eval_cer": 0.9144683151109114, + "eval_loss": 0.01787448488175869, + "eval_runtime": 117.4101, + "eval_samples_per_second": 17.034, + "eval_steps_per_second": 4.259, "step": 35000 }, { - "epoch": 0.38, - "learning_rate": 0.0002432282545242265, - "loss": 0.0251, + "epoch": 0.18, + "learning_rate": 0.00027350550675794984, + "loss": 0.0287, "step": 35010 }, { - "epoch": 0.38, - "learning_rate": 0.00024321203865862359, - "loss": 0.0213, + "epoch": 0.18, + "learning_rate": 0.0002734979390649358, + "loss": 0.0266, "step": 35020 }, { - "epoch": 0.38, - "learning_rate": 0.00024319582279302065, - "loss": 0.0193, + "epoch": 0.18, + "learning_rate": 0.0002734903713719218, + "loss": 0.0211, "step": 35030 }, { - "epoch": 0.38, - "learning_rate": 0.00024317960692741777, - "loss": 0.0226, + "epoch": 0.18, + "learning_rate": 0.0002734828036789078, + "loss": 0.0224, "step": 35040 }, { - "epoch": 0.38, - "learning_rate": 0.00024316339106181486, - "loss": 0.0222, + "epoch": 0.18, + "learning_rate": 0.00027347523598589377, + "loss": 0.0237, "step": 35050 }, { - "epoch": 0.38, - "learning_rate": 0.00024314717519621196, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.0002734676682928798, + "loss": 0.0263, "step": 35060 }, { - "epoch": 0.38, - "learning_rate": 0.00024313095933060902, - "loss": 0.0219, + "epoch": 0.18, + "learning_rate": 0.0002734601005998658, + "loss": 0.0274, "step": 35070 }, { - "epoch": 0.38, - "learning_rate": 0.00024311474346500614, - "loss": 0.0196, + "epoch": 0.18, + "learning_rate": 0.00027345253290685177, + "loss": 0.0227, "step": 35080 }, { - "epoch": 0.38, - "learning_rate": 0.00024309852759940324, - "loss": 0.0212, + "epoch": 0.18, + "learning_rate": 0.00027344496521383775, + "loss": 0.0284, "step": 35090 }, { - "epoch": 0.38, - "learning_rate": 0.00024308231173380033, - "loss": 0.0236, + "epoch": 0.18, + "learning_rate": 0.00027343739752082373, + "loss": 0.0232, "step": 35100 }, { - "epoch": 0.38, - "learning_rate": 0.00024306609586819742, - "loss": 0.0209, + "epoch": 0.18, + "learning_rate": 0.0002734298298278097, + "loss": 0.0241, "step": 35110 }, { - "epoch": 0.38, - "learning_rate": 0.0002430498800025945, - "loss": 0.0243, + "epoch": 0.18, + "learning_rate": 0.00027342226213479575, + "loss": 0.025, "step": 35120 }, { - "epoch": 0.38, - "learning_rate": 0.0002430336641369916, - "loss": 0.0252, + "epoch": 0.18, + "learning_rate": 0.00027341469444178173, + "loss": 0.0251, "step": 35130 }, { - "epoch": 0.38, - "learning_rate": 0.00024301744827138873, - "loss": 0.022, + "epoch": 0.18, + "learning_rate": 0.0002734071267487677, + "loss": 0.0227, "step": 35140 }, { - "epoch": 0.38, - "learning_rate": 0.0002430012324057858, - "loss": 0.0204, + "epoch": 0.18, + "learning_rate": 0.0002733995590557537, + "loss": 0.0239, "step": 35150 }, { - "epoch": 0.38, - "learning_rate": 0.00024298501654018288, - "loss": 0.0244, + "epoch": 0.18, + "learning_rate": 0.0002733919913627397, + "loss": 0.0263, "step": 35160 }, { - "epoch": 0.38, - "learning_rate": 0.00024296880067457998, - "loss": 0.024, + "epoch": 0.18, + "learning_rate": 0.00027338442366972566, + "loss": 0.0257, "step": 35170 }, { - "epoch": 0.38, - "learning_rate": 0.0002429525848089771, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.00027337685597671164, + "loss": 0.0263, "step": 35180 }, { - "epoch": 0.38, - "learning_rate": 0.00024293636894337416, - "loss": 0.0204, + "epoch": 0.18, + "learning_rate": 0.00027336928828369767, + "loss": 0.0274, "step": 35190 }, { - "epoch": 0.38, - "learning_rate": 0.00024292015307777126, - "loss": 0.0203, + "epoch": 0.18, + "learning_rate": 0.00027336172059068365, + "loss": 0.0238, "step": 35200 }, { - "epoch": 0.38, - "learning_rate": 0.00024290393721216838, - "loss": 0.0187, + "epoch": 0.18, + "learning_rate": 0.00027335415289766964, + "loss": 0.0302, "step": 35210 }, { - "epoch": 0.38, - "learning_rate": 0.00024288772134656547, - "loss": 0.024, + "epoch": 0.18, + "learning_rate": 0.0002733465852046556, + "loss": 0.0245, "step": 35220 }, { - "epoch": 0.38, - "learning_rate": 0.00024287150548096253, - "loss": 0.0213, + "epoch": 0.18, + "learning_rate": 0.0002733390175116416, + "loss": 0.0286, "step": 35230 }, { - "epoch": 0.38, - "learning_rate": 0.00024285528961535963, - "loss": 0.0232, + "epoch": 0.18, + "learning_rate": 0.0002733314498186276, + "loss": 0.028, "step": 35240 }, { - "epoch": 0.38, - "learning_rate": 0.00024283907374975675, - "loss": 0.0239, + "epoch": 0.18, + "learning_rate": 0.0002733238821256136, + "loss": 0.0231, "step": 35250 }, { - "epoch": 0.38, - "learning_rate": 0.00024282285788415384, - "loss": 0.0231, + "epoch": 0.18, + "learning_rate": 0.0002733163144325996, + "loss": 0.0244, "step": 35260 }, { - "epoch": 0.38, - "learning_rate": 0.00024280664201855096, - "loss": 0.0209, + "epoch": 0.18, + "learning_rate": 0.0002733087467395856, + "loss": 0.0279, "step": 35270 }, { - "epoch": 0.38, - "learning_rate": 0.00024279042615294802, - "loss": 0.0234, + "epoch": 0.18, + "learning_rate": 0.00027330117904657156, + "loss": 0.0198, "step": 35280 }, { - "epoch": 0.38, - "learning_rate": 0.00024277421028734512, - "loss": 0.0264, + "epoch": 0.18, + "learning_rate": 0.00027329361135355754, + "loss": 0.0243, "step": 35290 }, { - "epoch": 0.38, - "learning_rate": 0.0002427579944217422, - "loss": 0.0197, + "epoch": 0.18, + "learning_rate": 0.0002732860436605435, + "loss": 0.0212, "step": 35300 }, { - "epoch": 0.38, - "learning_rate": 0.00024274177855613933, - "loss": 0.0217, + "epoch": 0.18, + "learning_rate": 0.00027327847596752956, + "loss": 0.0283, "step": 35310 }, { - "epoch": 0.38, - "learning_rate": 0.0002427255626905364, - "loss": 0.025, + "epoch": 0.18, + "learning_rate": 0.00027327090827451554, + "loss": 0.0241, "step": 35320 }, { - "epoch": 0.38, - "learning_rate": 0.0002427093468249335, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.0002732633405815015, + "loss": 0.0221, "step": 35330 }, { - "epoch": 0.38, - "learning_rate": 0.0002426931309593306, - "loss": 0.0194, + "epoch": 0.18, + "learning_rate": 0.0002732557728884875, + "loss": 0.023, "step": 35340 }, { - "epoch": 0.38, - "learning_rate": 0.0002426769150937277, - "loss": 0.0208, + "epoch": 0.18, + "learning_rate": 0.0002732482051954735, + "loss": 0.0209, "step": 35350 }, { - "epoch": 0.38, - "learning_rate": 0.00024266069922812477, - "loss": 0.0186, + "epoch": 0.18, + "learning_rate": 0.00027324063750245947, + "loss": 0.0215, "step": 35360 }, { - "epoch": 0.38, - "learning_rate": 0.00024264448336252186, - "loss": 0.0249, + "epoch": 0.18, + "learning_rate": 0.00027323306980944545, + "loss": 0.0196, "step": 35370 }, { - "epoch": 0.38, - "learning_rate": 0.00024262826749691898, - "loss": 0.0194, + "epoch": 0.18, + "learning_rate": 0.0002732255021164315, + "loss": 0.0241, "step": 35380 }, { - "epoch": 0.38, - "learning_rate": 0.00024261205163131607, - "loss": 0.0238, + "epoch": 0.18, + "learning_rate": 0.00027321793442341746, + "loss": 0.0289, "step": 35390 }, { - "epoch": 0.38, - "learning_rate": 0.00024259583576571314, - "loss": 0.0237, + "epoch": 0.18, + "learning_rate": 0.00027321036673040345, + "loss": 0.0303, "step": 35400 }, { - "epoch": 0.38, - "learning_rate": 0.00024257961990011026, - "loss": 0.0235, + "epoch": 0.18, + "learning_rate": 0.0002732027990373894, + "loss": 0.0211, "step": 35410 }, { - "epoch": 0.38, - "learning_rate": 0.00024256340403450735, - "loss": 0.0218, + "epoch": 0.18, + "learning_rate": 0.0002731952313443754, + "loss": 0.025, "step": 35420 }, { - "epoch": 0.38, - "learning_rate": 0.00024254718816890444, - "loss": 0.021, + "epoch": 0.18, + "learning_rate": 0.0002731876636513614, + "loss": 0.0214, "step": 35430 }, { - "epoch": 0.38, - "learning_rate": 0.0002425309723033015, - "loss": 0.0213, + "epoch": 0.18, + "learning_rate": 0.0002731800959583474, + "loss": 0.0198, "step": 35440 }, { - "epoch": 0.38, - "learning_rate": 0.00024251475643769863, - "loss": 0.0237, + "epoch": 0.18, + "learning_rate": 0.0002731725282653334, + "loss": 0.0235, "step": 35450 }, { - "epoch": 0.38, - "learning_rate": 0.00024249854057209572, - "loss": 0.0212, + "epoch": 0.18, + "learning_rate": 0.0002731649605723194, + "loss": 0.0231, "step": 35460 }, { - "epoch": 0.38, - "learning_rate": 0.00024248232470649281, - "loss": 0.0222, + "epoch": 0.18, + "learning_rate": 0.00027315739287930537, + "loss": 0.0221, "step": 35470 }, { - "epoch": 0.38, - "learning_rate": 0.0002424661088408899, - "loss": 0.0189, + "epoch": 0.18, + "learning_rate": 0.00027314982518629135, + "loss": 0.0224, "step": 35480 }, { - "epoch": 0.38, - "learning_rate": 0.000242449892975287, - "loss": 0.02, + "epoch": 0.18, + "learning_rate": 0.00027314225749327733, + "loss": 0.0221, "step": 35490 }, { - "epoch": 0.38, - "learning_rate": 0.0002424336771096841, - "loss": 0.0212, + "epoch": 0.18, + "learning_rate": 0.0002731346898002633, + "loss": 0.024, "step": 35500 }, { - "epoch": 0.38, - "learning_rate": 0.0002424174612440812, - "loss": 0.0202, + "epoch": 0.18, + "learning_rate": 0.00027312712210724935, + "loss": 0.0291, "step": 35510 }, { - "epoch": 0.38, - "learning_rate": 0.00024240124537847828, - "loss": 0.0224, + "epoch": 0.18, + "learning_rate": 0.00027311955441423533, + "loss": 0.0322, "step": 35520 }, { - "epoch": 0.38, - "learning_rate": 0.00024238502951287537, - "loss": 0.0291, + "epoch": 0.18, + "learning_rate": 0.0002731119867212213, + "loss": 0.0227, "step": 35530 }, { - "epoch": 0.38, - "learning_rate": 0.00024236881364727246, - "loss": 0.0229, + "epoch": 0.18, + "learning_rate": 0.0002731044190282073, + "loss": 0.026, "step": 35540 }, { - "epoch": 0.38, - "learning_rate": 0.00024235259778166958, - "loss": 0.0221, + "epoch": 0.18, + "learning_rate": 0.0002730968513351933, + "loss": 0.0252, "step": 35550 }, { - "epoch": 0.38, - "learning_rate": 0.00024233638191606665, - "loss": 0.0222, + "epoch": 0.18, + "learning_rate": 0.00027308928364217926, + "loss": 0.0342, "step": 35560 }, { - "epoch": 0.38, - "learning_rate": 0.00024232016605046374, - "loss": 0.0247, + "epoch": 0.18, + "learning_rate": 0.0002730817159491653, + "loss": 0.0298, "step": 35570 }, { - "epoch": 0.38, - "learning_rate": 0.00024230395018486086, - "loss": 0.023, + "epoch": 0.18, + "learning_rate": 0.0002730741482561513, + "loss": 0.0258, "step": 35580 }, { - "epoch": 0.38, - "learning_rate": 0.00024228773431925795, - "loss": 0.0227, + "epoch": 0.18, + "learning_rate": 0.00027306658056313726, + "loss": 0.0257, "step": 35590 }, { - "epoch": 0.38, - "learning_rate": 0.00024227151845365502, - "loss": 0.0186, + "epoch": 0.18, + "learning_rate": 0.00027305901287012324, + "loss": 0.0302, "step": 35600 }, { - "epoch": 0.38, - "learning_rate": 0.0002422553025880521, - "loss": 0.0219, + "epoch": 0.18, + "learning_rate": 0.0002730514451771092, + "loss": 0.0247, "step": 35610 }, { - "epoch": 0.39, - "learning_rate": 0.00024223908672244923, - "loss": 0.0199, + "epoch": 0.18, + "learning_rate": 0.0002730438774840952, + "loss": 0.0255, "step": 35620 }, { - "epoch": 0.39, - "learning_rate": 0.00024222287085684632, - "loss": 0.0234, + "epoch": 0.18, + "learning_rate": 0.00027303630979108124, + "loss": 0.0271, "step": 35630 }, { - "epoch": 0.39, - "learning_rate": 0.0002422066549912434, - "loss": 0.0207, + "epoch": 0.18, + "learning_rate": 0.0002730287420980672, + "loss": 0.0264, "step": 35640 }, { - "epoch": 0.39, - "learning_rate": 0.0002421904391256405, - "loss": 0.0218, + "epoch": 0.18, + "learning_rate": 0.0002730211744050532, + "loss": 0.0195, "step": 35650 }, { - "epoch": 0.39, - "learning_rate": 0.0002421742232600376, - "loss": 0.0213, + "epoch": 0.18, + "learning_rate": 0.0002730136067120392, + "loss": 0.0241, "step": 35660 }, { - "epoch": 0.39, - "learning_rate": 0.0002421580073944347, - "loss": 0.0196, + "epoch": 0.18, + "learning_rate": 0.00027300603901902516, + "loss": 0.0244, "step": 35670 }, { - "epoch": 0.39, - "learning_rate": 0.00024214179152883176, - "loss": 0.0185, + "epoch": 0.18, + "learning_rate": 0.00027299847132601114, + "loss": 0.0245, "step": 35680 }, { - "epoch": 0.39, - "learning_rate": 0.00024212557566322888, - "loss": 0.0231, + "epoch": 0.18, + "learning_rate": 0.0002729909036329971, + "loss": 0.0234, "step": 35690 }, { - "epoch": 0.39, - "learning_rate": 0.00024210935979762597, - "loss": 0.023, + "epoch": 0.18, + "learning_rate": 0.00027298333593998316, + "loss": 0.0209, "step": 35700 }, { - "epoch": 0.39, - "learning_rate": 0.0002420931439320231, - "loss": 0.0212, + "epoch": 0.18, + "learning_rate": 0.00027297576824696914, + "loss": 0.0244, "step": 35710 }, { - "epoch": 0.39, - "learning_rate": 0.00024207692806642016, - "loss": 0.0179, + "epoch": 0.18, + "learning_rate": 0.0002729682005539551, + "loss": 0.0224, "step": 35720 }, { - "epoch": 0.39, - "learning_rate": 0.00024206071220081725, - "loss": 0.0166, + "epoch": 0.18, + "learning_rate": 0.0002729606328609411, + "loss": 0.0231, "step": 35730 }, { - "epoch": 0.39, - "learning_rate": 0.00024204449633521434, - "loss": 0.0214, + "epoch": 0.18, + "learning_rate": 0.0002729530651679271, + "loss": 0.0246, "step": 35740 }, { - "epoch": 0.39, - "learning_rate": 0.00024202828046961146, - "loss": 0.0235, + "epoch": 0.18, + "learning_rate": 0.00027294549747491307, + "loss": 0.0195, "step": 35750 }, { - "epoch": 0.39, - "learning_rate": 0.00024201206460400853, - "loss": 0.0202, + "epoch": 0.18, + "learning_rate": 0.0002729379297818991, + "loss": 0.0239, "step": 35760 }, { - "epoch": 0.39, - "learning_rate": 0.00024199584873840562, - "loss": 0.0211, + "epoch": 0.18, + "learning_rate": 0.0002729303620888851, + "loss": 0.0248, "step": 35770 }, { - "epoch": 0.39, - "learning_rate": 0.00024197963287280274, - "loss": 0.0228, + "epoch": 0.18, + "learning_rate": 0.00027292279439587107, + "loss": 0.0257, "step": 35780 }, { - "epoch": 0.39, - "learning_rate": 0.00024196341700719984, - "loss": 0.0181, + "epoch": 0.18, + "learning_rate": 0.00027291522670285705, + "loss": 0.0179, "step": 35790 }, { - "epoch": 0.39, - "learning_rate": 0.0002419472011415969, - "loss": 0.0223, + "epoch": 0.18, + "learning_rate": 0.00027290765900984303, + "loss": 0.0221, "step": 35800 }, { - "epoch": 0.39, - "learning_rate": 0.000241930985275994, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.000272900091316829, + "loss": 0.0205, "step": 35810 }, { - "epoch": 0.39, - "learning_rate": 0.00024191476941039111, - "loss": 0.0188, + "epoch": 0.18, + "learning_rate": 0.000272892523623815, + "loss": 0.0231, "step": 35820 }, { - "epoch": 0.39, - "learning_rate": 0.0002418985535447882, - "loss": 0.02, + "epoch": 0.18, + "learning_rate": 0.00027288495593080097, + "loss": 0.0268, "step": 35830 }, { - "epoch": 0.39, - "learning_rate": 0.00024188233767918527, - "loss": 0.0196, + "epoch": 0.18, + "learning_rate": 0.00027287738823778695, + "loss": 0.0242, "step": 35840 }, { - "epoch": 0.39, - "learning_rate": 0.0002418661218135824, - "loss": 0.0269, + "epoch": 0.18, + "learning_rate": 0.00027286982054477294, + "loss": 0.0212, "step": 35850 }, { - "epoch": 0.39, - "learning_rate": 0.00024184990594797948, - "loss": 0.0172, + "epoch": 0.18, + "learning_rate": 0.00027286225285175897, + "loss": 0.0261, "step": 35860 }, { - "epoch": 0.39, - "learning_rate": 0.00024183369008237658, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.00027285468515874495, + "loss": 0.0323, "step": 35870 }, { - "epoch": 0.39, - "learning_rate": 0.00024181747421677364, - "loss": 0.0188, + "epoch": 0.18, + "learning_rate": 0.00027284711746573093, + "loss": 0.0225, "step": 35880 }, { - "epoch": 0.39, - "learning_rate": 0.00024180125835117076, - "loss": 0.0241, + "epoch": 0.18, + "learning_rate": 0.0002728395497727169, + "loss": 0.0265, "step": 35890 }, { - "epoch": 0.39, - "learning_rate": 0.00024178504248556786, - "loss": 0.0193, + "epoch": 0.18, + "learning_rate": 0.0002728319820797029, + "loss": 0.0262, "step": 35900 }, { - "epoch": 0.39, - "learning_rate": 0.00024176882661996495, - "loss": 0.0243, + "epoch": 0.18, + "learning_rate": 0.0002728244143866889, + "loss": 0.0237, "step": 35910 }, { - "epoch": 0.39, - "learning_rate": 0.00024175261075436204, - "loss": 0.0209, + "epoch": 0.18, + "learning_rate": 0.00027281684669367486, + "loss": 0.0243, "step": 35920 }, { - "epoch": 0.39, - "learning_rate": 0.00024173639488875913, - "loss": 0.0218, + "epoch": 0.18, + "learning_rate": 0.0002728092790006609, + "loss": 0.0249, "step": 35930 }, { - "epoch": 0.39, - "learning_rate": 0.00024172017902315623, - "loss": 0.0232, + "epoch": 0.18, + "learning_rate": 0.0002728017113076469, + "loss": 0.0273, "step": 35940 }, { - "epoch": 0.39, - "learning_rate": 0.00024170396315755335, - "loss": 0.0222, + "epoch": 0.18, + "learning_rate": 0.00027279414361463286, + "loss": 0.0284, "step": 35950 }, { - "epoch": 0.39, - "learning_rate": 0.0002416877472919504, - "loss": 0.0201, + "epoch": 0.18, + "learning_rate": 0.00027278657592161884, + "loss": 0.0232, "step": 35960 }, { - "epoch": 0.39, - "learning_rate": 0.0002416715314263475, - "loss": 0.0221, + "epoch": 0.18, + "learning_rate": 0.0002727790082286048, + "loss": 0.0257, "step": 35970 }, { - "epoch": 0.39, - "learning_rate": 0.0002416553155607446, - "loss": 0.0188, + "epoch": 0.18, + "learning_rate": 0.0002727714405355908, + "loss": 0.0219, "step": 35980 }, { - "epoch": 0.39, - "learning_rate": 0.00024163909969514172, - "loss": 0.0208, + "epoch": 0.18, + "learning_rate": 0.00027276387284257684, + "loss": 0.0303, "step": 35990 }, { - "epoch": 0.39, - "learning_rate": 0.0002416228838295388, - "loss": 0.0159, + "epoch": 0.18, + "learning_rate": 0.0002727563051495628, + "loss": 0.0288, "step": 36000 }, { - "epoch": 0.39, - "eval_cer": 0.9215590728184603, - "eval_loss": 0.01598510891199112, - "eval_runtime": 121.8638, - "eval_samples_per_second": 16.412, - "eval_steps_per_second": 4.103, + "epoch": 0.18, + "eval_cer": 0.9144993677869243, + "eval_loss": 0.017736734822392464, + "eval_runtime": 117.3015, + "eval_samples_per_second": 17.05, + "eval_steps_per_second": 4.263, "step": 36000 }, { - "epoch": 0.39, - "learning_rate": 0.00024160666796393588, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.0002727487374565488, + "loss": 0.024, "step": 36010 }, { - "epoch": 0.39, - "learning_rate": 0.000241590452098333, - "loss": 0.0232, + "epoch": 0.18, + "learning_rate": 0.0002727411697635348, + "loss": 0.0263, "step": 36020 }, { - "epoch": 0.39, - "learning_rate": 0.0002415742362327301, - "loss": 0.0218, + "epoch": 0.18, + "learning_rate": 0.00027273360207052076, + "loss": 0.0304, "step": 36030 }, { - "epoch": 0.39, - "learning_rate": 0.00024155802036712718, - "loss": 0.0173, + "epoch": 0.18, + "learning_rate": 0.00027272603437750675, + "loss": 0.0227, "step": 36040 }, { - "epoch": 0.39, - "learning_rate": 0.00024154180450152427, - "loss": 0.0229, + "epoch": 0.18, + "learning_rate": 0.0002727184666844927, + "loss": 0.0254, "step": 36050 }, { - "epoch": 0.39, - "learning_rate": 0.00024152558863592137, - "loss": 0.0228, + "epoch": 0.18, + "learning_rate": 0.00027271089899147876, + "loss": 0.0246, "step": 36060 }, { - "epoch": 0.39, - "learning_rate": 0.00024150937277031846, - "loss": 0.0248, + "epoch": 0.18, + "learning_rate": 0.00027270333129846474, + "loss": 0.0275, "step": 36070 }, { - "epoch": 0.39, - "learning_rate": 0.00024149315690471558, - "loss": 0.02, + "epoch": 0.18, + "learning_rate": 0.0002726957636054507, + "loss": 0.0228, "step": 36080 }, { - "epoch": 0.39, - "learning_rate": 0.00024147694103911265, - "loss": 0.0246, + "epoch": 0.18, + "learning_rate": 0.0002726881959124367, + "loss": 0.0233, "step": 36090 }, { - "epoch": 0.39, - "learning_rate": 0.00024146072517350974, - "loss": 0.024, + "epoch": 0.18, + "learning_rate": 0.0002726806282194227, + "loss": 0.0226, "step": 36100 }, { - "epoch": 0.39, - "learning_rate": 0.00024144450930790683, - "loss": 0.0192, + "epoch": 0.18, + "learning_rate": 0.00027267306052640867, + "loss": 0.0244, "step": 36110 }, { - "epoch": 0.39, - "learning_rate": 0.00024142829344230395, - "loss": 0.0251, + "epoch": 0.18, + "learning_rate": 0.0002726654928333947, + "loss": 0.0246, "step": 36120 }, { - "epoch": 0.39, - "learning_rate": 0.00024141207757670102, - "loss": 0.021, + "epoch": 0.18, + "learning_rate": 0.0002726579251403807, + "loss": 0.0263, "step": 36130 }, { - "epoch": 0.39, - "learning_rate": 0.0002413958617110981, - "loss": 0.0239, + "epoch": 0.18, + "learning_rate": 0.00027265035744736667, + "loss": 0.0262, "step": 36140 }, { - "epoch": 0.39, - "learning_rate": 0.00024137964584549523, - "loss": 0.0245, + "epoch": 0.18, + "learning_rate": 0.00027264278975435265, + "loss": 0.0247, "step": 36150 }, { - "epoch": 0.39, - "learning_rate": 0.00024136342997989232, - "loss": 0.0245, + "epoch": 0.18, + "learning_rate": 0.00027263522206133863, + "loss": 0.0173, "step": 36160 }, { - "epoch": 0.39, - "learning_rate": 0.0002413472141142894, - "loss": 0.0215, + "epoch": 0.18, + "learning_rate": 0.0002726276543683246, + "loss": 0.0275, "step": 36170 }, { - "epoch": 0.39, - "learning_rate": 0.00024133099824868648, - "loss": 0.0197, + "epoch": 0.18, + "learning_rate": 0.00027262008667531065, + "loss": 0.0216, "step": 36180 }, { - "epoch": 0.39, - "learning_rate": 0.0002413147823830836, - "loss": 0.0264, + "epoch": 0.18, + "learning_rate": 0.00027261251898229663, + "loss": 0.0252, "step": 36190 }, { - "epoch": 0.39, - "learning_rate": 0.0002412985665174807, - "loss": 0.0251, + "epoch": 0.18, + "learning_rate": 0.0002726049512892826, + "loss": 0.0233, "step": 36200 }, { - "epoch": 0.39, - "learning_rate": 0.00024128235065187776, - "loss": 0.0208, + "epoch": 0.18, + "learning_rate": 0.0002725973835962686, + "loss": 0.0243, "step": 36210 }, { - "epoch": 0.39, - "learning_rate": 0.00024126613478627488, - "loss": 0.0171, + "epoch": 0.18, + "learning_rate": 0.0002725898159032546, + "loss": 0.0275, "step": 36220 }, { - "epoch": 0.39, - "learning_rate": 0.00024124991892067197, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.00027258224821024056, + "loss": 0.0284, "step": 36230 }, { - "epoch": 0.39, - "learning_rate": 0.00024123370305506906, - "loss": 0.0258, + "epoch": 0.18, + "learning_rate": 0.00027257468051722654, + "loss": 0.034, "step": 36240 }, { - "epoch": 0.39, - "learning_rate": 0.00024121748718946613, - "loss": 0.018, + "epoch": 0.18, + "learning_rate": 0.00027256711282421257, + "loss": 0.024, "step": 36250 }, { - "epoch": 0.39, - "learning_rate": 0.00024120127132386325, - "loss": 0.0216, + "epoch": 0.18, + "learning_rate": 0.00027255954513119855, + "loss": 0.0281, "step": 36260 }, { - "epoch": 0.39, - "learning_rate": 0.00024118505545826034, - "loss": 0.0223, + "epoch": 0.18, + "learning_rate": 0.00027255197743818454, + "loss": 0.0238, "step": 36270 }, { - "epoch": 0.39, - "learning_rate": 0.00024116883959265746, - "loss": 0.0214, + "epoch": 0.18, + "learning_rate": 0.0002725444097451705, + "loss": 0.0279, "step": 36280 }, { - "epoch": 0.39, - "learning_rate": 0.00024115262372705453, - "loss": 0.0217, + "epoch": 0.18, + "learning_rate": 0.0002725368420521565, + "loss": 0.0303, "step": 36290 }, { - "epoch": 0.39, - "learning_rate": 0.00024113640786145162, - "loss": 0.0242, + "epoch": 0.18, + "learning_rate": 0.0002725292743591425, + "loss": 0.0305, "step": 36300 }, { - "epoch": 0.39, - "learning_rate": 0.0002411201919958487, - "loss": 0.0216, + "epoch": 0.18, + "learning_rate": 0.0002725217066661285, + "loss": 0.0226, "step": 36310 }, { - "epoch": 0.39, - "learning_rate": 0.00024110397613024583, - "loss": 0.0214, + "epoch": 0.18, + "learning_rate": 0.0002725141389731145, + "loss": 0.0211, "step": 36320 }, { - "epoch": 0.39, - "learning_rate": 0.0002410877602646429, - "loss": 0.0202, + "epoch": 0.18, + "learning_rate": 0.0002725065712801005, + "loss": 0.0224, "step": 36330 }, { - "epoch": 0.39, - "learning_rate": 0.00024107154439904, - "loss": 0.0285, + "epoch": 0.18, + "learning_rate": 0.00027249900358708646, + "loss": 0.021, "step": 36340 }, { - "epoch": 0.39, - "learning_rate": 0.0002410553285334371, - "loss": 0.0202, + "epoch": 0.18, + "learning_rate": 0.00027249143589407244, + "loss": 0.0276, "step": 36350 }, { - "epoch": 0.39, - "learning_rate": 0.0002410391126678342, - "loss": 0.0197, + "epoch": 0.18, + "learning_rate": 0.0002724838682010584, + "loss": 0.0245, "step": 36360 }, { - "epoch": 0.39, - "learning_rate": 0.00024102289680223127, - "loss": 0.0243, + "epoch": 0.18, + "learning_rate": 0.00027247630050804446, + "loss": 0.024, "step": 36370 }, { - "epoch": 0.39, - "learning_rate": 0.00024100668093662836, - "loss": 0.0204, + "epoch": 0.18, + "learning_rate": 0.00027246873281503044, + "loss": 0.0213, "step": 36380 }, { - "epoch": 0.39, - "learning_rate": 0.00024099046507102548, - "loss": 0.0195, + "epoch": 0.18, + "learning_rate": 0.0002724611651220164, + "loss": 0.0307, "step": 36390 }, { - "epoch": 0.39, - "learning_rate": 0.00024097424920542257, - "loss": 0.022, + "epoch": 0.18, + "learning_rate": 0.0002724535974290024, + "loss": 0.0263, "step": 36400 }, { - "epoch": 0.39, - "learning_rate": 0.00024095803333981964, - "loss": 0.0226, + "epoch": 0.18, + "learning_rate": 0.0002724460297359884, + "loss": 0.0227, "step": 36410 }, { - "epoch": 0.39, - "learning_rate": 0.00024094181747421676, - "loss": 0.0212, + "epoch": 0.18, + "learning_rate": 0.00027243846204297437, + "loss": 0.0236, "step": 36420 }, { - "epoch": 0.39, - "learning_rate": 0.00024092560160861385, - "loss": 0.0209, + "epoch": 0.18, + "learning_rate": 0.00027243089434996035, + "loss": 0.026, "step": 36430 }, { - "epoch": 0.39, - "learning_rate": 0.00024090938574301095, - "loss": 0.0221, + "epoch": 0.18, + "learning_rate": 0.0002724233266569464, + "loss": 0.0254, "step": 36440 }, { - "epoch": 0.39, - "learning_rate": 0.000240893169877408, - "loss": 0.0226, + "epoch": 0.18, + "learning_rate": 0.00027241575896393236, + "loss": 0.0281, "step": 36450 }, { - "epoch": 0.39, - "learning_rate": 0.00024087695401180513, - "loss": 0.0202, + "epoch": 0.18, + "learning_rate": 0.00027240819127091835, + "loss": 0.0232, "step": 36460 }, { - "epoch": 0.39, - "learning_rate": 0.00024086073814620222, - "loss": 0.0268, + "epoch": 0.18, + "learning_rate": 0.0002724006235779043, + "loss": 0.0223, "step": 36470 }, { - "epoch": 0.39, - "learning_rate": 0.00024084452228059932, - "loss": 0.029, + "epoch": 0.18, + "learning_rate": 0.0002723930558848903, + "loss": 0.0208, "step": 36480 }, { - "epoch": 0.39, - "learning_rate": 0.0002408283064149964, - "loss": 0.0236, + "epoch": 0.18, + "learning_rate": 0.0002723854881918763, + "loss": 0.0249, "step": 36490 }, { - "epoch": 0.39, - "learning_rate": 0.0002408120905493935, - "loss": 0.0221, + "epoch": 0.18, + "learning_rate": 0.0002723779204988623, + "loss": 0.023, "step": 36500 }, { - "epoch": 0.39, - "learning_rate": 0.0002407958746837906, - "loss": 0.0218, + "epoch": 0.18, + "learning_rate": 0.0002723703528058483, + "loss": 0.021, "step": 36510 }, { - "epoch": 0.39, - "learning_rate": 0.00024077965881818771, - "loss": 0.0187, + "epoch": 0.18, + "learning_rate": 0.0002723627851128343, + "loss": 0.03, "step": 36520 }, { - "epoch": 0.39, - "learning_rate": 0.00024076344295258478, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.00027235521741982027, + "loss": 0.0234, "step": 36530 }, { - "epoch": 0.4, - "learning_rate": 0.00024074722708698187, - "loss": 0.0207, + "epoch": 0.18, + "learning_rate": 0.00027234764972680625, + "loss": 0.0242, "step": 36540 }, { - "epoch": 0.4, - "learning_rate": 0.00024073101122137897, - "loss": 0.0194, + "epoch": 0.18, + "learning_rate": 0.00027234008203379223, + "loss": 0.0294, "step": 36550 }, { - "epoch": 0.4, - "learning_rate": 0.00024071479535577609, - "loss": 0.0236, + "epoch": 0.18, + "learning_rate": 0.0002723325143407782, + "loss": 0.0256, "step": 36560 }, { - "epoch": 0.4, - "learning_rate": 0.00024069857949017315, - "loss": 0.0229, + "epoch": 0.18, + "learning_rate": 0.00027232494664776425, + "loss": 0.021, "step": 36570 }, { - "epoch": 0.4, - "learning_rate": 0.00024068236362457024, - "loss": 0.0187, + "epoch": 0.18, + "learning_rate": 0.00027231737895475023, + "loss": 0.0243, "step": 36580 }, { - "epoch": 0.4, - "learning_rate": 0.00024066614775896736, - "loss": 0.0235, + "epoch": 0.18, + "learning_rate": 0.0002723098112617362, + "loss": 0.028, "step": 36590 }, { - "epoch": 0.4, - "learning_rate": 0.00024064993189336446, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.0002723022435687222, + "loss": 0.0244, "step": 36600 }, { - "epoch": 0.4, - "learning_rate": 0.00024063371602776152, - "loss": 0.0204, + "epoch": 0.18, + "learning_rate": 0.0002722946758757082, + "loss": 0.0219, "step": 36610 }, { - "epoch": 0.4, - "learning_rate": 0.00024061750016215861, - "loss": 0.0214, + "epoch": 0.18, + "learning_rate": 0.00027228710818269416, + "loss": 0.026, "step": 36620 }, { - "epoch": 0.4, - "learning_rate": 0.00024060128429655573, - "loss": 0.0207, + "epoch": 0.18, + "learning_rate": 0.0002722795404896802, + "loss": 0.0216, "step": 36630 }, { - "epoch": 0.4, - "learning_rate": 0.00024058506843095283, - "loss": 0.0266, + "epoch": 0.18, + "learning_rate": 0.0002722719727966662, + "loss": 0.0226, "step": 36640 }, { - "epoch": 0.4, - "learning_rate": 0.0002405688525653499, - "loss": 0.0224, + "epoch": 0.18, + "learning_rate": 0.00027226440510365216, + "loss": 0.0201, "step": 36650 }, { - "epoch": 0.4, - "learning_rate": 0.000240552636699747, - "loss": 0.022, + "epoch": 0.18, + "learning_rate": 0.00027225683741063814, + "loss": 0.0263, "step": 36660 }, { - "epoch": 0.4, - "learning_rate": 0.0002405364208341441, - "loss": 0.0262, + "epoch": 0.19, + "learning_rate": 0.0002722492697176241, + "loss": 0.0205, "step": 36670 }, { - "epoch": 0.4, - "learning_rate": 0.0002405202049685412, - "loss": 0.0233, + "epoch": 0.19, + "learning_rate": 0.0002722417020246101, + "loss": 0.0231, "step": 36680 }, { - "epoch": 0.4, - "learning_rate": 0.00024050398910293832, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.00027223413433159614, + "loss": 0.0238, "step": 36690 }, { - "epoch": 0.4, - "learning_rate": 0.00024048777323733538, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.0002722265666385821, + "loss": 0.0249, "step": 36700 }, { - "epoch": 0.4, - "learning_rate": 0.00024047155737173248, - "loss": 0.0214, + "epoch": 0.19, + "learning_rate": 0.0002722189989455681, + "loss": 0.0224, "step": 36710 }, { - "epoch": 0.4, - "learning_rate": 0.0002404553415061296, - "loss": 0.0196, + "epoch": 0.19, + "learning_rate": 0.0002722114312525541, + "loss": 0.0221, "step": 36720 }, { - "epoch": 0.4, - "learning_rate": 0.0002404391256405267, - "loss": 0.0199, + "epoch": 0.19, + "learning_rate": 0.00027220386355954006, + "loss": 0.0247, "step": 36730 }, { - "epoch": 0.4, - "learning_rate": 0.00024042290977492375, - "loss": 0.02, + "epoch": 0.19, + "learning_rate": 0.00027219629586652604, + "loss": 0.0195, "step": 36740 }, { - "epoch": 0.4, - "learning_rate": 0.00024040669390932085, - "loss": 0.0213, + "epoch": 0.19, + "learning_rate": 0.000272188728173512, + "loss": 0.0206, "step": 36750 }, { - "epoch": 0.4, - "learning_rate": 0.00024039047804371797, - "loss": 0.021, + "epoch": 0.19, + "learning_rate": 0.00027218116048049806, + "loss": 0.0219, "step": 36760 }, { - "epoch": 0.4, - "learning_rate": 0.00024037426217811506, - "loss": 0.0224, + "epoch": 0.19, + "learning_rate": 0.00027217359278748404, + "loss": 0.0263, "step": 36770 }, { - "epoch": 0.4, - "learning_rate": 0.00024035804631251213, - "loss": 0.0178, + "epoch": 0.19, + "learning_rate": 0.00027216602509447, + "loss": 0.0195, "step": 36780 }, { - "epoch": 0.4, - "learning_rate": 0.00024034183044690925, - "loss": 0.023, + "epoch": 0.19, + "learning_rate": 0.000272158457401456, + "loss": 0.0277, "step": 36790 }, { - "epoch": 0.4, - "learning_rate": 0.00024032561458130634, - "loss": 0.0263, + "epoch": 0.19, + "learning_rate": 0.000272150889708442, + "loss": 0.0247, "step": 36800 }, { - "epoch": 0.4, - "learning_rate": 0.00024030939871570343, - "loss": 0.0256, + "epoch": 0.19, + "learning_rate": 0.00027214332201542797, + "loss": 0.0289, "step": 36810 }, { - "epoch": 0.4, - "learning_rate": 0.0002402931828501005, - "loss": 0.0207, + "epoch": 0.19, + "learning_rate": 0.000272135754322414, + "loss": 0.0276, "step": 36820 }, { - "epoch": 0.4, - "learning_rate": 0.00024027696698449762, - "loss": 0.0205, + "epoch": 0.19, + "learning_rate": 0.0002721281866294, + "loss": 0.0266, "step": 36830 }, { - "epoch": 0.4, - "learning_rate": 0.0002402607511188947, - "loss": 0.02, + "epoch": 0.19, + "learning_rate": 0.00027212061893638597, + "loss": 0.0258, "step": 36840 }, { - "epoch": 0.4, - "learning_rate": 0.0002402445352532918, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.00027211305124337195, + "loss": 0.0262, "step": 36850 }, { - "epoch": 0.4, - "learning_rate": 0.0002402283193876889, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.00027210548355035793, + "loss": 0.0253, "step": 36860 }, { - "epoch": 0.4, - "learning_rate": 0.000240212103522086, - "loss": 0.0175, + "epoch": 0.19, + "learning_rate": 0.0002720979158573439, + "loss": 0.028, "step": 36870 }, { - "epoch": 0.4, - "learning_rate": 0.00024019588765648308, - "loss": 0.0221, + "epoch": 0.19, + "learning_rate": 0.00027209034816432995, + "loss": 0.0239, "step": 36880 }, { - "epoch": 0.4, - "learning_rate": 0.0002401796717908802, - "loss": 0.0205, + "epoch": 0.19, + "learning_rate": 0.0002720827804713159, + "loss": 0.0191, "step": 36890 }, { - "epoch": 0.4, - "learning_rate": 0.00024016345592527727, - "loss": 0.0209, + "epoch": 0.19, + "learning_rate": 0.0002720752127783019, + "loss": 0.0267, "step": 36900 }, { - "epoch": 0.4, - "learning_rate": 0.00024014724005967436, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.0002720676450852879, + "loss": 0.0195, "step": 36910 }, { - "epoch": 0.4, - "learning_rate": 0.00024013102419407145, - "loss": 0.0183, + "epoch": 0.19, + "learning_rate": 0.00027206007739227387, + "loss": 0.0199, "step": 36920 }, { - "epoch": 0.4, - "learning_rate": 0.00024011480832846857, - "loss": 0.021, + "epoch": 0.19, + "learning_rate": 0.00027205250969925985, + "loss": 0.02, "step": 36930 }, { - "epoch": 0.4, - "learning_rate": 0.00024009859246286564, - "loss": 0.0208, + "epoch": 0.19, + "learning_rate": 0.00027204494200624583, + "loss": 0.0271, "step": 36940 }, { - "epoch": 0.4, - "learning_rate": 0.00024008237659726273, - "loss": 0.0239, + "epoch": 0.19, + "learning_rate": 0.00027203737431323187, + "loss": 0.021, "step": 36950 }, { - "epoch": 0.4, - "learning_rate": 0.00024006616073165985, - "loss": 0.0271, + "epoch": 0.19, + "learning_rate": 0.00027202980662021785, + "loss": 0.0229, "step": 36960 }, { - "epoch": 0.4, - "learning_rate": 0.00024004994486605694, - "loss": 0.0209, + "epoch": 0.19, + "learning_rate": 0.00027202223892720383, + "loss": 0.0295, "step": 36970 }, { - "epoch": 0.4, - "learning_rate": 0.000240033729000454, - "loss": 0.0246, + "epoch": 0.19, + "learning_rate": 0.0002720146712341898, + "loss": 0.0239, "step": 36980 }, { - "epoch": 0.4, - "learning_rate": 0.0002400175131348511, - "loss": 0.0247, + "epoch": 0.19, + "learning_rate": 0.0002720071035411758, + "loss": 0.0301, "step": 36990 }, { - "epoch": 0.4, - "learning_rate": 0.00024000129726924822, - "loss": 0.0205, + "epoch": 0.19, + "learning_rate": 0.0002719995358481618, + "loss": 0.0227, "step": 37000 }, { - "epoch": 0.4, - "eval_cer": 0.9216033715692354, - "eval_loss": 0.01503350492566824, - "eval_runtime": 121.5384, - "eval_samples_per_second": 16.456, - "eval_steps_per_second": 4.114, + "epoch": 0.19, + "eval_cer": 0.9144654039225352, + "eval_loss": 0.018076682463288307, + "eval_runtime": 117.2546, + "eval_samples_per_second": 17.057, + "eval_steps_per_second": 4.264, "step": 37000 }, { - "epoch": 0.4, - "learning_rate": 0.0002399850814036453, - "loss": 0.0237, + "epoch": 0.19, + "learning_rate": 0.0002719919681551478, + "loss": 0.0242, "step": 37010 }, { - "epoch": 0.4, - "learning_rate": 0.00023996886553804238, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.0002719844004621338, + "loss": 0.0248, "step": 37020 }, { - "epoch": 0.4, - "learning_rate": 0.0002399526496724395, - "loss": 0.0214, + "epoch": 0.19, + "learning_rate": 0.0002719768327691198, + "loss": 0.0234, "step": 37030 }, { - "epoch": 0.4, - "learning_rate": 0.0002399364338068366, - "loss": 0.0213, + "epoch": 0.19, + "learning_rate": 0.00027196926507610576, + "loss": 0.0233, "step": 37040 }, { - "epoch": 0.4, - "learning_rate": 0.00023992021794123368, - "loss": 0.0224, + "epoch": 0.19, + "learning_rate": 0.00027196169738309174, + "loss": 0.022, "step": 37050 }, { - "epoch": 0.4, - "learning_rate": 0.00023990400207563078, - "loss": 0.0223, + "epoch": 0.19, + "learning_rate": 0.0002719541296900777, + "loss": 0.0241, "step": 37060 }, { - "epoch": 0.4, - "learning_rate": 0.00023988778621002787, - "loss": 0.0258, + "epoch": 0.19, + "learning_rate": 0.0002719465619970637, + "loss": 0.0235, "step": 37070 }, { - "epoch": 0.4, - "learning_rate": 0.00023987157034442496, - "loss": 0.0233, + "epoch": 0.19, + "learning_rate": 0.0002719389943040497, + "loss": 0.0225, "step": 37080 }, { - "epoch": 0.4, - "learning_rate": 0.00023985535447882208, - "loss": 0.02, + "epoch": 0.19, + "learning_rate": 0.00027193142661103566, + "loss": 0.0228, "step": 37090 }, { - "epoch": 0.4, - "learning_rate": 0.00023983913861321915, - "loss": 0.0224, + "epoch": 0.19, + "learning_rate": 0.00027192385891802165, + "loss": 0.0285, "step": 37100 }, { - "epoch": 0.4, - "learning_rate": 0.00023982292274761624, - "loss": 0.0215, + "epoch": 0.19, + "learning_rate": 0.00027191629122500763, + "loss": 0.0269, "step": 37110 }, { - "epoch": 0.4, - "learning_rate": 0.00023980670688201333, - "loss": 0.0213, + "epoch": 0.19, + "learning_rate": 0.00027190872353199366, + "loss": 0.0351, "step": 37120 }, { - "epoch": 0.4, - "learning_rate": 0.00023979049101641045, - "loss": 0.0185, + "epoch": 0.19, + "learning_rate": 0.00027190115583897964, + "loss": 0.022, "step": 37130 }, { - "epoch": 0.4, - "learning_rate": 0.00023977427515080752, - "loss": 0.0222, + "epoch": 0.19, + "learning_rate": 0.0002718935881459656, + "loss": 0.0265, "step": 37140 }, { - "epoch": 0.4, - "learning_rate": 0.0002397580592852046, - "loss": 0.0247, + "epoch": 0.19, + "learning_rate": 0.0002718860204529516, + "loss": 0.0259, "step": 37150 }, { - "epoch": 0.4, - "learning_rate": 0.00023974184341960173, - "loss": 0.0273, + "epoch": 0.19, + "learning_rate": 0.0002718784527599376, + "loss": 0.0287, "step": 37160 }, { - "epoch": 0.4, - "learning_rate": 0.00023972562755399882, - "loss": 0.0215, + "epoch": 0.19, + "learning_rate": 0.00027187088506692357, + "loss": 0.0231, "step": 37170 }, { - "epoch": 0.4, - "learning_rate": 0.0002397094116883959, - "loss": 0.0223, + "epoch": 0.19, + "learning_rate": 0.0002718633173739096, + "loss": 0.0226, "step": 37180 }, { - "epoch": 0.4, - "learning_rate": 0.00023969319582279298, - "loss": 0.0267, + "epoch": 0.19, + "learning_rate": 0.0002718557496808956, + "loss": 0.0229, "step": 37190 }, { - "epoch": 0.4, - "learning_rate": 0.0002396769799571901, - "loss": 0.0248, + "epoch": 0.19, + "learning_rate": 0.00027184818198788157, + "loss": 0.0229, "step": 37200 }, { - "epoch": 0.4, - "learning_rate": 0.0002396607640915872, - "loss": 0.0237, + "epoch": 0.19, + "learning_rate": 0.00027184061429486755, + "loss": 0.0209, "step": 37210 }, { - "epoch": 0.4, - "learning_rate": 0.00023964454822598426, - "loss": 0.0235, + "epoch": 0.19, + "learning_rate": 0.00027183304660185353, + "loss": 0.0271, "step": 37220 }, { - "epoch": 0.4, - "learning_rate": 0.00023962833236038138, - "loss": 0.0251, + "epoch": 0.19, + "learning_rate": 0.0002718254789088395, + "loss": 0.0244, "step": 37230 }, { - "epoch": 0.4, - "learning_rate": 0.00023961211649477847, - "loss": 0.0213, + "epoch": 0.19, + "learning_rate": 0.00027181791121582555, + "loss": 0.0243, "step": 37240 }, { - "epoch": 0.4, - "learning_rate": 0.00023959590062917557, - "loss": 0.0223, + "epoch": 0.19, + "learning_rate": 0.00027181034352281153, + "loss": 0.0232, "step": 37250 }, { - "epoch": 0.4, - "learning_rate": 0.00023957968476357263, - "loss": 0.0217, + "epoch": 0.19, + "learning_rate": 0.0002718027758297975, + "loss": 0.0268, "step": 37260 }, { - "epoch": 0.4, - "learning_rate": 0.00023956346889796975, - "loss": 0.025, + "epoch": 0.19, + "learning_rate": 0.0002717952081367835, + "loss": 0.0252, "step": 37270 }, { - "epoch": 0.4, - "learning_rate": 0.00023954725303236684, - "loss": 0.1174, + "epoch": 0.19, + "learning_rate": 0.0002717876404437695, + "loss": 0.0229, "step": 37280 }, { - "epoch": 0.4, - "learning_rate": 0.00023953103716676396, - "loss": 0.0407, + "epoch": 0.19, + "learning_rate": 0.00027178007275075546, + "loss": 0.0231, "step": 37290 }, { - "epoch": 0.4, - "learning_rate": 0.00023951482130116103, - "loss": 0.0245, + "epoch": 0.19, + "learning_rate": 0.00027177250505774144, + "loss": 0.0274, "step": 37300 }, { - "epoch": 0.4, - "learning_rate": 0.00023949860543555812, - "loss": 0.0299, + "epoch": 0.19, + "learning_rate": 0.00027176493736472747, + "loss": 0.0264, "step": 37310 }, { - "epoch": 0.4, - "learning_rate": 0.00023948238956995522, - "loss": 0.0321, + "epoch": 0.19, + "learning_rate": 0.00027175736967171345, + "loss": 0.0235, "step": 37320 }, { - "epoch": 0.4, - "learning_rate": 0.00023946617370435233, - "loss": 0.0268, + "epoch": 0.19, + "learning_rate": 0.00027174980197869944, + "loss": 0.0239, "step": 37330 }, { - "epoch": 0.4, - "learning_rate": 0.0002394499578387494, - "loss": 0.0201, + "epoch": 0.19, + "learning_rate": 0.0002717422342856854, + "loss": 0.0247, "step": 37340 }, { - "epoch": 0.4, - "learning_rate": 0.0002394337419731465, - "loss": 0.0222, + "epoch": 0.19, + "learning_rate": 0.0002717346665926714, + "loss": 0.0207, "step": 37350 }, { - "epoch": 0.4, - "learning_rate": 0.0002394175261075436, - "loss": 0.0215, + "epoch": 0.19, + "learning_rate": 0.0002717270988996574, + "loss": 0.024, "step": 37360 }, { - "epoch": 0.4, - "learning_rate": 0.0002394013102419407, - "loss": 0.0193, + "epoch": 0.19, + "learning_rate": 0.0002717195312066434, + "loss": 0.023, "step": 37370 }, { - "epoch": 0.4, - "learning_rate": 0.00023938509437633777, + "epoch": 0.19, + "learning_rate": 0.0002717119635136294, "loss": 0.0235, "step": 37380 }, { - "epoch": 0.4, - "learning_rate": 0.00023936887851073486, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.0002717043958206154, + "loss": 0.0214, "step": 37390 }, { - "epoch": 0.4, - "learning_rate": 0.00023935266264513198, - "loss": 0.0294, + "epoch": 0.19, + "learning_rate": 0.00027169682812760136, + "loss": 0.0215, "step": 37400 }, { - "epoch": 0.4, - "learning_rate": 0.00023933644677952908, - "loss": 0.0462, + "epoch": 0.19, + "learning_rate": 0.00027168926043458734, + "loss": 0.0285, "step": 37410 }, { - "epoch": 0.4, - "learning_rate": 0.00023932023091392617, - "loss": 0.0237, + "epoch": 0.19, + "learning_rate": 0.0002716816927415733, + "loss": 0.0205, "step": 37420 }, { - "epoch": 0.4, - "learning_rate": 0.00023930401504832326, - "loss": 0.0236, + "epoch": 0.19, + "learning_rate": 0.00027167412504855936, + "loss": 0.0256, "step": 37430 }, { - "epoch": 0.4, - "learning_rate": 0.00023928779918272036, - "loss": 0.0269, + "epoch": 0.19, + "learning_rate": 0.00027166655735554534, + "loss": 0.0243, "step": 37440 }, { - "epoch": 0.4, - "learning_rate": 0.00023927158331711745, - "loss": 0.0191, + "epoch": 0.19, + "learning_rate": 0.0002716589896625313, + "loss": 0.0226, "step": 37450 }, { - "epoch": 0.4, - "learning_rate": 0.00023925536745151457, - "loss": 0.022, + "epoch": 0.19, + "learning_rate": 0.0002716514219695173, + "loss": 0.0223, "step": 37460 }, { - "epoch": 0.41, - "learning_rate": 0.00023923915158591163, - "loss": 0.0244, + "epoch": 0.19, + "learning_rate": 0.0002716438542765033, + "loss": 0.0222, "step": 37470 }, { - "epoch": 0.41, - "learning_rate": 0.00023922293572030873, - "loss": 0.0211, + "epoch": 0.19, + "learning_rate": 0.00027163628658348927, + "loss": 0.0239, "step": 37480 }, { - "epoch": 0.41, - "learning_rate": 0.00023920671985470582, - "loss": 0.0215, + "epoch": 0.19, + "learning_rate": 0.00027162871889047525, + "loss": 0.0225, "step": 37490 }, { - "epoch": 0.41, - "learning_rate": 0.00023919050398910294, - "loss": 0.0221, + "epoch": 0.19, + "learning_rate": 0.0002716211511974613, + "loss": 0.0236, "step": 37500 }, { - "epoch": 0.41, - "learning_rate": 0.0002391742881235, - "loss": 0.0211, + "epoch": 0.19, + "learning_rate": 0.00027161358350444726, + "loss": 0.0356, "step": 37510 }, { - "epoch": 0.41, - "learning_rate": 0.0002391580722578971, - "loss": 0.0239, + "epoch": 0.19, + "learning_rate": 0.00027160601581143325, + "loss": 0.0258, "step": 37520 }, { - "epoch": 0.41, - "learning_rate": 0.00023914185639229422, - "loss": 0.0172, + "epoch": 0.19, + "learning_rate": 0.00027159844811841923, + "loss": 0.0573, "step": 37530 }, { - "epoch": 0.41, - "learning_rate": 0.0002391256405266913, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.0002715908804254052, + "loss": 0.0224, "step": 37540 }, { - "epoch": 0.41, - "learning_rate": 0.00023910942466108838, - "loss": 0.0186, + "epoch": 0.19, + "learning_rate": 0.0002715833127323912, + "loss": 0.029, "step": 37550 }, { - "epoch": 0.41, - "learning_rate": 0.00023909320879548547, - "loss": 0.0206, + "epoch": 0.19, + "learning_rate": 0.0002715757450393772, + "loss": 0.0239, "step": 37560 }, { - "epoch": 0.41, - "learning_rate": 0.0002390769929298826, - "loss": 0.0233, + "epoch": 0.19, + "learning_rate": 0.0002715681773463632, + "loss": 0.0277, "step": 37570 }, { - "epoch": 0.41, - "learning_rate": 0.00023906077706427968, - "loss": 0.0221, + "epoch": 0.19, + "learning_rate": 0.0002715606096533492, + "loss": 0.0256, "step": 37580 }, { - "epoch": 0.41, - "learning_rate": 0.00023904456119867675, - "loss": 0.0168, + "epoch": 0.19, + "learning_rate": 0.00027155304196033517, + "loss": 0.0228, "step": 37590 }, { - "epoch": 0.41, - "learning_rate": 0.00023902834533307387, - "loss": 0.0237, + "epoch": 0.19, + "learning_rate": 0.00027154547426732115, + "loss": 0.0249, "step": 37600 }, { - "epoch": 0.41, - "learning_rate": 0.00023901212946747096, - "loss": 0.0144, + "epoch": 0.19, + "learning_rate": 0.00027153790657430713, + "loss": 0.0267, "step": 37610 }, { - "epoch": 0.41, - "learning_rate": 0.00023899591360186805, - "loss": 0.022, + "epoch": 0.19, + "learning_rate": 0.0002715303388812931, + "loss": 0.0274, "step": 37620 }, { - "epoch": 0.41, - "learning_rate": 0.00023897969773626512, - "loss": 0.0202, + "epoch": 0.19, + "learning_rate": 0.00027152277118827915, + "loss": 0.0216, "step": 37630 }, { - "epoch": 0.41, - "learning_rate": 0.00023896348187066224, - "loss": 0.0218, + "epoch": 0.19, + "learning_rate": 0.00027151520349526513, + "loss": 0.0267, "step": 37640 }, { - "epoch": 0.41, - "learning_rate": 0.00023894726600505933, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.0002715076358022511, + "loss": 0.0227, "step": 37650 }, { - "epoch": 0.41, - "learning_rate": 0.00023893105013945645, - "loss": 0.0209, + "epoch": 0.19, + "learning_rate": 0.0002715000681092371, + "loss": 0.0254, "step": 37660 }, { - "epoch": 0.41, - "learning_rate": 0.00023891483427385352, - "loss": 0.0199, + "epoch": 0.19, + "learning_rate": 0.0002714925004162231, + "loss": 0.0251, "step": 37670 }, { - "epoch": 0.41, - "learning_rate": 0.0002388986184082506, - "loss": 0.0183, + "epoch": 0.19, + "learning_rate": 0.00027148493272320906, + "loss": 0.0245, "step": 37680 }, { - "epoch": 0.41, - "learning_rate": 0.0002388824025426477, - "loss": 0.0211, + "epoch": 0.19, + "learning_rate": 0.0002714773650301951, + "loss": 0.0204, "step": 37690 }, { - "epoch": 0.41, - "learning_rate": 0.00023886618667704482, - "loss": 0.0228, + "epoch": 0.19, + "learning_rate": 0.0002714697973371811, + "loss": 0.0244, "step": 37700 }, { - "epoch": 0.41, - "learning_rate": 0.00023884997081144189, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.00027146222964416706, + "loss": 0.0219, "step": 37710 }, { - "epoch": 0.41, - "learning_rate": 0.00023883375494583898, - "loss": 0.0198, + "epoch": 0.19, + "learning_rate": 0.00027145466195115304, + "loss": 0.0314, "step": 37720 }, { - "epoch": 0.41, - "learning_rate": 0.0002388175390802361, - "loss": 0.0211, + "epoch": 0.19, + "learning_rate": 0.000271447094258139, + "loss": 0.0242, "step": 37730 }, { - "epoch": 0.41, - "learning_rate": 0.0002388013232146332, - "loss": 0.0256, + "epoch": 0.19, + "learning_rate": 0.000271439526565125, + "loss": 0.0268, "step": 37740 }, { - "epoch": 0.41, - "learning_rate": 0.00023878510734903026, - "loss": 0.0202, + "epoch": 0.19, + "learning_rate": 0.00027143195887211104, + "loss": 0.0227, "step": 37750 }, { - "epoch": 0.41, - "learning_rate": 0.00023876889148342735, - "loss": 0.0174, + "epoch": 0.19, + "learning_rate": 0.000271424391179097, + "loss": 0.0201, "step": 37760 }, { - "epoch": 0.41, - "learning_rate": 0.00023875267561782447, - "loss": 0.0242, + "epoch": 0.19, + "learning_rate": 0.000271416823486083, + "loss": 0.0246, "step": 37770 }, { - "epoch": 0.41, - "learning_rate": 0.00023873645975222156, - "loss": 0.0234, + "epoch": 0.19, + "learning_rate": 0.000271409255793069, + "loss": 0.0236, "step": 37780 }, { - "epoch": 0.41, - "learning_rate": 0.00023872024388661863, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.00027140168810005496, + "loss": 0.0226, "step": 37790 }, { - "epoch": 0.41, - "learning_rate": 0.00023870402802101575, - "loss": 0.0211, + "epoch": 0.19, + "learning_rate": 0.00027139412040704094, + "loss": 0.0216, "step": 37800 }, { - "epoch": 0.41, - "learning_rate": 0.00023868781215541284, - "loss": 0.0225, + "epoch": 0.19, + "learning_rate": 0.0002713865527140269, + "loss": 0.0255, "step": 37810 }, { - "epoch": 0.41, - "learning_rate": 0.00023867159628980993, - "loss": 0.0218, + "epoch": 0.19, + "learning_rate": 0.00027137898502101296, + "loss": 0.0256, "step": 37820 }, { - "epoch": 0.41, - "learning_rate": 0.000238655380424207, - "loss": 0.0211, + "epoch": 0.19, + "learning_rate": 0.00027137141732799894, + "loss": 0.0245, "step": 37830 }, { - "epoch": 0.41, - "learning_rate": 0.00023863916455860412, - "loss": 0.0178, + "epoch": 0.19, + "learning_rate": 0.0002713638496349849, + "loss": 0.0247, "step": 37840 }, { - "epoch": 0.41, - "learning_rate": 0.0002386229486930012, - "loss": 0.0214, + "epoch": 0.19, + "learning_rate": 0.0002713562819419709, + "loss": 0.0286, "step": 37850 }, { - "epoch": 0.41, - "learning_rate": 0.0002386067328273983, - "loss": 0.0209, + "epoch": 0.19, + "learning_rate": 0.0002713487142489569, + "loss": 0.0241, "step": 37860 }, { - "epoch": 0.41, - "learning_rate": 0.0002385905169617954, - "loss": 0.0224, + "epoch": 0.19, + "learning_rate": 0.00027134114655594287, + "loss": 0.0217, "step": 37870 }, { - "epoch": 0.41, - "learning_rate": 0.0002385743010961925, - "loss": 0.0331, + "epoch": 0.19, + "learning_rate": 0.0002713335788629289, + "loss": 0.0241, "step": 37880 }, { - "epoch": 0.41, - "learning_rate": 0.00023855808523058958, - "loss": 0.0294, + "epoch": 0.19, + "learning_rate": 0.0002713260111699149, + "loss": 0.0218, "step": 37890 }, { - "epoch": 0.41, - "learning_rate": 0.0002385418693649867, - "loss": 0.0195, + "epoch": 0.19, + "learning_rate": 0.00027131844347690087, + "loss": 0.0275, "step": 37900 }, { - "epoch": 0.41, - "learning_rate": 0.00023852565349938377, - "loss": 0.0237, + "epoch": 0.19, + "learning_rate": 0.00027131087578388685, + "loss": 0.0215, "step": 37910 }, { - "epoch": 0.41, - "learning_rate": 0.00023850943763378086, - "loss": 0.0203, + "epoch": 0.19, + "learning_rate": 0.00027130330809087283, + "loss": 0.0254, "step": 37920 }, { - "epoch": 0.41, - "learning_rate": 0.00023849322176817795, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.0002712957403978588, + "loss": 0.0232, "step": 37930 }, { - "epoch": 0.41, - "learning_rate": 0.00023847700590257507, - "loss": 0.0179, + "epoch": 0.19, + "learning_rate": 0.00027128817270484485, + "loss": 0.024, "step": 37940 }, { - "epoch": 0.41, - "learning_rate": 0.00023846079003697214, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.00027128060501183083, + "loss": 0.0253, "step": 37950 }, { - "epoch": 0.41, - "learning_rate": 0.00023844457417136923, - "loss": 0.0196, + "epoch": 0.19, + "learning_rate": 0.0002712730373188168, + "loss": 0.0263, "step": 37960 }, { - "epoch": 0.41, - "learning_rate": 0.00023842835830576635, - "loss": 0.0184, + "epoch": 0.19, + "learning_rate": 0.0002712654696258028, + "loss": 0.0271, "step": 37970 }, { - "epoch": 0.41, - "learning_rate": 0.00023841214244016344, - "loss": 0.0213, + "epoch": 0.19, + "learning_rate": 0.00027125790193278877, + "loss": 0.028, "step": 37980 }, { - "epoch": 0.41, - "learning_rate": 0.0002383959265745605, - "loss": 0.0268, + "epoch": 0.19, + "learning_rate": 0.00027125033423977475, + "loss": 0.0321, "step": 37990 }, { - "epoch": 0.41, - "learning_rate": 0.0002383797107089576, - "loss": 0.0197, + "epoch": 0.19, + "learning_rate": 0.00027124276654676073, + "loss": 0.0245, "step": 38000 }, { - "epoch": 0.41, - "eval_cer": 0.9215773134805442, - "eval_loss": 0.015152968466281891, - "eval_runtime": 121.8268, - "eval_samples_per_second": 16.417, - "eval_steps_per_second": 4.104, + "epoch": 0.19, + "eval_cer": 0.9144780190721654, + "eval_loss": 0.018160896375775337, + "eval_runtime": 117.0624, + "eval_samples_per_second": 17.085, + "eval_steps_per_second": 4.271, "step": 38000 }, { - "epoch": 0.41, - "learning_rate": 0.00023836349484335472, - "loss": 0.0217, + "epoch": 0.19, + "learning_rate": 0.00027123519885374677, + "loss": 0.0257, "step": 38010 }, { - "epoch": 0.41, - "learning_rate": 0.00023834727897775182, - "loss": 0.0196, + "epoch": 0.19, + "learning_rate": 0.00027122763116073275, + "loss": 0.0244, "step": 38020 }, { - "epoch": 0.41, - "learning_rate": 0.00023833106311214888, - "loss": 0.0226, + "epoch": 0.19, + "learning_rate": 0.00027122006346771873, + "loss": 0.0204, "step": 38030 }, { - "epoch": 0.41, - "learning_rate": 0.000238314847246546, - "loss": 0.0194, + "epoch": 0.19, + "learning_rate": 0.0002712124957747047, + "loss": 0.0242, "step": 38040 }, { - "epoch": 0.41, - "learning_rate": 0.0002382986313809431, - "loss": 0.0182, + "epoch": 0.19, + "learning_rate": 0.0002712049280816907, + "loss": 0.0324, "step": 38050 }, { - "epoch": 0.41, - "learning_rate": 0.0002382824155153402, - "loss": 0.0312, + "epoch": 0.19, + "learning_rate": 0.0002711973603886767, + "loss": 0.0269, "step": 38060 }, { - "epoch": 0.41, - "learning_rate": 0.00023826619964973728, - "loss": 0.0229, + "epoch": 0.19, + "learning_rate": 0.0002711897926956627, + "loss": 0.0237, "step": 38070 }, { - "epoch": 0.41, - "learning_rate": 0.00023824998378413437, - "loss": 0.0219, + "epoch": 0.19, + "learning_rate": 0.0002711822250026487, + "loss": 0.0293, "step": 38080 }, { - "epoch": 0.41, - "learning_rate": 0.00023823376791853146, - "loss": 0.0211, + "epoch": 0.19, + "learning_rate": 0.0002711746573096347, + "loss": 0.0288, "step": 38090 }, { - "epoch": 0.41, - "learning_rate": 0.00023821755205292858, - "loss": 0.0189, + "epoch": 0.19, + "learning_rate": 0.00027116708961662066, + "loss": 0.0234, "step": 38100 }, { - "epoch": 0.41, - "learning_rate": 0.00023820133618732565, - "loss": 0.021, + "epoch": 0.19, + "learning_rate": 0.00027115952192360664, + "loss": 0.0216, "step": 38110 }, { - "epoch": 0.41, - "learning_rate": 0.00023818512032172274, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.0002711519542305926, + "loss": 0.0203, "step": 38120 }, { - "epoch": 0.41, - "learning_rate": 0.00023816890445611984, - "loss": 0.0245, + "epoch": 0.19, + "learning_rate": 0.0002711443865375786, + "loss": 0.0267, "step": 38130 }, { - "epoch": 0.41, - "learning_rate": 0.00023815268859051696, - "loss": 0.0225, + "epoch": 0.19, + "learning_rate": 0.00027113681884456464, + "loss": 0.0253, "step": 38140 }, { - "epoch": 0.41, - "learning_rate": 0.00023813647272491405, - "loss": 0.0223, + "epoch": 0.19, + "learning_rate": 0.0002711292511515506, + "loss": 0.0211, "step": 38150 }, { - "epoch": 0.41, - "learning_rate": 0.00023812025685931111, - "loss": 0.0241, + "epoch": 0.19, + "learning_rate": 0.0002711216834585366, + "loss": 0.0251, "step": 38160 }, { - "epoch": 0.41, - "learning_rate": 0.00023810404099370823, - "loss": 0.0209, + "epoch": 0.19, + "learning_rate": 0.0002711141157655226, + "loss": 0.0225, "step": 38170 }, { - "epoch": 0.41, - "learning_rate": 0.00023808782512810533, - "loss": 0.0235, + "epoch": 0.19, + "learning_rate": 0.00027110654807250856, + "loss": 0.024, "step": 38180 }, { - "epoch": 0.41, - "learning_rate": 0.00023807160926250242, - "loss": 0.023, + "epoch": 0.19, + "learning_rate": 0.00027109898037949454, + "loss": 0.0287, "step": 38190 }, { - "epoch": 0.41, - "learning_rate": 0.00023805539339689948, - "loss": 0.021, + "epoch": 0.19, + "learning_rate": 0.0002710914126864806, + "loss": 0.0216, "step": 38200 }, { - "epoch": 0.41, - "learning_rate": 0.0002380391775312966, - "loss": 0.0235, + "epoch": 0.19, + "learning_rate": 0.00027108384499346656, + "loss": 0.0233, "step": 38210 }, { - "epoch": 0.41, - "learning_rate": 0.0002380229616656937, - "loss": 0.0196, + "epoch": 0.19, + "learning_rate": 0.00027107627730045254, + "loss": 0.0227, "step": 38220 }, { - "epoch": 0.41, - "learning_rate": 0.0002380067458000908, - "loss": 0.0236, + "epoch": 0.19, + "learning_rate": 0.0002710687096074385, + "loss": 0.0231, "step": 38230 }, { - "epoch": 0.41, - "learning_rate": 0.00023799052993448788, - "loss": 0.0208, + "epoch": 0.19, + "learning_rate": 0.0002710611419144245, + "loss": 0.0255, "step": 38240 }, { - "epoch": 0.41, - "learning_rate": 0.00023797431406888498, + "epoch": 0.19, + "learning_rate": 0.0002710535742214105, "loss": 0.0211, "step": 38250 }, { - "epoch": 0.41, - "learning_rate": 0.00023795809820328207, - "loss": 0.021, + "epoch": 0.19, + "learning_rate": 0.0002710460065283965, + "loss": 0.0203, "step": 38260 }, { - "epoch": 0.41, - "learning_rate": 0.0002379418823376792, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.0002710384388353825, + "loss": 0.0245, "step": 38270 }, { - "epoch": 0.41, - "learning_rate": 0.00023792566647207625, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.0002710308711423685, + "loss": 0.025, "step": 38280 }, { - "epoch": 0.41, - "learning_rate": 0.00023790945060647335, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.00027102330344935447, + "loss": 0.0281, "step": 38290 }, { - "epoch": 0.41, - "learning_rate": 0.00023789323474087047, - "loss": 0.0199, + "epoch": 0.19, + "learning_rate": 0.00027101573575634045, + "loss": 0.021, "step": 38300 }, { - "epoch": 0.41, - "learning_rate": 0.00023787701887526756, - "loss": 0.0231, + "epoch": 0.19, + "learning_rate": 0.00027100816806332643, + "loss": 0.023, "step": 38310 }, { - "epoch": 0.41, - "learning_rate": 0.00023786080300966462, - "loss": 0.0208, + "epoch": 0.19, + "learning_rate": 0.0002710006003703124, + "loss": 0.0235, "step": 38320 }, { - "epoch": 0.41, - "learning_rate": 0.00023784458714406172, - "loss": 0.0179, + "epoch": 0.19, + "learning_rate": 0.00027099303267729845, + "loss": 0.0246, "step": 38330 }, { - "epoch": 0.41, - "learning_rate": 0.00023782837127845884, - "loss": 0.0203, + "epoch": 0.19, + "learning_rate": 0.0002709854649842844, + "loss": 0.0232, "step": 38340 }, { - "epoch": 0.41, - "learning_rate": 0.00023781215541285593, - "loss": 0.0209, + "epoch": 0.19, + "learning_rate": 0.00027097789729127036, + "loss": 0.0277, "step": 38350 }, { - "epoch": 0.41, - "learning_rate": 0.000237795939547253, - "loss": 0.022, + "epoch": 0.19, + "learning_rate": 0.00027097032959825634, + "loss": 0.0221, "step": 38360 }, { - "epoch": 0.41, - "learning_rate": 0.00023777972368165012, - "loss": 0.0221, + "epoch": 0.19, + "learning_rate": 0.0002709627619052424, + "loss": 0.0253, "step": 38370 }, { - "epoch": 0.41, - "learning_rate": 0.0002377635078160472, - "loss": 0.0196, + "epoch": 0.19, + "learning_rate": 0.00027095519421222835, + "loss": 0.0246, "step": 38380 }, { - "epoch": 0.42, - "learning_rate": 0.0002377472919504443, - "loss": 0.0163, + "epoch": 0.19, + "learning_rate": 0.00027094762651921434, + "loss": 0.0213, "step": 38390 }, { - "epoch": 0.42, - "learning_rate": 0.00023773107608484137, - "loss": 0.0232, + "epoch": 0.19, + "learning_rate": 0.0002709400588262003, + "loss": 0.0234, "step": 38400 }, { - "epoch": 0.42, - "learning_rate": 0.0002377148602192385, - "loss": 0.021, + "epoch": 0.19, + "learning_rate": 0.0002709324911331863, + "loss": 0.0238, "step": 38410 }, { - "epoch": 0.42, - "learning_rate": 0.00023769864435363558, - "loss": 0.0195, + "epoch": 0.19, + "learning_rate": 0.0002709249234401723, + "loss": 0.0233, "step": 38420 }, { - "epoch": 0.42, - "learning_rate": 0.00023768242848803267, - "loss": 0.0216, + "epoch": 0.19, + "learning_rate": 0.0002709173557471583, + "loss": 0.0229, "step": 38430 }, { - "epoch": 0.42, - "learning_rate": 0.00023766621262242977, - "loss": 0.0225, + "epoch": 0.19, + "learning_rate": 0.0002709097880541443, + "loss": 0.0246, "step": 38440 }, { - "epoch": 0.42, - "learning_rate": 0.00023764999675682686, - "loss": 0.0279, + "epoch": 0.19, + "learning_rate": 0.0002709022203611303, + "loss": 0.0203, "step": 38450 }, { - "epoch": 0.42, - "learning_rate": 0.00023763378089122395, - "loss": 0.025, + "epoch": 0.19, + "learning_rate": 0.00027089465266811626, + "loss": 0.0255, "step": 38460 }, { - "epoch": 0.42, - "learning_rate": 0.00023761756502562107, - "loss": 0.0254, + "epoch": 0.19, + "learning_rate": 0.00027088708497510224, + "loss": 0.0275, "step": 38470 }, { - "epoch": 0.42, - "learning_rate": 0.00023760134916001814, - "loss": 0.0207, + "epoch": 0.19, + "learning_rate": 0.0002708795172820882, + "loss": 0.0227, "step": 38480 }, { - "epoch": 0.42, - "learning_rate": 0.00023758513329441523, - "loss": 0.0201, + "epoch": 0.19, + "learning_rate": 0.00027087194958907426, + "loss": 0.0208, "step": 38490 }, { - "epoch": 0.42, - "learning_rate": 0.00023756891742881232, - "loss": 0.0191, + "epoch": 0.19, + "learning_rate": 0.00027086438189606024, + "loss": 0.027, "step": 38500 }, { - "epoch": 0.42, - "learning_rate": 0.00023755270156320944, - "loss": 0.0225, + "epoch": 0.19, + "learning_rate": 0.0002708568142030462, + "loss": 0.0239, "step": 38510 }, { - "epoch": 0.42, - "learning_rate": 0.0002375364856976065, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.0002708492465100322, + "loss": 0.0232, "step": 38520 }, { - "epoch": 0.42, - "learning_rate": 0.0002375202698320036, - "loss": 0.0216, + "epoch": 0.19, + "learning_rate": 0.0002708416788170182, + "loss": 0.0218, "step": 38530 }, { - "epoch": 0.42, - "learning_rate": 0.00023750405396640072, - "loss": 0.0208, + "epoch": 0.19, + "learning_rate": 0.00027083411112400417, + "loss": 0.023, "step": 38540 }, { - "epoch": 0.42, - "learning_rate": 0.0002374878381007978, - "loss": 0.0179, + "epoch": 0.19, + "learning_rate": 0.00027082654343099015, + "loss": 0.0222, "step": 38550 }, { - "epoch": 0.42, - "learning_rate": 0.00023747162223519488, - "loss": 0.0179, + "epoch": 0.19, + "learning_rate": 0.0002708189757379762, + "loss": 0.024, "step": 38560 }, { - "epoch": 0.42, - "learning_rate": 0.00023745540636959197, - "loss": 0.0233, + "epoch": 0.19, + "learning_rate": 0.00027081140804496216, + "loss": 0.026, "step": 38570 }, { - "epoch": 0.42, - "learning_rate": 0.0002374391905039891, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.00027080384035194815, + "loss": 0.0221, "step": 38580 }, { - "epoch": 0.42, - "learning_rate": 0.00023742297463838618, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.00027079627265893413, + "loss": 0.0228, "step": 38590 }, { - "epoch": 0.42, - "learning_rate": 0.00023740675877278325, - "loss": 0.0243, + "epoch": 0.19, + "learning_rate": 0.0002707887049659201, + "loss": 0.0223, "step": 38600 }, { - "epoch": 0.42, - "learning_rate": 0.00023739054290718037, - "loss": 0.0169, + "epoch": 0.19, + "learning_rate": 0.0002707811372729061, + "loss": 0.0238, "step": 38610 }, { - "epoch": 0.42, - "learning_rate": 0.00023737432704157746, - "loss": 0.0207, + "epoch": 0.19, + "learning_rate": 0.0002707735695798921, + "loss": 0.0237, "step": 38620 }, { - "epoch": 0.42, - "learning_rate": 0.00023735811117597455, - "loss": 0.0208, + "epoch": 0.19, + "learning_rate": 0.0002707660018868781, + "loss": 0.0234, "step": 38630 }, { - "epoch": 0.42, - "learning_rate": 0.00023734189531037162, - "loss": 0.0176, + "epoch": 0.19, + "learning_rate": 0.0002707584341938641, + "loss": 0.0358, "step": 38640 }, { - "epoch": 0.42, - "learning_rate": 0.00023732567944476874, - "loss": 0.0203, + "epoch": 0.19, + "learning_rate": 0.00027075086650085007, + "loss": 0.023, "step": 38650 }, { - "epoch": 0.42, - "learning_rate": 0.00023730946357916583, - "loss": 0.0159, + "epoch": 0.2, + "learning_rate": 0.00027074329880783605, + "loss": 0.0247, "step": 38660 }, { - "epoch": 0.42, - "learning_rate": 0.00023729324771356295, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.00027073573111482203, + "loss": 0.023, "step": 38670 }, { - "epoch": 0.42, - "learning_rate": 0.00023727703184796002, - "loss": 0.0217, + "epoch": 0.2, + "learning_rate": 0.00027072816342180807, + "loss": 0.0261, "step": 38680 }, { - "epoch": 0.42, - "learning_rate": 0.0002372608159823571, - "loss": 0.0208, + "epoch": 0.2, + "learning_rate": 0.00027072059572879405, + "loss": 0.0218, "step": 38690 }, { - "epoch": 0.42, - "learning_rate": 0.0002372446001167542, - "loss": 0.0206, + "epoch": 0.2, + "learning_rate": 0.00027071302803578003, + "loss": 0.0213, "step": 38700 }, { - "epoch": 0.42, - "learning_rate": 0.00023722838425115132, - "loss": 0.0202, + "epoch": 0.2, + "learning_rate": 0.000270705460342766, + "loss": 0.0222, "step": 38710 }, { - "epoch": 0.42, - "learning_rate": 0.0002372121683855484, - "loss": 0.0187, + "epoch": 0.2, + "learning_rate": 0.000270697892649752, + "loss": 0.0201, "step": 38720 }, { - "epoch": 0.42, - "learning_rate": 0.00023719595251994548, - "loss": 0.0183, + "epoch": 0.2, + "learning_rate": 0.000270690324956738, + "loss": 0.0257, "step": 38730 }, { - "epoch": 0.42, - "learning_rate": 0.0002371797366543426, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.00027068275726372396, + "loss": 0.0273, "step": 38740 }, { - "epoch": 0.42, - "learning_rate": 0.0002371635207887397, - "loss": 0.0192, + "epoch": 0.2, + "learning_rate": 0.00027067518957071, + "loss": 0.0246, "step": 38750 }, { - "epoch": 0.42, - "learning_rate": 0.00023714730492313676, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.000270667621877696, + "loss": 0.0204, "step": 38760 }, { - "epoch": 0.42, - "learning_rate": 0.00023713108905753385, - "loss": 0.0188, + "epoch": 0.2, + "learning_rate": 0.00027066005418468196, + "loss": 0.0256, "step": 38770 }, { - "epoch": 0.42, - "learning_rate": 0.00023711487319193097, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.00027065248649166794, + "loss": 0.0281, "step": 38780 }, { - "epoch": 0.42, - "learning_rate": 0.00023709865732632807, - "loss": 0.0193, + "epoch": 0.2, + "learning_rate": 0.0002706449187986539, + "loss": 0.025, "step": 38790 }, { - "epoch": 0.42, - "learning_rate": 0.00023708244146072513, - "loss": 0.0226, + "epoch": 0.2, + "learning_rate": 0.0002706373511056399, + "loss": 0.0248, "step": 38800 }, { - "epoch": 0.42, - "learning_rate": 0.00023706622559512225, - "loss": 0.0213, + "epoch": 0.2, + "learning_rate": 0.00027062978341262594, + "loss": 0.021, "step": 38810 }, { - "epoch": 0.42, - "learning_rate": 0.00023705000972951934, - "loss": 0.0194, + "epoch": 0.2, + "learning_rate": 0.0002706222157196119, + "loss": 0.022, "step": 38820 }, { - "epoch": 0.42, - "learning_rate": 0.00023703379386391644, - "loss": 0.0186, + "epoch": 0.2, + "learning_rate": 0.0002706146480265979, + "loss": 0.0228, "step": 38830 }, { - "epoch": 0.42, - "learning_rate": 0.0002370175779983135, - "loss": 0.0243, + "epoch": 0.2, + "learning_rate": 0.0002706070803335839, + "loss": 0.025, "step": 38840 }, { - "epoch": 0.42, - "learning_rate": 0.00023700136213271062, - "loss": 0.0216, + "epoch": 0.2, + "learning_rate": 0.00027059951264056986, + "loss": 0.0249, "step": 38850 }, { - "epoch": 0.42, - "learning_rate": 0.00023698514626710771, - "loss": 0.0252, + "epoch": 0.2, + "learning_rate": 0.00027059194494755584, + "loss": 0.0241, "step": 38860 }, { - "epoch": 0.42, - "learning_rate": 0.0002369689304015048, - "loss": 0.0192, + "epoch": 0.2, + "learning_rate": 0.0002705843772545418, + "loss": 0.0215, "step": 38870 }, { - "epoch": 0.42, - "learning_rate": 0.00023695271453590193, - "loss": 0.0432, + "epoch": 0.2, + "learning_rate": 0.00027057680956152786, + "loss": 0.0224, "step": 38880 }, { - "epoch": 0.42, - "learning_rate": 0.000236936498670299, - "loss": 0.023, + "epoch": 0.2, + "learning_rate": 0.00027056924186851384, + "loss": 0.0258, "step": 38890 }, { - "epoch": 0.42, - "learning_rate": 0.00023692028280469609, - "loss": 0.0287, + "epoch": 0.2, + "learning_rate": 0.0002705616741754998, + "loss": 0.0223, "step": 38900 }, { - "epoch": 0.42, - "learning_rate": 0.0002369040669390932, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.0002705541064824858, + "loss": 0.0228, "step": 38910 }, { - "epoch": 0.42, - "learning_rate": 0.0002368878510734903, - "loss": 0.0276, + "epoch": 0.2, + "learning_rate": 0.0002705465387894718, + "loss": 0.0234, "step": 38920 }, { - "epoch": 0.42, - "learning_rate": 0.00023687163520788736, - "loss": 0.0228, + "epoch": 0.2, + "learning_rate": 0.00027053897109645777, + "loss": 0.0203, "step": 38930 }, { - "epoch": 0.42, - "learning_rate": 0.00023685541934228446, - "loss": 0.0212, + "epoch": 0.2, + "learning_rate": 0.0002705314034034438, + "loss": 0.0235, "step": 38940 }, { - "epoch": 0.42, - "learning_rate": 0.00023683920347668158, - "loss": 0.0209, + "epoch": 0.2, + "learning_rate": 0.0002705238357104298, + "loss": 0.0233, "step": 38950 }, { - "epoch": 0.42, - "learning_rate": 0.00023682298761107867, - "loss": 0.0226, + "epoch": 0.2, + "learning_rate": 0.00027051626801741577, + "loss": 0.0212, "step": 38960 }, { - "epoch": 0.42, - "learning_rate": 0.00023680677174547573, - "loss": 0.0214, + "epoch": 0.2, + "learning_rate": 0.00027050870032440175, + "loss": 0.024, "step": 38970 }, { - "epoch": 0.42, - "learning_rate": 0.00023679055587987285, - "loss": 0.022, + "epoch": 0.2, + "learning_rate": 0.00027050113263138773, + "loss": 0.0266, "step": 38980 }, { - "epoch": 0.42, - "learning_rate": 0.00023677434001426995, - "loss": 0.0209, + "epoch": 0.2, + "learning_rate": 0.0002704935649383737, + "loss": 0.0206, "step": 38990 }, { - "epoch": 0.42, - "learning_rate": 0.00023675812414866704, - "loss": 0.0205, + "epoch": 0.2, + "learning_rate": 0.00027048599724535975, + "loss": 0.0195, "step": 39000 }, { - "epoch": 0.42, - "eval_cer": 0.9215512553918529, - "eval_loss": 0.015001688152551651, - "eval_runtime": 121.88, - "eval_samples_per_second": 16.41, - "eval_steps_per_second": 4.102, + "epoch": 0.2, + "eval_cer": 0.9144702559031622, + "eval_loss": 0.017209572717547417, + "eval_runtime": 117.1365, + "eval_samples_per_second": 17.074, + "eval_steps_per_second": 4.269, "step": 39000 }, { - "epoch": 0.42, - "learning_rate": 0.0002367419082830641, - "loss": 0.023, + "epoch": 0.2, + "learning_rate": 0.00027047842955234573, + "loss": 0.0312, "step": 39010 }, { - "epoch": 0.42, - "learning_rate": 0.00023672569241746123, - "loss": 0.0193, + "epoch": 0.2, + "learning_rate": 0.0002704708618593317, + "loss": 0.0205, "step": 39020 }, { - "epoch": 0.42, - "learning_rate": 0.00023670947655185832, - "loss": 0.0212, + "epoch": 0.2, + "learning_rate": 0.0002704632941663177, + "loss": 0.0229, "step": 39030 }, { - "epoch": 0.42, - "learning_rate": 0.00023669326068625544, - "loss": 0.0204, + "epoch": 0.2, + "learning_rate": 0.00027045572647330367, + "loss": 0.0261, "step": 39040 }, { - "epoch": 0.42, - "learning_rate": 0.0002366770448206525, - "loss": 0.0246, + "epoch": 0.2, + "learning_rate": 0.00027044815878028965, + "loss": 0.0239, "step": 39050 }, { - "epoch": 0.42, - "learning_rate": 0.0002366608289550496, - "loss": 0.0227, + "epoch": 0.2, + "learning_rate": 0.00027044059108727563, + "loss": 0.0226, "step": 39060 }, { - "epoch": 0.42, - "learning_rate": 0.0002366446130894467, - "loss": 0.0311, + "epoch": 0.2, + "learning_rate": 0.00027043302339426167, + "loss": 0.02, "step": 39070 }, { - "epoch": 0.42, - "learning_rate": 0.0002366283972238438, - "loss": 0.0237, + "epoch": 0.2, + "learning_rate": 0.00027042545570124765, + "loss": 0.0231, "step": 39080 }, { - "epoch": 0.42, - "learning_rate": 0.00023661218135824087, - "loss": 0.0214, + "epoch": 0.2, + "learning_rate": 0.00027041788800823363, + "loss": 0.0229, "step": 39090 }, { - "epoch": 0.42, - "learning_rate": 0.00023659596549263797, - "loss": 0.0207, + "epoch": 0.2, + "learning_rate": 0.0002704103203152196, + "loss": 0.0216, "step": 39100 }, { - "epoch": 0.42, - "learning_rate": 0.0002365797496270351, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.0002704027526222056, + "loss": 0.0231, "step": 39110 }, { - "epoch": 0.42, - "learning_rate": 0.00023656353376143218, - "loss": 0.0235, + "epoch": 0.2, + "learning_rate": 0.0002703951849291916, + "loss": 0.0219, "step": 39120 }, { - "epoch": 0.42, - "learning_rate": 0.00023654731789582925, - "loss": 0.0217, + "epoch": 0.2, + "learning_rate": 0.0002703876172361776, + "loss": 0.0231, "step": 39130 }, { - "epoch": 0.42, - "learning_rate": 0.00023653110203022634, - "loss": 0.0222, + "epoch": 0.2, + "learning_rate": 0.0002703800495431636, + "loss": 0.0235, "step": 39140 }, { - "epoch": 0.42, - "learning_rate": 0.00023651488616462346, - "loss": 0.0196, + "epoch": 0.2, + "learning_rate": 0.0002703724818501496, + "loss": 0.0223, "step": 39150 }, { - "epoch": 0.42, - "learning_rate": 0.00023649867029902055, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.00027036491415713556, + "loss": 0.0233, "step": 39160 }, { - "epoch": 0.42, - "learning_rate": 0.00023648245443341762, - "loss": 0.0188, + "epoch": 0.2, + "learning_rate": 0.00027035734646412154, + "loss": 0.0252, "step": 39170 }, { - "epoch": 0.42, - "learning_rate": 0.00023646623856781474, - "loss": 0.0175, + "epoch": 0.2, + "learning_rate": 0.0002703497787711075, + "loss": 0.0246, "step": 39180 }, { - "epoch": 0.42, - "learning_rate": 0.00023645002270221183, - "loss": 0.0186, + "epoch": 0.2, + "learning_rate": 0.00027034221107809356, + "loss": 0.0284, "step": 39190 }, { - "epoch": 0.42, - "learning_rate": 0.00023643380683660892, - "loss": 0.0216, + "epoch": 0.2, + "learning_rate": 0.00027033464338507954, + "loss": 0.0259, "step": 39200 }, { - "epoch": 0.42, - "learning_rate": 0.000236417590971006, - "loss": 0.0211, + "epoch": 0.2, + "learning_rate": 0.0002703270756920655, + "loss": 0.0266, "step": 39210 }, { - "epoch": 0.42, - "learning_rate": 0.0002364013751054031, - "loss": 0.0211, + "epoch": 0.2, + "learning_rate": 0.0002703195079990515, + "loss": 0.0246, "step": 39220 }, { - "epoch": 0.42, - "learning_rate": 0.0002363851592398002, - "loss": 0.0213, + "epoch": 0.2, + "learning_rate": 0.0002703119403060375, + "loss": 0.0243, "step": 39230 }, { - "epoch": 0.42, - "learning_rate": 0.0002363689433741973, - "loss": 0.0174, + "epoch": 0.2, + "learning_rate": 0.00027030437261302346, + "loss": 0.024, "step": 39240 }, { - "epoch": 0.42, - "learning_rate": 0.00023635272750859439, - "loss": 0.0237, + "epoch": 0.2, + "learning_rate": 0.00027029680492000944, + "loss": 0.021, "step": 39250 }, { - "epoch": 0.42, - "learning_rate": 0.00023633651164299148, - "loss": 0.0222, + "epoch": 0.2, + "learning_rate": 0.0002702892372269955, + "loss": 0.0294, "step": 39260 }, { - "epoch": 0.42, - "learning_rate": 0.00023632029577738857, - "loss": 0.0244, + "epoch": 0.2, + "learning_rate": 0.00027028166953398146, + "loss": 0.0238, "step": 39270 }, { - "epoch": 0.42, - "learning_rate": 0.0002363040799117857, - "loss": 0.0227, + "epoch": 0.2, + "learning_rate": 0.00027027410184096744, + "loss": 0.0232, "step": 39280 }, { - "epoch": 0.42, - "learning_rate": 0.00023628786404618276, - "loss": 0.021, + "epoch": 0.2, + "learning_rate": 0.0002702665341479534, + "loss": 0.0227, "step": 39290 }, { - "epoch": 0.42, - "learning_rate": 0.00023627164818057985, - "loss": 0.0199, + "epoch": 0.2, + "learning_rate": 0.0002702589664549394, + "loss": 0.023, "step": 39300 }, { - "epoch": 0.42, - "learning_rate": 0.00023625543231497697, - "loss": 0.0252, + "epoch": 0.2, + "learning_rate": 0.0002702513987619254, + "loss": 0.0287, "step": 39310 }, { - "epoch": 0.43, - "learning_rate": 0.00023623921644937406, - "loss": 0.0207, + "epoch": 0.2, + "learning_rate": 0.0002702438310689114, + "loss": 0.0228, "step": 39320 }, { - "epoch": 0.43, - "learning_rate": 0.00023622300058377113, - "loss": 0.0176, + "epoch": 0.2, + "learning_rate": 0.0002702362633758974, + "loss": 0.0206, "step": 39330 }, { - "epoch": 0.43, - "learning_rate": 0.00023620678471816822, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.0002702286956828834, + "loss": 0.0241, "step": 39340 }, { - "epoch": 0.43, - "learning_rate": 0.00023619056885256534, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.00027022112798986937, + "loss": 0.0253, "step": 39350 }, { - "epoch": 0.43, - "learning_rate": 0.00023617435298696243, - "loss": 0.0217, + "epoch": 0.2, + "learning_rate": 0.00027021356029685535, + "loss": 0.0273, "step": 39360 }, { - "epoch": 0.43, - "learning_rate": 0.0002361581371213595, - "loss": 0.0213, + "epoch": 0.2, + "learning_rate": 0.00027020599260384133, + "loss": 0.0271, "step": 39370 }, { - "epoch": 0.43, - "learning_rate": 0.00023614192125575662, - "loss": 0.0216, + "epoch": 0.2, + "learning_rate": 0.0002701984249108273, + "loss": 0.0256, "step": 39380 }, { - "epoch": 0.43, - "learning_rate": 0.0002361257053901537, - "loss": 0.0249, + "epoch": 0.2, + "learning_rate": 0.00027019085721781335, + "loss": 0.0234, "step": 39390 }, { - "epoch": 0.43, - "learning_rate": 0.0002361094895245508, - "loss": 0.018, + "epoch": 0.2, + "learning_rate": 0.00027018328952479933, + "loss": 0.0229, "step": 39400 }, { - "epoch": 0.43, - "learning_rate": 0.00023609327365894787, - "loss": 0.0177, + "epoch": 0.2, + "learning_rate": 0.0002701757218317853, + "loss": 0.025, "step": 39410 }, { - "epoch": 0.43, - "learning_rate": 0.000236077057793345, - "loss": 0.0187, + "epoch": 0.2, + "learning_rate": 0.0002701681541387713, + "loss": 0.0244, "step": 39420 }, { - "epoch": 0.43, - "learning_rate": 0.00023606084192774208, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.0002701605864457573, + "loss": 0.0249, "step": 39430 }, { - "epoch": 0.43, - "learning_rate": 0.00023604462606213917, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.00027015301875274325, + "loss": 0.0284, "step": 39440 }, { - "epoch": 0.43, - "learning_rate": 0.00023602841019653627, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.0002701454510597293, + "loss": 0.0252, "step": 39450 }, { - "epoch": 0.43, - "learning_rate": 0.00023601219433093336, - "loss": 0.0226, + "epoch": 0.2, + "learning_rate": 0.00027013788336671527, + "loss": 0.023, "step": 39460 }, { - "epoch": 0.43, - "learning_rate": 0.00023599597846533045, - "loss": 0.0199, + "epoch": 0.2, + "learning_rate": 0.00027013031567370125, + "loss": 0.0229, "step": 39470 }, { - "epoch": 0.43, - "learning_rate": 0.00023597976259972757, - "loss": 0.0217, + "epoch": 0.2, + "learning_rate": 0.00027012274798068723, + "loss": 0.025, "step": 39480 }, { - "epoch": 0.43, - "learning_rate": 0.00023596354673412464, - "loss": 0.0228, + "epoch": 0.2, + "learning_rate": 0.0002701151802876732, + "loss": 0.0308, "step": 39490 }, { - "epoch": 0.43, - "learning_rate": 0.00023594733086852173, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.0002701076125946592, + "loss": 0.0258, "step": 39500 }, { - "epoch": 0.43, - "learning_rate": 0.00023593111500291882, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.00027010004490164523, + "loss": 0.024, "step": 39510 }, { - "epoch": 0.43, - "learning_rate": 0.00023591489913731594, - "loss": 0.0168, + "epoch": 0.2, + "learning_rate": 0.0002700924772086312, + "loss": 0.0216, "step": 39520 }, { - "epoch": 0.43, - "learning_rate": 0.000235898683271713, - "loss": 0.0223, + "epoch": 0.2, + "learning_rate": 0.0002700849095156172, + "loss": 0.0224, "step": 39530 }, { - "epoch": 0.43, - "learning_rate": 0.0002358824674061101, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.0002700773418226032, + "loss": 0.0296, "step": 39540 }, { - "epoch": 0.43, - "learning_rate": 0.00023586625154050722, - "loss": 0.0222, + "epoch": 0.2, + "learning_rate": 0.00027006977412958916, + "loss": 0.0229, "step": 39550 }, { - "epoch": 0.43, - "learning_rate": 0.00023585003567490431, - "loss": 0.023, + "epoch": 0.2, + "learning_rate": 0.00027006220643657514, + "loss": 0.0238, "step": 39560 }, { - "epoch": 0.43, - "learning_rate": 0.0002358338198093014, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.0002700546387435611, + "loss": 0.0227, "step": 39570 }, { - "epoch": 0.43, - "learning_rate": 0.00023581760394369847, - "loss": 0.0194, + "epoch": 0.2, + "learning_rate": 0.00027004707105054716, + "loss": 0.0227, "step": 39580 }, { - "epoch": 0.43, - "learning_rate": 0.0002358013880780956, - "loss": 0.0204, + "epoch": 0.2, + "learning_rate": 0.00027003950335753314, + "loss": 0.0235, "step": 39590 }, { - "epoch": 0.43, - "learning_rate": 0.00023578517221249269, - "loss": 0.02, + "epoch": 0.2, + "learning_rate": 0.00027003193566451907, + "loss": 0.0265, "step": 39600 }, { - "epoch": 0.43, - "learning_rate": 0.0002357689563468898, - "loss": 0.0204, + "epoch": 0.2, + "learning_rate": 0.00027002436797150505, + "loss": 0.0229, "step": 39610 }, { - "epoch": 0.43, - "learning_rate": 0.00023575274048128687, - "loss": 0.0213, + "epoch": 0.2, + "learning_rate": 0.0002700168002784911, + "loss": 0.0259, "step": 39620 }, { - "epoch": 0.43, - "learning_rate": 0.00023573652461568396, + "epoch": 0.2, + "learning_rate": 0.00027000923258547706, "loss": 0.021, "step": 39630 }, { - "epoch": 0.43, - "learning_rate": 0.00023572030875008106, - "loss": 0.0179, - "step": 39640 + "epoch": 0.2, + "learning_rate": 0.00027000166489246305, + "loss": 0.0199, + "step": 39640 }, { - "epoch": 0.43, - "learning_rate": 0.00023570409288447818, - "loss": 0.0236, + "epoch": 0.2, + "learning_rate": 0.00026999409719944903, + "loss": 0.0248, "step": 39650 }, { - "epoch": 0.43, - "learning_rate": 0.00023568787701887524, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.000269986529506435, + "loss": 0.0259, "step": 39660 }, { - "epoch": 0.43, - "learning_rate": 0.00023567166115327234, - "loss": 0.0217, + "epoch": 0.2, + "learning_rate": 0.000269978961813421, + "loss": 0.0222, "step": 39670 }, { - "epoch": 0.43, - "learning_rate": 0.00023565544528766945, - "loss": 0.0209, + "epoch": 0.2, + "learning_rate": 0.000269971394120407, + "loss": 0.0292, "step": 39680 }, { - "epoch": 0.43, - "learning_rate": 0.00023563922942206655, - "loss": 0.0222, + "epoch": 0.2, + "learning_rate": 0.000269963826427393, + "loss": 0.0235, "step": 39690 }, { - "epoch": 0.43, - "learning_rate": 0.0002356230135564636, - "loss": 0.0202, + "epoch": 0.2, + "learning_rate": 0.000269956258734379, + "loss": 0.0219, "step": 39700 }, { - "epoch": 0.43, - "learning_rate": 0.0002356067976908607, - "loss": 0.0222, + "epoch": 0.2, + "learning_rate": 0.00026994869104136497, + "loss": 0.0204, "step": 39710 }, { - "epoch": 0.43, - "learning_rate": 0.00023559058182525783, - "loss": 0.0186, + "epoch": 0.2, + "learning_rate": 0.00026994112334835095, + "loss": 0.0247, "step": 39720 }, { - "epoch": 0.43, - "learning_rate": 0.00023557436595965492, - "loss": 0.0224, + "epoch": 0.2, + "learning_rate": 0.00026993355565533693, + "loss": 0.0252, "step": 39730 }, { - "epoch": 0.43, - "learning_rate": 0.00023555815009405198, - "loss": 0.0196, + "epoch": 0.2, + "learning_rate": 0.00026992598796232297, + "loss": 0.0226, "step": 39740 }, { - "epoch": 0.43, - "learning_rate": 0.0002355419342284491, - "loss": 0.0227, + "epoch": 0.2, + "learning_rate": 0.00026991842026930895, + "loss": 0.0288, "step": 39750 }, { - "epoch": 0.43, - "learning_rate": 0.0002355257183628462, - "loss": 0.0238, + "epoch": 0.2, + "learning_rate": 0.00026991085257629493, + "loss": 0.0283, "step": 39760 }, { - "epoch": 0.43, - "learning_rate": 0.0002355095024972433, - "loss": 0.0206, + "epoch": 0.2, + "learning_rate": 0.0002699032848832809, + "loss": 0.0258, "step": 39770 }, { - "epoch": 0.43, - "learning_rate": 0.00023549328663164036, - "loss": 0.02, + "epoch": 0.2, + "learning_rate": 0.0002698957171902669, + "loss": 0.0237, "step": 39780 }, { - "epoch": 0.43, - "learning_rate": 0.00023547707076603748, - "loss": 0.022, + "epoch": 0.2, + "learning_rate": 0.0002698881494972529, + "loss": 0.0233, "step": 39790 }, { - "epoch": 0.43, - "learning_rate": 0.00023546085490043457, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.00026988058180423886, + "loss": 0.0244, "step": 39800 }, { - "epoch": 0.43, - "learning_rate": 0.00023544463903483166, - "loss": 0.02, + "epoch": 0.2, + "learning_rate": 0.0002698730141112249, + "loss": 0.0241, "step": 39810 }, { - "epoch": 0.43, - "learning_rate": 0.00023542842316922875, - "loss": 0.0192, + "epoch": 0.2, + "learning_rate": 0.0002698654464182109, + "loss": 0.0213, "step": 39820 }, { - "epoch": 0.43, - "learning_rate": 0.00023541220730362585, - "loss": 0.017, + "epoch": 0.2, + "learning_rate": 0.00026985787872519686, + "loss": 0.0202, "step": 39830 }, { - "epoch": 0.43, - "learning_rate": 0.00023539599143802294, - "loss": 0.0148, + "epoch": 0.2, + "learning_rate": 0.00026985031103218284, + "loss": 0.0214, "step": 39840 }, { - "epoch": 0.43, - "learning_rate": 0.00023537977557242006, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.0002698427433391688, + "loss": 0.0229, "step": 39850 }, { - "epoch": 0.43, - "learning_rate": 0.00023536355970681712, - "loss": 0.0224, + "epoch": 0.2, + "learning_rate": 0.0002698351756461548, + "loss": 0.0242, "step": 39860 }, { - "epoch": 0.43, - "learning_rate": 0.00023534734384121422, - "loss": 0.0195, + "epoch": 0.2, + "learning_rate": 0.00026982760795314084, + "loss": 0.024, "step": 39870 }, { - "epoch": 0.43, - "learning_rate": 0.0002353311279756113, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.0002698200402601268, + "loss": 0.0255, "step": 39880 }, { - "epoch": 0.43, - "learning_rate": 0.00023531491211000843, - "loss": 0.0221, + "epoch": 0.2, + "learning_rate": 0.0002698124725671128, + "loss": 0.0256, "step": 39890 }, { - "epoch": 0.43, - "learning_rate": 0.0002352986962444055, - "loss": 0.0248, + "epoch": 0.2, + "learning_rate": 0.0002698049048740988, + "loss": 0.0242, "step": 39900 }, { - "epoch": 0.43, - "learning_rate": 0.0002352824803788026, - "loss": 0.0184, + "epoch": 0.2, + "learning_rate": 0.00026979733718108476, + "loss": 0.0215, "step": 39910 }, { - "epoch": 0.43, - "learning_rate": 0.0002352662645131997, - "loss": 0.0217, + "epoch": 0.2, + "learning_rate": 0.00026978976948807074, + "loss": 0.0348, "step": 39920 }, { - "epoch": 0.43, - "learning_rate": 0.0002352500486475968, - "loss": 0.0192, + "epoch": 0.2, + "learning_rate": 0.0002697822017950567, + "loss": 0.0344, "step": 39930 }, { - "epoch": 0.43, - "learning_rate": 0.00023523383278199387, - "loss": 0.0193, + "epoch": 0.2, + "learning_rate": 0.00026977463410204276, + "loss": 0.0237, "step": 39940 }, { - "epoch": 0.43, - "learning_rate": 0.00023521761691639096, - "loss": 0.0189, + "epoch": 0.2, + "learning_rate": 0.00026976706640902874, + "loss": 0.0288, "step": 39950 }, { - "epoch": 0.43, - "learning_rate": 0.00023520140105078808, - "loss": 0.0236, + "epoch": 0.2, + "learning_rate": 0.0002697594987160147, + "loss": 0.0227, "step": 39960 }, { - "epoch": 0.43, - "learning_rate": 0.00023518518518518517, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.0002697519310230007, + "loss": 0.0276, "step": 39970 }, { - "epoch": 0.43, - "learning_rate": 0.00023516896931958224, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.0002697443633299867, + "loss": 0.0226, "step": 39980 }, { - "epoch": 0.43, - "learning_rate": 0.00023515275345397936, - "loss": 0.0213, + "epoch": 0.2, + "learning_rate": 0.00026973679563697267, + "loss": 0.0191, "step": 39990 }, { - "epoch": 0.43, - "learning_rate": 0.00023513653758837645, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.0002697292279439587, + "loss": 0.0253, "step": 40000 }, { - "epoch": 0.43, - "eval_cer": 0.9215938169367153, - "eval_loss": 0.014509420841932297, - "eval_runtime": 121.8906, - "eval_samples_per_second": 16.408, - "eval_steps_per_second": 4.102, + "epoch": 0.2, + "eval_cer": 0.9144896638256703, + "eval_loss": 0.017527606338262558, + "eval_runtime": 117.0438, + "eval_samples_per_second": 17.088, + "eval_steps_per_second": 4.272, "step": 40000 }, { - "epoch": 0.43, - "learning_rate": 0.00023512032172277354, - "loss": 0.0186, + "epoch": 0.2, + "learning_rate": 0.0002697216602509447, + "loss": 0.0219, "step": 40010 }, { - "epoch": 0.43, - "learning_rate": 0.0002351041058571706, - "loss": 0.0214, + "epoch": 0.2, + "learning_rate": 0.00026971409255793067, + "loss": 0.024, "step": 40020 }, { - "epoch": 0.43, - "learning_rate": 0.00023508788999156773, - "loss": 0.0202, + "epoch": 0.2, + "learning_rate": 0.00026970652486491665, + "loss": 0.0232, "step": 40030 }, { - "epoch": 0.43, - "learning_rate": 0.00023507167412596482, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.00026969895717190263, + "loss": 0.0238, "step": 40040 }, { - "epoch": 0.43, - "learning_rate": 0.00023505545826036194, - "loss": 0.024, + "epoch": 0.2, + "learning_rate": 0.0002696913894788886, + "loss": 0.0242, "step": 40050 }, { - "epoch": 0.43, - "learning_rate": 0.000235039242394759, - "loss": 0.0195, + "epoch": 0.2, + "learning_rate": 0.00026968382178587465, + "loss": 0.0253, "step": 40060 }, { - "epoch": 0.43, - "learning_rate": 0.0002350230265291561, - "loss": 0.0197, + "epoch": 0.2, + "learning_rate": 0.00026967625409286063, + "loss": 0.0212, "step": 40070 }, { - "epoch": 0.43, - "learning_rate": 0.0002350068106635532, - "loss": 0.0217, + "epoch": 0.2, + "learning_rate": 0.0002696686863998466, + "loss": 0.0224, "step": 40080 }, { - "epoch": 0.43, - "learning_rate": 0.0002349905947979503, - "loss": 0.0215, + "epoch": 0.2, + "learning_rate": 0.0002696611187068326, + "loss": 0.0264, "step": 40090 }, { - "epoch": 0.43, - "learning_rate": 0.00023497437893234738, - "loss": 0.0195, + "epoch": 0.2, + "learning_rate": 0.00026965355101381857, + "loss": 0.0214, "step": 40100 }, { - "epoch": 0.43, - "learning_rate": 0.00023495816306674447, - "loss": 0.0196, + "epoch": 0.2, + "learning_rate": 0.00026964598332080455, + "loss": 0.0193, "step": 40110 }, { - "epoch": 0.43, - "learning_rate": 0.0002349419472011416, - "loss": 0.0216, + "epoch": 0.2, + "learning_rate": 0.00026963841562779054, + "loss": 0.023, "step": 40120 }, { - "epoch": 0.43, - "learning_rate": 0.00023492573133553868, - "loss": 0.0202, + "epoch": 0.2, + "learning_rate": 0.00026963084793477657, + "loss": 0.0233, "step": 40130 }, { - "epoch": 0.43, - "learning_rate": 0.00023490951546993575, - "loss": 0.0205, + "epoch": 0.2, + "learning_rate": 0.00026962328024176255, + "loss": 0.0214, "step": 40140 }, { - "epoch": 0.43, - "learning_rate": 0.00023489329960433284, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.00026961571254874853, + "loss": 0.0225, "step": 40150 }, { - "epoch": 0.43, - "learning_rate": 0.00023487708373872996, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.0002696081448557345, + "loss": 0.0234, "step": 40160 }, { - "epoch": 0.43, - "learning_rate": 0.00023486086787312705, - "loss": 0.023, + "epoch": 0.2, + "learning_rate": 0.0002696005771627205, + "loss": 0.0214, "step": 40170 }, { - "epoch": 0.43, - "learning_rate": 0.00023484465200752412, - "loss": 0.0208, + "epoch": 0.2, + "learning_rate": 0.0002695930094697065, + "loss": 0.021, "step": 40180 }, { - "epoch": 0.43, - "learning_rate": 0.00023482843614192124, - "loss": 0.0199, + "epoch": 0.2, + "learning_rate": 0.0002695854417766925, + "loss": 0.0198, "step": 40190 }, { - "epoch": 0.43, - "learning_rate": 0.00023481222027631833, - "loss": 0.02, + "epoch": 0.2, + "learning_rate": 0.0002695778740836785, + "loss": 0.023, "step": 40200 }, { - "epoch": 0.43, - "learning_rate": 0.00023479600441071542, - "loss": 0.0195, + "epoch": 0.2, + "learning_rate": 0.0002695703063906645, + "loss": 0.0218, "step": 40210 }, { - "epoch": 0.43, - "learning_rate": 0.0002347797885451125, - "loss": 0.0197, + "epoch": 0.2, + "learning_rate": 0.00026956273869765046, + "loss": 0.021, "step": 40220 }, { - "epoch": 0.43, - "learning_rate": 0.0002347635726795096, - "loss": 0.0222, + "epoch": 0.2, + "learning_rate": 0.00026955517100463644, + "loss": 0.021, "step": 40230 }, { - "epoch": 0.44, - "learning_rate": 0.0002347473568139067, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.0002695476033116224, + "loss": 0.0228, "step": 40240 }, { - "epoch": 0.44, - "learning_rate": 0.0002347311409483038, - "loss": 0.0195, + "epoch": 0.2, + "learning_rate": 0.00026954003561860846, + "loss": 0.018, "step": 40250 }, { - "epoch": 0.44, - "learning_rate": 0.0002347149250827009, - "loss": 0.0229, + "epoch": 0.2, + "learning_rate": 0.00026953246792559444, + "loss": 0.0233, "step": 40260 }, { - "epoch": 0.44, - "learning_rate": 0.00023469870921709798, - "loss": 0.0211, + "epoch": 0.2, + "learning_rate": 0.0002695249002325804, + "loss": 0.0248, "step": 40270 }, { - "epoch": 0.44, - "learning_rate": 0.00023468249335149507, - "loss": 0.0191, + "epoch": 0.2, + "learning_rate": 0.0002695173325395664, + "loss": 0.0231, "step": 40280 }, { - "epoch": 0.44, - "learning_rate": 0.0002346662774858922, - "loss": 0.0169, + "epoch": 0.2, + "learning_rate": 0.0002695097648465524, + "loss": 0.0194, "step": 40290 }, { - "epoch": 0.44, - "learning_rate": 0.00023465006162028929, - "loss": 0.0205, + "epoch": 0.2, + "learning_rate": 0.00026950219715353836, + "loss": 0.0268, "step": 40300 }, { - "epoch": 0.44, - "learning_rate": 0.00023463384575468635, - "loss": 0.0188, + "epoch": 0.2, + "learning_rate": 0.00026949462946052435, + "loss": 0.0225, "step": 40310 }, { - "epoch": 0.44, - "learning_rate": 0.00023461762988908344, - "loss": 0.0209, + "epoch": 0.2, + "learning_rate": 0.0002694870617675104, + "loss": 0.021, "step": 40320 }, { - "epoch": 0.44, - "learning_rate": 0.00023460141402348056, - "loss": 0.0269, + "epoch": 0.2, + "learning_rate": 0.00026947949407449636, + "loss": 0.0212, "step": 40330 }, { - "epoch": 0.44, - "learning_rate": 0.00023458519815787766, - "loss": 0.0203, + "epoch": 0.2, + "learning_rate": 0.00026947192638148234, + "loss": 0.0196, "step": 40340 }, { - "epoch": 0.44, - "learning_rate": 0.00023456898229227472, - "loss": 0.0227, + "epoch": 0.2, + "learning_rate": 0.0002694643586884683, + "loss": 0.0207, "step": 40350 }, { - "epoch": 0.44, - "learning_rate": 0.00023455276642667184, - "loss": 0.021, + "epoch": 0.2, + "learning_rate": 0.0002694567909954543, + "loss": 0.0239, "step": 40360 }, { - "epoch": 0.44, - "learning_rate": 0.00023453655056106894, - "loss": 0.0208, + "epoch": 0.2, + "learning_rate": 0.0002694492233024403, + "loss": 0.0247, "step": 40370 }, { - "epoch": 0.44, - "learning_rate": 0.00023452033469546603, - "loss": 0.0215, + "epoch": 0.2, + "learning_rate": 0.0002694416556094263, + "loss": 0.0192, "step": 40380 }, { - "epoch": 0.44, - "learning_rate": 0.00023450411882986312, - "loss": 0.0241, + "epoch": 0.2, + "learning_rate": 0.0002694340879164123, + "loss": 0.023, "step": 40390 }, { - "epoch": 0.44, - "learning_rate": 0.00023448790296426021, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.0002694265202233983, + "loss": 0.0229, "step": 40400 }, { - "epoch": 0.44, - "learning_rate": 0.0002344716870986573, - "loss": 0.0197, + "epoch": 0.2, + "learning_rate": 0.00026941895253038427, + "loss": 0.0219, "step": 40410 }, { - "epoch": 0.44, - "learning_rate": 0.00023445547123305443, - "loss": 0.0281, + "epoch": 0.2, + "learning_rate": 0.00026941138483737025, + "loss": 0.0203, "step": 40420 }, { - "epoch": 0.44, - "learning_rate": 0.0002344392553674515, - "loss": 0.0206, + "epoch": 0.2, + "learning_rate": 0.00026940381714435623, + "loss": 0.0248, "step": 40430 }, { - "epoch": 0.44, - "learning_rate": 0.00023442303950184858, - "loss": 0.0336, + "epoch": 0.2, + "learning_rate": 0.0002693962494513422, + "loss": 0.0201, "step": 40440 }, { - "epoch": 0.44, - "learning_rate": 0.00023440682363624568, - "loss": 0.0243, + "epoch": 0.2, + "learning_rate": 0.00026938868175832825, + "loss": 0.0244, "step": 40450 }, { - "epoch": 0.44, - "learning_rate": 0.0002343906077706428, - "loss": 0.0297, + "epoch": 0.2, + "learning_rate": 0.00026938111406531423, + "loss": 0.0253, "step": 40460 }, { - "epoch": 0.44, - "learning_rate": 0.00023437439190503986, - "loss": 0.0227, + "epoch": 0.2, + "learning_rate": 0.0002693735463723002, + "loss": 0.0213, "step": 40470 }, { - "epoch": 0.44, - "learning_rate": 0.00023435817603943696, - "loss": 0.037, + "epoch": 0.2, + "learning_rate": 0.0002693659786792862, + "loss": 0.0182, "step": 40480 }, { - "epoch": 0.44, - "learning_rate": 0.00023434196017383408, - "loss": 0.0193, + "epoch": 0.2, + "learning_rate": 0.0002693584109862722, + "loss": 0.0214, "step": 40490 }, { - "epoch": 0.44, - "learning_rate": 0.00023432574430823117, - "loss": 0.0221, + "epoch": 0.2, + "learning_rate": 0.00026935084329325816, + "loss": 0.0233, "step": 40500 }, { - "epoch": 0.44, - "learning_rate": 0.00023430952844262823, - "loss": 0.0623, + "epoch": 0.2, + "learning_rate": 0.0002693432756002442, + "loss": 0.0219, "step": 40510 }, { - "epoch": 0.44, - "learning_rate": 0.00023429331257702533, - "loss": 0.0249, + "epoch": 0.2, + "learning_rate": 0.00026933570790723017, + "loss": 0.0238, "step": 40520 }, { - "epoch": 0.44, - "learning_rate": 0.00023427709671142245, - "loss": 0.0252, + "epoch": 0.2, + "learning_rate": 0.00026932814021421615, + "loss": 0.0237, "step": 40530 }, { - "epoch": 0.44, - "learning_rate": 0.00023426088084581954, - "loss": 0.0206, + "epoch": 0.2, + "learning_rate": 0.00026932057252120214, + "loss": 0.027, "step": 40540 }, { - "epoch": 0.44, - "learning_rate": 0.0002342446649802166, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.0002693130048281881, + "loss": 0.027, "step": 40550 }, { - "epoch": 0.44, - "learning_rate": 0.00023422844911461372, - "loss": 0.022, + "epoch": 0.2, + "learning_rate": 0.0002693054371351741, + "loss": 0.0249, "step": 40560 }, { - "epoch": 0.44, - "learning_rate": 0.00023421223324901082, - "loss": 0.0218, + "epoch": 0.2, + "learning_rate": 0.00026929786944216013, + "loss": 0.0266, "step": 40570 }, { - "epoch": 0.44, - "learning_rate": 0.0002341960173834079, - "loss": 0.0209, + "epoch": 0.2, + "learning_rate": 0.0002692903017491461, + "loss": 0.0279, "step": 40580 }, { - "epoch": 0.44, - "learning_rate": 0.00023417980151780498, - "loss": 0.0193, + "epoch": 0.2, + "learning_rate": 0.0002692827340561321, + "loss": 0.0205, "step": 40590 }, { - "epoch": 0.44, - "learning_rate": 0.0002341635856522021, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.0002692751663631181, + "loss": 0.0219, "step": 40600 }, { - "epoch": 0.44, - "learning_rate": 0.0002341473697865992, - "loss": 0.0218, + "epoch": 0.2, + "learning_rate": 0.00026926759867010406, + "loss": 0.0209, "step": 40610 }, { - "epoch": 0.44, - "learning_rate": 0.0002341311539209963, - "loss": 0.021, + "epoch": 0.2, + "learning_rate": 0.00026926003097709004, + "loss": 0.0262, "step": 40620 }, { - "epoch": 0.44, - "learning_rate": 0.00023411493805539337, - "loss": 0.0228, + "epoch": 0.2, + "learning_rate": 0.000269252463284076, + "loss": 0.022, "step": 40630 }, { - "epoch": 0.44, - "learning_rate": 0.00023409872218979047, - "loss": 0.0226, + "epoch": 0.21, + "learning_rate": 0.00026924489559106206, + "loss": 0.0214, "step": 40640 }, { - "epoch": 0.44, - "learning_rate": 0.00023408250632418756, - "loss": 0.0241, + "epoch": 0.21, + "learning_rate": 0.00026923732789804804, + "loss": 0.0227, "step": 40650 }, { - "epoch": 0.44, - "learning_rate": 0.00023406629045858468, - "loss": 0.0298, + "epoch": 0.21, + "learning_rate": 0.000269229760205034, + "loss": 0.0242, "step": 40660 }, { - "epoch": 0.44, - "learning_rate": 0.00023405007459298174, - "loss": 0.0223, + "epoch": 0.21, + "learning_rate": 0.00026922219251202, + "loss": 0.0278, "step": 40670 }, { - "epoch": 0.44, - "learning_rate": 0.00023403385872737884, - "loss": 0.0277, + "epoch": 0.21, + "learning_rate": 0.000269214624819006, + "loss": 0.0184, "step": 40680 }, { - "epoch": 0.44, - "learning_rate": 0.00023401764286177596, - "loss": 0.0224, + "epoch": 0.21, + "learning_rate": 0.00026920705712599197, + "loss": 0.0232, "step": 40690 }, { - "epoch": 0.44, - "learning_rate": 0.00023400142699617305, - "loss": 0.0231, + "epoch": 0.21, + "learning_rate": 0.000269199489432978, + "loss": 0.0224, "step": 40700 }, { - "epoch": 0.44, - "learning_rate": 0.00023398521113057012, - "loss": 0.0194, + "epoch": 0.21, + "learning_rate": 0.000269191921739964, + "loss": 0.0214, "step": 40710 }, { - "epoch": 0.44, - "learning_rate": 0.0002339689952649672, - "loss": 0.0232, + "epoch": 0.21, + "learning_rate": 0.00026918435404694996, + "loss": 0.0192, "step": 40720 }, { - "epoch": 0.44, - "learning_rate": 0.00023395277939936433, - "loss": 0.0228, + "epoch": 0.21, + "learning_rate": 0.00026917678635393595, + "loss": 0.0214, "step": 40730 }, { - "epoch": 0.44, - "learning_rate": 0.00023393656353376142, - "loss": 0.0203, + "epoch": 0.21, + "learning_rate": 0.0002691692186609219, + "loss": 0.0217, "step": 40740 }, { - "epoch": 0.44, - "learning_rate": 0.0002339203476681585, - "loss": 0.0197, + "epoch": 0.21, + "learning_rate": 0.0002691616509679079, + "loss": 0.0259, "step": 40750 }, { - "epoch": 0.44, - "learning_rate": 0.0002339041318025556, - "loss": 0.021, + "epoch": 0.21, + "learning_rate": 0.00026915408327489394, + "loss": 0.0215, "step": 40760 }, { - "epoch": 0.44, - "learning_rate": 0.0002338879159369527, - "loss": 0.0217, + "epoch": 0.21, + "learning_rate": 0.0002691465155818799, + "loss": 0.0231, "step": 40770 }, { - "epoch": 0.44, - "learning_rate": 0.0002338717000713498, - "loss": 0.0212, + "epoch": 0.21, + "learning_rate": 0.0002691389478888659, + "loss": 0.0236, "step": 40780 }, { - "epoch": 0.44, - "learning_rate": 0.00023385548420574686, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.0002691313801958519, + "loss": 0.0194, "step": 40790 }, { - "epoch": 0.44, - "learning_rate": 0.00023383926834014398, - "loss": 0.0203, + "epoch": 0.21, + "learning_rate": 0.00026912381250283787, + "loss": 0.0237, "step": 40800 }, { - "epoch": 0.44, - "learning_rate": 0.00023382305247454107, - "loss": 0.0233, + "epoch": 0.21, + "learning_rate": 0.00026911624480982385, + "loss": 0.0226, "step": 40810 }, { - "epoch": 0.44, - "learning_rate": 0.00023380683660893816, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.00026910867711680983, + "loss": 0.0246, "step": 40820 }, { - "epoch": 0.44, - "learning_rate": 0.00023379062074333526, - "loss": 0.0208, + "epoch": 0.21, + "learning_rate": 0.00026910110942379587, + "loss": 0.0228, "step": 40830 }, { - "epoch": 0.44, - "learning_rate": 0.00023377440487773235, - "loss": 0.0205, + "epoch": 0.21, + "learning_rate": 0.00026909354173078185, + "loss": 0.0255, "step": 40840 }, { - "epoch": 0.44, - "learning_rate": 0.00023375818901212944, - "loss": 0.0216, + "epoch": 0.21, + "learning_rate": 0.0002690859740377678, + "loss": 0.0248, "step": 40850 }, { - "epoch": 0.44, - "learning_rate": 0.00023374197314652656, - "loss": 0.0211, + "epoch": 0.21, + "learning_rate": 0.00026907840634475376, + "loss": 0.0238, "step": 40860 }, { - "epoch": 0.44, - "learning_rate": 0.00023372575728092363, - "loss": 0.0192, + "epoch": 0.21, + "learning_rate": 0.0002690708386517398, + "loss": 0.0216, "step": 40870 }, { - "epoch": 0.44, - "learning_rate": 0.00023370954141532072, - "loss": 0.0247, + "epoch": 0.21, + "learning_rate": 0.0002690632709587258, + "loss": 0.0244, "step": 40880 }, { - "epoch": 0.44, - "learning_rate": 0.0002336933255497178, - "loss": 0.0191, + "epoch": 0.21, + "learning_rate": 0.00026905570326571176, + "loss": 0.0219, "step": 40890 }, { - "epoch": 0.44, - "learning_rate": 0.00023367710968411493, - "loss": 0.0189, + "epoch": 0.21, + "learning_rate": 0.00026904813557269774, + "loss": 0.024, "step": 40900 }, { - "epoch": 0.44, - "learning_rate": 0.000233660893818512, - "loss": 0.0266, + "epoch": 0.21, + "learning_rate": 0.0002690405678796837, + "loss": 0.0252, "step": 40910 }, { - "epoch": 0.44, - "learning_rate": 0.0002336446779529091, - "loss": 0.0178, + "epoch": 0.21, + "learning_rate": 0.0002690330001866697, + "loss": 0.0234, "step": 40920 }, { - "epoch": 0.44, - "learning_rate": 0.0002336284620873062, - "loss": 0.0186, + "epoch": 0.21, + "learning_rate": 0.00026902543249365574, + "loss": 0.0234, "step": 40930 }, { - "epoch": 0.44, - "learning_rate": 0.0002336122462217033, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.0002690178648006417, + "loss": 0.0217, "step": 40940 }, { - "epoch": 0.44, - "learning_rate": 0.00023359603035610037, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.0002690102971076277, + "loss": 0.0212, "step": 40950 }, { - "epoch": 0.44, - "learning_rate": 0.00023357981449049746, - "loss": 0.0238, + "epoch": 0.21, + "learning_rate": 0.0002690027294146137, + "loss": 0.0267, "step": 40960 }, { - "epoch": 0.44, - "learning_rate": 0.00023356359862489458, - "loss": 0.02, + "epoch": 0.21, + "learning_rate": 0.00026899516172159966, + "loss": 0.0248, "step": 40970 }, { - "epoch": 0.44, - "learning_rate": 0.00023354738275929167, - "loss": 0.0184, + "epoch": 0.21, + "learning_rate": 0.00026898759402858564, + "loss": 0.025, "step": 40980 }, { - "epoch": 0.44, - "learning_rate": 0.00023353116689368874, - "loss": 0.0184, + "epoch": 0.21, + "learning_rate": 0.0002689800263355716, + "loss": 0.0233, "step": 40990 }, { - "epoch": 0.44, - "learning_rate": 0.00023351495102808586, - "loss": 0.0204, + "epoch": 0.21, + "learning_rate": 0.00026897245864255766, + "loss": 0.0207, "step": 41000 }, { - "epoch": 0.44, - "eval_cer": 0.9215903425248898, - "eval_loss": 0.013930886052548885, - "eval_runtime": 121.8476, - "eval_samples_per_second": 16.414, - "eval_steps_per_second": 4.103, + "epoch": 0.21, + "eval_cer": 0.914467344714786, + "eval_loss": 0.01699613220989704, + "eval_runtime": 117.194, + "eval_samples_per_second": 17.066, + "eval_steps_per_second": 4.266, "step": 41000 }, { - "epoch": 0.44, - "learning_rate": 0.00023349873516248295, - "loss": 0.0193, + "epoch": 0.21, + "learning_rate": 0.00026896489094954364, + "loss": 0.0217, "step": 41010 }, { - "epoch": 0.44, - "learning_rate": 0.00023348251929688005, - "loss": 0.0246, + "epoch": 0.21, + "learning_rate": 0.0002689573232565296, + "loss": 0.0221, "step": 41020 }, { - "epoch": 0.44, - "learning_rate": 0.00023346630343127717, - "loss": 0.0188, + "epoch": 0.21, + "learning_rate": 0.0002689497555635156, + "loss": 0.023, "step": 41030 }, { - "epoch": 0.44, - "learning_rate": 0.00023345008756567423, - "loss": 0.0192, + "epoch": 0.21, + "learning_rate": 0.0002689421878705016, + "loss": 0.0222, "step": 41040 }, { - "epoch": 0.44, - "learning_rate": 0.00023343387170007132, - "loss": 0.0175, + "epoch": 0.21, + "learning_rate": 0.00026893462017748757, + "loss": 0.0222, "step": 41050 }, { - "epoch": 0.44, - "learning_rate": 0.00023341765583446844, - "loss": 0.0205, + "epoch": 0.21, + "learning_rate": 0.0002689270524844736, + "loss": 0.0221, "step": 41060 }, { - "epoch": 0.44, - "learning_rate": 0.00023340143996886554, - "loss": 0.0214, + "epoch": 0.21, + "learning_rate": 0.0002689194847914596, + "loss": 0.0231, "step": 41070 }, { - "epoch": 0.44, - "learning_rate": 0.0002333852241032626, - "loss": 0.0165, + "epoch": 0.21, + "learning_rate": 0.00026891191709844557, + "loss": 0.0243, "step": 41080 }, { - "epoch": 0.44, - "learning_rate": 0.0002333690082376597, - "loss": 0.021, + "epoch": 0.21, + "learning_rate": 0.00026890434940543155, + "loss": 0.023, "step": 41090 }, { - "epoch": 0.44, - "learning_rate": 0.00023335279237205681, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.00026889678171241753, + "loss": 0.0216, "step": 41100 }, { - "epoch": 0.44, - "learning_rate": 0.0002333365765064539, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.0002688892140194035, + "loss": 0.0208, "step": 41110 }, { - "epoch": 0.44, - "learning_rate": 0.00023332036064085097, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.00026888164632638955, + "loss": 0.0247, "step": 41120 }, { - "epoch": 0.44, - "learning_rate": 0.0002333041447752481, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.00026887407863337553, + "loss": 0.0211, "step": 41130 }, { - "epoch": 0.44, - "learning_rate": 0.00023328792890964519, - "loss": 0.019, + "epoch": 0.21, + "learning_rate": 0.0002688665109403615, + "loss": 0.0257, "step": 41140 }, { - "epoch": 0.44, - "learning_rate": 0.00023327171304404228, - "loss": 0.0227, + "epoch": 0.21, + "learning_rate": 0.0002688589432473475, + "loss": 0.025, "step": 41150 }, { - "epoch": 0.44, - "learning_rate": 0.00023325549717843934, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.00026885137555433347, + "loss": 0.0201, "step": 41160 }, { - "epoch": 0.45, - "learning_rate": 0.00023323928131283646, - "loss": 0.0227, + "epoch": 0.21, + "learning_rate": 0.00026884380786131945, + "loss": 0.0224, "step": 41170 }, { - "epoch": 0.45, - "learning_rate": 0.00023322306544723356, - "loss": 0.0204, + "epoch": 0.21, + "learning_rate": 0.00026883624016830544, + "loss": 0.0261, "step": 41180 }, { - "epoch": 0.45, - "learning_rate": 0.00023320684958163065, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.00026882867247529147, + "loss": 0.0214, "step": 41190 }, { - "epoch": 0.45, - "learning_rate": 0.00023319063371602774, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.00026882110478227745, + "loss": 0.0231, "step": 41200 }, { - "epoch": 0.45, - "learning_rate": 0.00023317441785042483, - "loss": 0.0229, + "epoch": 0.21, + "learning_rate": 0.00026881353708926343, + "loss": 0.0228, "step": 41210 }, { - "epoch": 0.45, - "learning_rate": 0.00023315820198482193, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.0002688059693962494, + "loss": 0.0238, "step": 41220 }, { - "epoch": 0.45, - "learning_rate": 0.00023314198611921905, - "loss": 0.0216, + "epoch": 0.21, + "learning_rate": 0.0002687984017032354, + "loss": 0.023, "step": 41230 }, { - "epoch": 0.45, - "learning_rate": 0.0002331257702536161, - "loss": 0.02, + "epoch": 0.21, + "learning_rate": 0.0002687908340102214, + "loss": 0.022, "step": 41240 }, { - "epoch": 0.45, - "learning_rate": 0.0002331095543880132, - "loss": 0.0196, + "epoch": 0.21, + "learning_rate": 0.0002687832663172074, + "loss": 0.0272, "step": 41250 }, { - "epoch": 0.45, - "learning_rate": 0.0002330933385224103, - "loss": 0.0188, + "epoch": 0.21, + "learning_rate": 0.0002687756986241934, + "loss": 0.0235, "step": 41260 }, { - "epoch": 0.45, - "learning_rate": 0.00023307712265680742, - "loss": 0.0233, + "epoch": 0.21, + "learning_rate": 0.0002687681309311794, + "loss": 0.0283, "step": 41270 }, { - "epoch": 0.45, - "learning_rate": 0.00023306090679120448, - "loss": 0.0226, + "epoch": 0.21, + "learning_rate": 0.00026876056323816536, + "loss": 0.0257, "step": 41280 }, { - "epoch": 0.45, - "learning_rate": 0.00023304469092560158, - "loss": 0.0209, + "epoch": 0.21, + "learning_rate": 0.00026875299554515134, + "loss": 0.0235, "step": 41290 }, { - "epoch": 0.45, - "learning_rate": 0.0002330284750599987, - "loss": 0.0196, + "epoch": 0.21, + "learning_rate": 0.0002687454278521373, + "loss": 0.0202, "step": 41300 }, { - "epoch": 0.45, - "learning_rate": 0.0002330122591943958, - "loss": 0.0213, + "epoch": 0.21, + "learning_rate": 0.00026873786015912336, + "loss": 0.0221, "step": 41310 }, { - "epoch": 0.45, - "learning_rate": 0.00023299604332879285, - "loss": 0.0207, + "epoch": 0.21, + "learning_rate": 0.00026873029246610934, + "loss": 0.029, "step": 41320 }, { - "epoch": 0.45, - "learning_rate": 0.00023297982746318995, - "loss": 0.021, + "epoch": 0.21, + "learning_rate": 0.0002687227247730953, + "loss": 0.0238, "step": 41330 }, { - "epoch": 0.45, - "learning_rate": 0.00023296361159758707, - "loss": 0.0227, + "epoch": 0.21, + "learning_rate": 0.0002687151570800813, + "loss": 0.024, "step": 41340 }, { - "epoch": 0.45, - "learning_rate": 0.00023294739573198416, - "loss": 0.0168, + "epoch": 0.21, + "learning_rate": 0.0002687075893870673, + "loss": 0.0215, "step": 41350 }, { - "epoch": 0.45, - "learning_rate": 0.00023293117986638123, - "loss": 0.0199, + "epoch": 0.21, + "learning_rate": 0.00026870002169405326, + "loss": 0.0202, "step": 41360 }, { - "epoch": 0.45, - "learning_rate": 0.00023291496400077835, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.00026869245400103925, + "loss": 0.026, "step": 41370 }, { - "epoch": 0.45, - "learning_rate": 0.00023289874813517544, - "loss": 0.0208, + "epoch": 0.21, + "learning_rate": 0.0002686848863080253, + "loss": 0.026, "step": 41380 }, { - "epoch": 0.45, - "learning_rate": 0.00023288253226957253, - "loss": 0.0192, + "epoch": 0.21, + "learning_rate": 0.00026867731861501126, + "loss": 0.0239, "step": 41390 }, { - "epoch": 0.45, - "learning_rate": 0.00023286631640396962, - "loss": 0.0212, + "epoch": 0.21, + "learning_rate": 0.00026866975092199724, + "loss": 0.0218, "step": 41400 }, { - "epoch": 0.45, - "learning_rate": 0.00023285010053836672, - "loss": 0.0206, + "epoch": 0.21, + "learning_rate": 0.0002686621832289832, + "loss": 0.0221, "step": 41410 }, { - "epoch": 0.45, - "learning_rate": 0.0002328338846727638, - "loss": 0.0209, + "epoch": 0.21, + "learning_rate": 0.0002686546155359692, + "loss": 0.0244, "step": 41420 }, { - "epoch": 0.45, - "learning_rate": 0.00023281766880716093, - "loss": 0.0215, + "epoch": 0.21, + "learning_rate": 0.0002686470478429552, + "loss": 0.0188, "step": 41430 }, { - "epoch": 0.45, - "learning_rate": 0.000232801452941558, - "loss": 0.026, + "epoch": 0.21, + "learning_rate": 0.0002686394801499412, + "loss": 0.0235, "step": 41440 }, { - "epoch": 0.45, - "learning_rate": 0.0002327852370759551, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.0002686319124569272, + "loss": 0.0242, "step": 41450 }, { - "epoch": 0.45, - "learning_rate": 0.00023276902121035218, - "loss": 0.0174, + "epoch": 0.21, + "learning_rate": 0.0002686243447639132, + "loss": 0.0242, "step": 41460 }, { - "epoch": 0.45, - "learning_rate": 0.0002327528053447493, - "loss": 0.0216, + "epoch": 0.21, + "learning_rate": 0.00026861677707089917, + "loss": 0.02, "step": 41470 }, { - "epoch": 0.45, - "learning_rate": 0.00023273658947914637, - "loss": 0.0192, + "epoch": 0.21, + "learning_rate": 0.00026860920937788515, + "loss": 0.0226, "step": 41480 }, { - "epoch": 0.45, - "learning_rate": 0.00023272037361354346, - "loss": 0.0217, + "epoch": 0.21, + "learning_rate": 0.00026860164168487113, + "loss": 0.0202, "step": 41490 }, { - "epoch": 0.45, - "learning_rate": 0.00023270415774794058, - "loss": 0.0204, + "epoch": 0.21, + "learning_rate": 0.0002685940739918571, + "loss": 0.0231, "step": 41500 }, { - "epoch": 0.45, - "learning_rate": 0.00023268794188233767, - "loss": 0.0241, + "epoch": 0.21, + "learning_rate": 0.00026858650629884315, + "loss": 0.0227, "step": 41510 }, { - "epoch": 0.45, - "learning_rate": 0.00023267172601673474, - "loss": 0.0202, + "epoch": 0.21, + "learning_rate": 0.00026857893860582913, + "loss": 0.0243, "step": 41520 }, { - "epoch": 0.45, - "learning_rate": 0.00023265551015113183, - "loss": 0.0151, + "epoch": 0.21, + "learning_rate": 0.0002685713709128151, + "loss": 0.0223, "step": 41530 }, { - "epoch": 0.45, - "learning_rate": 0.00023263929428552895, - "loss": 0.0216, + "epoch": 0.21, + "learning_rate": 0.0002685638032198011, + "loss": 0.0314, "step": 41540 }, { - "epoch": 0.45, - "learning_rate": 0.00023262307841992604, - "loss": 0.0205, + "epoch": 0.21, + "learning_rate": 0.0002685562355267871, + "loss": 0.0217, "step": 41550 }, { - "epoch": 0.45, - "learning_rate": 0.0002326068625543231, - "loss": 0.0205, + "epoch": 0.21, + "learning_rate": 0.00026854866783377306, + "loss": 0.0286, "step": 41560 }, { - "epoch": 0.45, - "learning_rate": 0.00023259064668872023, - "loss": 0.0186, + "epoch": 0.21, + "learning_rate": 0.0002685411001407591, + "loss": 0.0293, "step": 41570 }, { - "epoch": 0.45, - "learning_rate": 0.00023257443082311732, - "loss": 0.0189, + "epoch": 0.21, + "learning_rate": 0.00026853353244774507, + "loss": 0.0253, "step": 41580 }, { - "epoch": 0.45, - "learning_rate": 0.0002325582149575144, - "loss": 0.0158, + "epoch": 0.21, + "learning_rate": 0.00026852596475473105, + "loss": 0.0232, "step": 41590 }, { - "epoch": 0.45, - "learning_rate": 0.00023254199909191148, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.00026851839706171704, + "loss": 0.0243, "step": 41600 }, { - "epoch": 0.45, - "learning_rate": 0.0002325257832263086, - "loss": 0.0212, + "epoch": 0.21, + "learning_rate": 0.000268510829368703, + "loss": 0.0246, "step": 41610 }, { - "epoch": 0.45, - "learning_rate": 0.0002325095673607057, - "loss": 0.0186, + "epoch": 0.21, + "learning_rate": 0.000268503261675689, + "loss": 0.0231, "step": 41620 }, { - "epoch": 0.45, - "learning_rate": 0.0002324933514951028, - "loss": 0.0201, + "epoch": 0.21, + "learning_rate": 0.00026849569398267503, + "loss": 0.0237, "step": 41630 }, { - "epoch": 0.45, - "learning_rate": 0.00023247713562949988, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.000268488126289661, + "loss": 0.0277, "step": 41640 }, { - "epoch": 0.45, - "learning_rate": 0.00023246091976389697, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.000268480558596647, + "loss": 0.0246, "step": 41650 }, { - "epoch": 0.45, - "learning_rate": 0.00023244470389829406, - "loss": 0.0191, + "epoch": 0.21, + "learning_rate": 0.000268472990903633, + "loss": 0.0216, "step": 41660 }, { - "epoch": 0.45, - "learning_rate": 0.00023242848803269118, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.00026846542321061896, + "loss": 0.0244, "step": 41670 }, { - "epoch": 0.45, - "learning_rate": 0.00023241227216708825, - "loss": 0.0217, + "epoch": 0.21, + "learning_rate": 0.00026845785551760494, + "loss": 0.0221, "step": 41680 }, { - "epoch": 0.45, - "learning_rate": 0.00023239605630148534, - "loss": 0.0248, + "epoch": 0.21, + "learning_rate": 0.0002684502878245909, + "loss": 0.0221, "step": 41690 }, { - "epoch": 0.45, - "learning_rate": 0.00023237984043588246, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.00026844272013157696, + "loss": 0.026, "step": 41700 }, { - "epoch": 0.45, - "learning_rate": 0.00023236362457027955, - "loss": 0.0205, + "epoch": 0.21, + "learning_rate": 0.00026843515243856294, + "loss": 0.0245, "step": 41710 }, { - "epoch": 0.45, - "learning_rate": 0.00023234740870467665, - "loss": 0.0228, + "epoch": 0.21, + "learning_rate": 0.0002684275847455489, + "loss": 0.0195, "step": 41720 }, { - "epoch": 0.45, - "learning_rate": 0.0002323311928390737, - "loss": 0.017, + "epoch": 0.21, + "learning_rate": 0.0002684200170525349, + "loss": 0.0212, "step": 41730 }, { - "epoch": 0.45, - "learning_rate": 0.00023231497697347083, - "loss": 0.0254, + "epoch": 0.21, + "learning_rate": 0.0002684124493595209, + "loss": 0.0242, "step": 41740 }, { - "epoch": 0.45, - "learning_rate": 0.00023229876110786792, - "loss": 0.0165, + "epoch": 0.21, + "learning_rate": 0.00026840488166650687, + "loss": 0.0231, "step": 41750 }, { - "epoch": 0.45, - "learning_rate": 0.00023228254524226502, - "loss": 0.0208, + "epoch": 0.21, + "learning_rate": 0.0002683973139734929, + "loss": 0.0249, "step": 41760 }, { - "epoch": 0.45, - "learning_rate": 0.0002322663293766621, - "loss": 0.0194, + "epoch": 0.21, + "learning_rate": 0.0002683897462804789, + "loss": 0.0244, "step": 41770 }, { - "epoch": 0.45, - "learning_rate": 0.0002322501135110592, - "loss": 0.0197, + "epoch": 0.21, + "learning_rate": 0.00026838217858746486, + "loss": 0.0243, "step": 41780 }, { - "epoch": 0.45, - "learning_rate": 0.0002322338976454563, - "loss": 0.0208, + "epoch": 0.21, + "learning_rate": 0.00026837461089445085, + "loss": 0.0263, "step": 41790 }, { - "epoch": 0.45, - "learning_rate": 0.00023221768177985341, - "loss": 0.0203, + "epoch": 0.21, + "learning_rate": 0.0002683670432014368, + "loss": 0.0243, "step": 41800 }, { - "epoch": 0.45, - "learning_rate": 0.00023220146591425048, - "loss": 0.0214, + "epoch": 0.21, + "learning_rate": 0.0002683594755084228, + "loss": 0.0245, "step": 41810 }, { - "epoch": 0.45, - "learning_rate": 0.00023218525004864757, - "loss": 0.0236, + "epoch": 0.21, + "learning_rate": 0.00026835190781540884, + "loss": 0.0203, "step": 41820 }, { - "epoch": 0.45, - "learning_rate": 0.00023216903418304467, - "loss": 0.0195, + "epoch": 0.21, + "learning_rate": 0.0002683443401223948, + "loss": 0.0245, "step": 41830 }, { - "epoch": 0.45, - "learning_rate": 0.00023215281831744179, - "loss": 0.0208, + "epoch": 0.21, + "learning_rate": 0.0002683367724293808, + "loss": 0.0206, "step": 41840 }, { - "epoch": 0.45, - "learning_rate": 0.00023213660245183885, - "loss": 0.019, + "epoch": 0.21, + "learning_rate": 0.0002683292047363668, + "loss": 0.0231, "step": 41850 }, { - "epoch": 0.45, - "learning_rate": 0.00023212038658623594, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.00026832163704335277, + "loss": 0.0256, "step": 41860 }, { - "epoch": 0.45, - "learning_rate": 0.00023210417072063306, - "loss": 0.0249, + "epoch": 0.21, + "learning_rate": 0.00026831406935033875, + "loss": 0.0225, "step": 41870 }, { - "epoch": 0.45, - "learning_rate": 0.00023208795485503016, - "loss": 0.0197, + "epoch": 0.21, + "learning_rate": 0.00026830650165732473, + "loss": 0.022, "step": 41880 }, { - "epoch": 0.45, - "learning_rate": 0.00023207173898942722, - "loss": 0.0221, + "epoch": 0.21, + "learning_rate": 0.00026829893396431077, + "loss": 0.0211, "step": 41890 }, { - "epoch": 0.45, - "learning_rate": 0.00023205552312382432, - "loss": 0.0179, + "epoch": 0.21, + "learning_rate": 0.00026829136627129675, + "loss": 0.0196, "step": 41900 }, { - "epoch": 0.45, - "learning_rate": 0.00023203930725822143, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.00026828379857828273, + "loss": 0.0222, "step": 41910 }, { - "epoch": 0.45, - "learning_rate": 0.00023202309139261853, - "loss": 0.0209, + "epoch": 0.21, + "learning_rate": 0.0002682762308852687, + "loss": 0.0221, "step": 41920 }, { - "epoch": 0.45, - "learning_rate": 0.0002320068755270156, - "loss": 0.0194, + "epoch": 0.21, + "learning_rate": 0.0002682686631922547, + "loss": 0.0218, "step": 41930 }, { - "epoch": 0.45, - "learning_rate": 0.0002319906596614127, - "loss": 0.0208, + "epoch": 0.21, + "learning_rate": 0.0002682610954992407, + "loss": 0.0212, "step": 41940 }, { - "epoch": 0.45, - "learning_rate": 0.0002319744437958098, - "loss": 0.0192, + "epoch": 0.21, + "learning_rate": 0.0002682535278062267, + "loss": 0.0238, "step": 41950 }, { - "epoch": 0.45, - "learning_rate": 0.0002319582279302069, - "loss": 0.0191, + "epoch": 0.21, + "learning_rate": 0.0002682459601132127, + "loss": 0.0307, "step": 41960 }, { - "epoch": 0.45, - "learning_rate": 0.00023194201206460396, - "loss": 0.0287, + "epoch": 0.21, + "learning_rate": 0.0002682383924201987, + "loss": 0.0334, "step": 41970 }, { - "epoch": 0.45, - "learning_rate": 0.00023192579619900108, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.00026823082472718466, + "loss": 0.0275, "step": 41980 }, { - "epoch": 0.45, - "learning_rate": 0.00023190958033339818, - "loss": 0.0169, + "epoch": 0.21, + "learning_rate": 0.00026822325703417064, + "loss": 0.0235, "step": 41990 }, { - "epoch": 0.45, - "learning_rate": 0.0002318933644677953, - "loss": 0.0201, + "epoch": 0.21, + "learning_rate": 0.0002682156893411566, + "loss": 0.0311, "step": 42000 }, { - "epoch": 0.45, - "eval_cer": 0.9215564670095912, - "eval_loss": 0.014593328349292278, - "eval_runtime": 121.8424, - "eval_samples_per_second": 16.415, - "eval_steps_per_second": 4.104, + "epoch": 0.21, + "eval_cer": 0.9144421144155256, + "eval_loss": 0.01655089110136032, + "eval_runtime": 117.2639, + "eval_samples_per_second": 17.056, + "eval_steps_per_second": 4.264, "step": 42000 }, { - "epoch": 0.45, - "learning_rate": 0.00023187714860219236, - "loss": 0.0195, + "epoch": 0.21, + "learning_rate": 0.0002682081216481426, + "loss": 0.0264, "step": 42010 }, { - "epoch": 0.45, - "learning_rate": 0.00023186093273658946, - "loss": 0.021, + "epoch": 0.21, + "learning_rate": 0.00026820055395512864, + "loss": 0.0291, "step": 42020 }, { - "epoch": 0.45, - "learning_rate": 0.00023184471687098655, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.0002681929862621146, + "loss": 0.0261, "step": 42030 }, { - "epoch": 0.45, - "learning_rate": 0.00023182850100538367, - "loss": 0.0203, + "epoch": 0.21, + "learning_rate": 0.0002681854185691006, + "loss": 0.0209, "step": 42040 }, { - "epoch": 0.45, - "learning_rate": 0.00023181228513978073, - "loss": 0.0206, + "epoch": 0.21, + "learning_rate": 0.0002681778508760866, + "loss": 0.0226, "step": 42050 }, { - "epoch": 0.45, - "learning_rate": 0.00023179606927417783, - "loss": 0.0186, + "epoch": 0.21, + "learning_rate": 0.00026817028318307256, + "loss": 0.0231, "step": 42060 }, { - "epoch": 0.45, - "learning_rate": 0.00023177985340857495, - "loss": 0.0199, + "epoch": 0.21, + "learning_rate": 0.00026816271549005854, + "loss": 0.0239, "step": 42070 }, { - "epoch": 0.45, - "learning_rate": 0.00023176363754297204, - "loss": 0.0214, + "epoch": 0.21, + "learning_rate": 0.0002681551477970446, + "loss": 0.0293, "step": 42080 }, { - "epoch": 0.46, - "learning_rate": 0.0002317474216773691, - "loss": 0.0216, + "epoch": 0.21, + "learning_rate": 0.00026814758010403056, + "loss": 0.0192, "step": 42090 }, { - "epoch": 0.46, - "learning_rate": 0.0002317312058117662, - "loss": 0.0286, + "epoch": 0.21, + "learning_rate": 0.00026814001241101654, + "loss": 0.0228, "step": 42100 }, { - "epoch": 0.46, - "learning_rate": 0.00023171498994616332, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.00026813244471800247, + "loss": 0.0269, "step": 42110 }, { - "epoch": 0.46, - "learning_rate": 0.0002316987740805604, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.0002681248770249885, + "loss": 0.0225, "step": 42120 }, { - "epoch": 0.46, - "learning_rate": 0.00023168255821495748, - "loss": 0.0179, + "epoch": 0.21, + "learning_rate": 0.0002681173093319745, + "loss": 0.024, "step": 42130 }, { - "epoch": 0.46, - "learning_rate": 0.0002316663423493546, - "loss": 0.0186, + "epoch": 0.21, + "learning_rate": 0.00026810974163896047, + "loss": 0.0257, "step": 42140 }, { - "epoch": 0.46, - "learning_rate": 0.0002316501264837517, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.00026810217394594645, + "loss": 0.0231, "step": 42150 }, { - "epoch": 0.46, - "learning_rate": 0.00023163391061814878, - "loss": 0.0201, + "epoch": 0.21, + "learning_rate": 0.00026809460625293243, + "loss": 0.0231, "step": 42160 }, { - "epoch": 0.46, - "learning_rate": 0.00023161769475254585, - "loss": 0.0212, + "epoch": 0.21, + "learning_rate": 0.0002680870385599184, + "loss": 0.0223, "step": 42170 }, { - "epoch": 0.46, - "learning_rate": 0.00023160147888694297, - "loss": 0.0169, - "step": 42180 + "epoch": 0.21, + "learning_rate": 0.00026807947086690445, + "loss": 0.0225, + "step": 42180 }, { - "epoch": 0.46, - "learning_rate": 0.00023158526302134006, - "loss": 0.0245, + "epoch": 0.21, + "learning_rate": 0.00026807190317389043, + "loss": 0.02, "step": 42190 }, { - "epoch": 0.46, - "learning_rate": 0.00023156904715573715, - "loss": 0.0226, + "epoch": 0.21, + "learning_rate": 0.0002680643354808764, + "loss": 0.0242, "step": 42200 }, { - "epoch": 0.46, - "learning_rate": 0.00023155283129013424, - "loss": 0.0248, + "epoch": 0.21, + "learning_rate": 0.0002680567677878624, + "loss": 0.0179, "step": 42210 }, { - "epoch": 0.46, - "learning_rate": 0.00023153661542453134, - "loss": 0.0173, + "epoch": 0.21, + "learning_rate": 0.00026804920009484837, + "loss": 0.0194, "step": 42220 }, { - "epoch": 0.46, - "learning_rate": 0.00023152039955892843, - "loss": 0.0229, + "epoch": 0.21, + "learning_rate": 0.00026804163240183435, + "loss": 0.021, "step": 42230 }, { - "epoch": 0.46, - "learning_rate": 0.00023150418369332555, - "loss": 0.0245, + "epoch": 0.21, + "learning_rate": 0.00026803406470882034, + "loss": 0.018, "step": 42240 }, { - "epoch": 0.46, - "learning_rate": 0.00023148796782772262, - "loss": 0.0199, + "epoch": 0.21, + "learning_rate": 0.00026802649701580637, + "loss": 0.0221, "step": 42250 }, { - "epoch": 0.46, - "learning_rate": 0.0002314717519621197, - "loss": 0.0202, + "epoch": 0.21, + "learning_rate": 0.00026801892932279235, + "loss": 0.0242, "step": 42260 }, { - "epoch": 0.46, - "learning_rate": 0.0002314555360965168, - "loss": 0.0217, + "epoch": 0.21, + "learning_rate": 0.00026801136162977833, + "loss": 0.0258, "step": 42270 }, { - "epoch": 0.46, - "learning_rate": 0.00023143932023091392, - "loss": 0.0171, + "epoch": 0.21, + "learning_rate": 0.0002680037939367643, + "loss": 0.0204, "step": 42280 }, { - "epoch": 0.46, - "learning_rate": 0.00023142310436531099, - "loss": 0.0241, + "epoch": 0.21, + "learning_rate": 0.0002679962262437503, + "loss": 0.023, "step": 42290 }, { - "epoch": 0.46, - "learning_rate": 0.00023140688849970808, - "loss": 0.0201, + "epoch": 0.21, + "learning_rate": 0.0002679886585507363, + "loss": 0.0242, "step": 42300 }, { - "epoch": 0.46, - "learning_rate": 0.0002313906726341052, - "loss": 0.0248, + "epoch": 0.21, + "learning_rate": 0.0002679810908577223, + "loss": 0.0187, "step": 42310 }, { - "epoch": 0.46, - "learning_rate": 0.0002313744567685023, - "loss": 0.0161, + "epoch": 0.21, + "learning_rate": 0.0002679735231647083, + "loss": 0.019, "step": 42320 }, { - "epoch": 0.46, - "learning_rate": 0.00023135824090289936, - "loss": 0.0192, + "epoch": 0.21, + "learning_rate": 0.0002679659554716943, + "loss": 0.0214, "step": 42330 }, { - "epoch": 0.46, - "learning_rate": 0.00023134202503729645, - "loss": 0.02, + "epoch": 0.21, + "learning_rate": 0.00026795838777868026, + "loss": 0.0222, "step": 42340 }, { - "epoch": 0.46, - "learning_rate": 0.00023132580917169357, - "loss": 0.0224, + "epoch": 0.21, + "learning_rate": 0.00026795082008566624, + "loss": 0.0202, "step": 42350 }, { - "epoch": 0.46, - "learning_rate": 0.00023130959330609066, - "loss": 0.0235, + "epoch": 0.21, + "learning_rate": 0.0002679432523926522, + "loss": 0.0223, "step": 42360 }, { - "epoch": 0.46, - "learning_rate": 0.00023129337744048773, - "loss": 0.0214, + "epoch": 0.21, + "learning_rate": 0.00026793568469963826, + "loss": 0.0238, "step": 42370 }, { - "epoch": 0.46, - "learning_rate": 0.00023127716157488485, - "loss": 0.0168, + "epoch": 0.21, + "learning_rate": 0.00026792811700662424, + "loss": 0.0199, "step": 42380 }, { - "epoch": 0.46, - "learning_rate": 0.00023126094570928194, - "loss": 0.0215, + "epoch": 0.21, + "learning_rate": 0.0002679205493136102, + "loss": 0.021, "step": 42390 }, { - "epoch": 0.46, - "learning_rate": 0.00023124472984367903, - "loss": 0.0225, + "epoch": 0.21, + "learning_rate": 0.0002679129816205962, + "loss": 0.0234, "step": 42400 }, { - "epoch": 0.46, - "learning_rate": 0.00023122851397807613, - "loss": 0.0244, + "epoch": 0.21, + "learning_rate": 0.0002679054139275822, + "loss": 0.0234, "step": 42410 }, { - "epoch": 0.46, - "learning_rate": 0.00023121229811247322, - "loss": 0.0203, + "epoch": 0.21, + "learning_rate": 0.00026789784623456816, + "loss": 0.0229, "step": 42420 }, { - "epoch": 0.46, - "learning_rate": 0.0002311960822468703, - "loss": 0.0202, + "epoch": 0.21, + "learning_rate": 0.00026789027854155415, + "loss": 0.0213, "step": 42430 }, { - "epoch": 0.46, - "learning_rate": 0.00023117986638126743, - "loss": 0.019, + "epoch": 0.21, + "learning_rate": 0.0002678827108485402, + "loss": 0.0188, "step": 42440 }, { - "epoch": 0.46, - "learning_rate": 0.00023116365051566452, - "loss": 0.0203, + "epoch": 0.21, + "learning_rate": 0.00026787514315552616, + "loss": 0.0209, "step": 42450 }, { - "epoch": 0.46, - "learning_rate": 0.0002311474346500616, - "loss": 0.0175, + "epoch": 0.21, + "learning_rate": 0.00026786757546251214, + "loss": 0.0246, "step": 42460 }, { - "epoch": 0.46, - "learning_rate": 0.00023113121878445868, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.0002678600077694981, + "loss": 0.0231, "step": 42470 }, { - "epoch": 0.46, - "learning_rate": 0.0002311150029188558, - "loss": 0.0193, + "epoch": 0.21, + "learning_rate": 0.0002678524400764841, + "loss": 0.0214, "step": 42480 }, { - "epoch": 0.46, - "learning_rate": 0.0002310987870532529, - "loss": 0.0216, + "epoch": 0.21, + "learning_rate": 0.0002678448723834701, + "loss": 0.0195, "step": 42490 }, { - "epoch": 0.46, - "learning_rate": 0.00023108257118764996, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.0002678373046904561, + "loss": 0.0219, "step": 42500 }, { - "epoch": 0.46, - "learning_rate": 0.00023106635532204708, - "loss": 0.021, + "epoch": 0.21, + "learning_rate": 0.0002678297369974421, + "loss": 0.0203, "step": 42510 }, { - "epoch": 0.46, - "learning_rate": 0.00023105013945644417, - "loss": 0.0197, + "epoch": 0.21, + "learning_rate": 0.0002678221693044281, + "loss": 0.0226, "step": 42520 }, { - "epoch": 0.46, - "learning_rate": 0.00023103392359084127, - "loss": 0.024, + "epoch": 0.21, + "learning_rate": 0.00026781460161141407, + "loss": 0.0229, "step": 42530 }, { - "epoch": 0.46, - "learning_rate": 0.00023101770772523833, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.00026780703391840005, + "loss": 0.0261, "step": 42540 }, { - "epoch": 0.46, - "learning_rate": 0.00023100149185963545, - "loss": 0.0188, + "epoch": 0.21, + "learning_rate": 0.00026779946622538603, + "loss": 0.0243, "step": 42550 }, { - "epoch": 0.46, - "learning_rate": 0.00023098527599403254, - "loss": 0.0177, + "epoch": 0.21, + "learning_rate": 0.00026779189853237207, + "loss": 0.0204, "step": 42560 }, { - "epoch": 0.46, - "learning_rate": 0.00023096906012842964, - "loss": 0.0234, + "epoch": 0.21, + "learning_rate": 0.00026778433083935805, + "loss": 0.0246, "step": 42570 }, { - "epoch": 0.46, - "learning_rate": 0.00023095284426282673, - "loss": 0.0221, + "epoch": 0.21, + "learning_rate": 0.00026777676314634403, + "loss": 0.0189, "step": 42580 }, { - "epoch": 0.46, - "learning_rate": 0.00023093662839722382, - "loss": 0.0199, + "epoch": 0.21, + "learning_rate": 0.00026776919545333, + "loss": 0.0214, "step": 42590 }, { - "epoch": 0.46, - "learning_rate": 0.00023092041253162092, - "loss": 0.0195, + "epoch": 0.21, + "learning_rate": 0.000267761627760316, + "loss": 0.022, "step": 42600 }, { - "epoch": 0.46, - "learning_rate": 0.00023090419666601804, - "loss": 0.0172, + "epoch": 0.21, + "learning_rate": 0.000267754060067302, + "loss": 0.0232, "step": 42610 }, { - "epoch": 0.46, - "learning_rate": 0.0002308879808004151, - "loss": 0.0201, + "epoch": 0.22, + "learning_rate": 0.00026774649237428796, + "loss": 0.022, "step": 42620 }, { - "epoch": 0.46, - "learning_rate": 0.0002308717649348122, - "loss": 0.0202, + "epoch": 0.22, + "learning_rate": 0.000267738924681274, + "loss": 0.0212, "step": 42630 }, { - "epoch": 0.46, - "learning_rate": 0.00023085554906920931, - "loss": 0.0204, + "epoch": 0.22, + "learning_rate": 0.00026773135698825997, + "loss": 0.0227, "step": 42640 }, { - "epoch": 0.46, - "learning_rate": 0.0002308393332036064, - "loss": 0.0171, + "epoch": 0.22, + "learning_rate": 0.00026772378929524595, + "loss": 0.0223, "step": 42650 }, { - "epoch": 0.46, - "learning_rate": 0.00023082311733800347, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.00026771622160223194, + "loss": 0.022, "step": 42660 }, { - "epoch": 0.46, - "learning_rate": 0.00023080690147240056, - "loss": 0.0221, + "epoch": 0.22, + "learning_rate": 0.0002677086539092179, + "loss": 0.0231, "step": 42670 }, { - "epoch": 0.46, - "learning_rate": 0.00023079068560679768, - "loss": 0.0199, + "epoch": 0.22, + "learning_rate": 0.0002677010862162039, + "loss": 0.0209, "step": 42680 }, { - "epoch": 0.46, - "learning_rate": 0.00023077446974119478, - "loss": 0.0182, + "epoch": 0.22, + "learning_rate": 0.00026769351852318993, + "loss": 0.0256, "step": 42690 }, { - "epoch": 0.46, - "learning_rate": 0.00023075825387559184, - "loss": 0.0213, + "epoch": 0.22, + "learning_rate": 0.0002676859508301759, + "loss": 0.0274, "step": 42700 }, { - "epoch": 0.46, - "learning_rate": 0.00023074203800998896, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.0002676783831371619, + "loss": 0.024, "step": 42710 }, { - "epoch": 0.46, - "learning_rate": 0.00023072582214438606, - "loss": 0.0188, + "epoch": 0.22, + "learning_rate": 0.0002676708154441479, + "loss": 0.0265, "step": 42720 }, { - "epoch": 0.46, - "learning_rate": 0.00023070960627878315, - "loss": 0.0198, + "epoch": 0.22, + "learning_rate": 0.00026766324775113386, + "loss": 0.0192, "step": 42730 }, { - "epoch": 0.46, - "learning_rate": 0.00023069339041318021, - "loss": 0.0178, + "epoch": 0.22, + "learning_rate": 0.00026765568005811984, + "loss": 0.0212, "step": 42740 }, { - "epoch": 0.46, - "learning_rate": 0.00023067717454757733, - "loss": 0.022, + "epoch": 0.22, + "learning_rate": 0.0002676481123651058, + "loss": 0.0235, "step": 42750 }, { - "epoch": 0.46, - "learning_rate": 0.00023066095868197443, + "epoch": 0.22, + "learning_rate": 0.00026764054467209186, "loss": 0.0211, "step": 42760 }, { - "epoch": 0.46, - "learning_rate": 0.00023064474281637152, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.00026763297697907784, + "loss": 0.0212, "step": 42770 }, { - "epoch": 0.46, - "learning_rate": 0.0002306285269507686, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.0002676254092860638, + "loss": 0.022, "step": 42780 }, { - "epoch": 0.46, - "learning_rate": 0.0002306123110851657, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.0002676178415930498, + "loss": 0.0222, "step": 42790 }, { - "epoch": 0.46, - "learning_rate": 0.0002305960952195628, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.0002676102739000358, + "loss": 0.0208, "step": 42800 }, { - "epoch": 0.46, - "learning_rate": 0.00023057987935395992, - "loss": 0.0192, + "epoch": 0.22, + "learning_rate": 0.00026760270620702177, + "loss": 0.0224, "step": 42810 }, { - "epoch": 0.46, - "learning_rate": 0.00023056366348835698, - "loss": 0.0209, + "epoch": 0.22, + "learning_rate": 0.0002675951385140078, + "loss": 0.0195, "step": 42820 }, { - "epoch": 0.46, - "learning_rate": 0.00023054744762275408, - "loss": 0.0247, + "epoch": 0.22, + "learning_rate": 0.0002675875708209938, + "loss": 0.0269, "step": 42830 }, { - "epoch": 0.46, - "learning_rate": 0.00023053123175715117, - "loss": 0.0208, + "epoch": 0.22, + "learning_rate": 0.00026758000312797976, + "loss": 0.0266, "step": 42840 }, { - "epoch": 0.46, - "learning_rate": 0.0002305150158915483, - "loss": 0.0182, + "epoch": 0.22, + "learning_rate": 0.00026757243543496575, + "loss": 0.0244, "step": 42850 }, { - "epoch": 0.46, - "learning_rate": 0.00023049880002594535, - "loss": 0.0174, + "epoch": 0.22, + "learning_rate": 0.00026756486774195173, + "loss": 0.0231, "step": 42860 }, { - "epoch": 0.46, - "learning_rate": 0.00023048258416034245, - "loss": 0.0247, + "epoch": 0.22, + "learning_rate": 0.0002675573000489377, + "loss": 0.0253, "step": 42870 }, { - "epoch": 0.46, - "learning_rate": 0.00023046636829473957, - "loss": 0.0199, + "epoch": 0.22, + "learning_rate": 0.00026754973235592374, + "loss": 0.0207, "step": 42880 }, { - "epoch": 0.46, - "learning_rate": 0.00023045015242913666, - "loss": 0.0228, + "epoch": 0.22, + "learning_rate": 0.0002675421646629097, + "loss": 0.0204, "step": 42890 }, { - "epoch": 0.46, - "learning_rate": 0.00023043393656353372, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.0002675345969698957, + "loss": 0.0212, "step": 42900 }, { - "epoch": 0.46, - "learning_rate": 0.00023041772069793082, - "loss": 0.0169, + "epoch": 0.22, + "learning_rate": 0.0002675270292768817, + "loss": 0.0285, "step": 42910 }, { - "epoch": 0.46, - "learning_rate": 0.00023040150483232794, - "loss": 0.0202, + "epoch": 0.22, + "learning_rate": 0.00026751946158386767, + "loss": 0.0214, "step": 42920 }, { - "epoch": 0.46, - "learning_rate": 0.00023038528896672503, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.00026751189389085365, + "loss": 0.0294, "step": 42930 }, { - "epoch": 0.46, - "learning_rate": 0.0002303690731011221, - "loss": 0.025, + "epoch": 0.22, + "learning_rate": 0.00026750432619783963, + "loss": 0.0213, "step": 42940 }, { - "epoch": 0.46, - "learning_rate": 0.00023035285723551922, - "loss": 0.0205, + "epoch": 0.22, + "learning_rate": 0.00026749675850482567, + "loss": 0.0254, "step": 42950 }, { - "epoch": 0.46, - "learning_rate": 0.0002303366413699163, - "loss": 0.0183, + "epoch": 0.22, + "learning_rate": 0.00026748919081181165, + "loss": 0.0196, "step": 42960 }, { - "epoch": 0.46, - "learning_rate": 0.0002303204255043134, - "loss": 0.0197, + "epoch": 0.22, + "learning_rate": 0.00026748162311879763, + "loss": 0.0287, "step": 42970 }, { - "epoch": 0.46, - "learning_rate": 0.00023030420963871047, - "loss": 0.019, + "epoch": 0.22, + "learning_rate": 0.0002674740554257836, + "loss": 0.0214, "step": 42980 }, { - "epoch": 0.46, - "learning_rate": 0.0002302879937731076, - "loss": 0.0169, + "epoch": 0.22, + "learning_rate": 0.0002674664877327696, + "loss": 0.0244, "step": 42990 }, { - "epoch": 0.46, - "learning_rate": 0.00023027177790750468, - "loss": 0.0202, + "epoch": 0.22, + "learning_rate": 0.0002674589200397556, + "loss": 0.024, "step": 43000 }, { - "epoch": 0.46, - "eval_cer": 0.9215425693622891, - "eval_loss": 0.013244155794382095, - "eval_runtime": 121.8128, - "eval_samples_per_second": 16.419, - "eval_steps_per_second": 4.105, + "epoch": 0.22, + "eval_cer": 0.9144954862024227, + "eval_loss": 0.01679139770567417, + "eval_runtime": 117.1853, + "eval_samples_per_second": 17.067, + "eval_steps_per_second": 4.267, "step": 43000 }, { - "epoch": 0.46, - "learning_rate": 0.0002302555620419018, - "loss": 0.0225, + "epoch": 0.22, + "learning_rate": 0.0002674513523467416, + "loss": 0.0234, "step": 43010 }, { - "epoch": 0.47, - "learning_rate": 0.00023023934617629886, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.0002674437846537276, + "loss": 0.0265, "step": 43020 }, { - "epoch": 0.47, - "learning_rate": 0.00023022313031069596, - "loss": 0.0222, + "epoch": 0.22, + "learning_rate": 0.0002674362169607136, + "loss": 0.0239, "step": 43030 }, { - "epoch": 0.47, - "learning_rate": 0.00023020691444509305, - "loss": 0.0198, + "epoch": 0.22, + "learning_rate": 0.00026742864926769956, + "loss": 0.0224, "step": 43040 }, { - "epoch": 0.47, - "learning_rate": 0.00023019069857949017, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.00026742108157468554, + "loss": 0.0224, "step": 43050 }, { - "epoch": 0.47, - "learning_rate": 0.00023017448271388724, - "loss": 0.0203, + "epoch": 0.22, + "learning_rate": 0.0002674135138816715, + "loss": 0.0209, "step": 43060 }, { - "epoch": 0.47, - "learning_rate": 0.00023015826684828433, - "loss": 0.0183, + "epoch": 0.22, + "learning_rate": 0.00026740594618865755, + "loss": 0.0221, "step": 43070 }, { - "epoch": 0.47, - "learning_rate": 0.00023014205098268145, - "loss": 0.0199, + "epoch": 0.22, + "learning_rate": 0.00026739837849564354, + "loss": 0.0219, "step": 43080 }, { - "epoch": 0.47, - "learning_rate": 0.00023012583511707854, - "loss": 0.0231, + "epoch": 0.22, + "learning_rate": 0.0002673908108026295, + "loss": 0.02, "step": 43090 }, { - "epoch": 0.47, - "learning_rate": 0.0002301096192514756, - "loss": 0.0228, + "epoch": 0.22, + "learning_rate": 0.0002673832431096155, + "loss": 0.0235, "step": 43100 }, { - "epoch": 0.47, - "learning_rate": 0.0002300934033858727, - "loss": 0.0244, + "epoch": 0.22, + "learning_rate": 0.0002673756754166015, + "loss": 0.0226, "step": 43110 }, { - "epoch": 0.47, - "learning_rate": 0.00023007718752026982, - "loss": 0.0183, + "epoch": 0.22, + "learning_rate": 0.00026736810772358746, + "loss": 0.0228, "step": 43120 }, { - "epoch": 0.47, - "learning_rate": 0.0002300609716546669, - "loss": 0.0194, + "epoch": 0.22, + "learning_rate": 0.00026736054003057344, + "loss": 0.0192, "step": 43130 }, { - "epoch": 0.47, - "learning_rate": 0.00023004475578906398, - "loss": 0.0218, + "epoch": 0.22, + "learning_rate": 0.0002673529723375595, + "loss": 0.022, "step": 43140 }, { - "epoch": 0.47, - "learning_rate": 0.0002300285399234611, - "loss": 0.0202, + "epoch": 0.22, + "learning_rate": 0.00026734540464454546, + "loss": 0.0229, "step": 43150 }, { - "epoch": 0.47, - "learning_rate": 0.0002300123240578582, - "loss": 0.0209, + "epoch": 0.22, + "learning_rate": 0.00026733783695153144, + "loss": 0.0224, "step": 43160 }, { - "epoch": 0.47, - "learning_rate": 0.00022999610819225528, - "loss": 0.0208, + "epoch": 0.22, + "learning_rate": 0.0002673302692585174, + "loss": 0.021, "step": 43170 }, { - "epoch": 0.47, - "learning_rate": 0.0002299798923266524, - "loss": 0.0192, + "epoch": 0.22, + "learning_rate": 0.0002673227015655034, + "loss": 0.025, "step": 43180 }, { - "epoch": 0.47, - "learning_rate": 0.00022996367646104947, - "loss": 0.0202, + "epoch": 0.22, + "learning_rate": 0.0002673151338724894, + "loss": 0.0229, "step": 43190 }, { - "epoch": 0.47, - "learning_rate": 0.00022994746059544656, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.0002673075661794754, + "loss": 0.0237, "step": 43200 }, { - "epoch": 0.47, - "learning_rate": 0.00022993124472984365, - "loss": 0.0182, + "epoch": 0.22, + "learning_rate": 0.0002672999984864614, + "loss": 0.0209, "step": 43210 }, { - "epoch": 0.47, - "learning_rate": 0.00022991502886424077, - "loss": 0.0226, + "epoch": 0.22, + "learning_rate": 0.0002672924307934474, + "loss": 0.021, "step": 43220 }, { - "epoch": 0.47, - "learning_rate": 0.00022989881299863784, - "loss": 0.0189, + "epoch": 0.22, + "learning_rate": 0.00026728486310043337, + "loss": 0.0237, "step": 43230 }, { - "epoch": 0.47, - "learning_rate": 0.00022988259713303493, - "loss": 0.02, + "epoch": 0.22, + "learning_rate": 0.00026727729540741935, + "loss": 0.0241, "step": 43240 }, { - "epoch": 0.47, - "learning_rate": 0.00022986638126743205, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.00026726972771440533, + "loss": 0.0254, "step": 43250 }, { - "epoch": 0.47, - "learning_rate": 0.00022985016540182914, - "loss": 0.0203, + "epoch": 0.22, + "learning_rate": 0.0002672621600213913, + "loss": 0.0236, "step": 43260 }, { - "epoch": 0.47, - "learning_rate": 0.0002298339495362262, - "loss": 0.0205, + "epoch": 0.22, + "learning_rate": 0.00026725459232837735, + "loss": 0.0281, "step": 43270 }, { - "epoch": 0.47, - "learning_rate": 0.0002298177336706233, - "loss": 0.0197, + "epoch": 0.22, + "learning_rate": 0.00026724702463536333, + "loss": 0.023, "step": 43280 }, { - "epoch": 0.47, - "learning_rate": 0.00022980151780502042, - "loss": 0.0204, + "epoch": 0.22, + "learning_rate": 0.0002672394569423493, + "loss": 0.023, "step": 43290 }, { - "epoch": 0.47, - "learning_rate": 0.00022978530193941752, - "loss": 0.0256, + "epoch": 0.22, + "learning_rate": 0.0002672318892493353, + "loss": 0.0235, "step": 43300 }, { - "epoch": 0.47, - "learning_rate": 0.00022976908607381458, - "loss": 0.0214, + "epoch": 0.22, + "learning_rate": 0.00026722432155632127, + "loss": 0.0212, "step": 43310 }, { - "epoch": 0.47, - "learning_rate": 0.0002297528702082117, - "loss": 0.0182, + "epoch": 0.22, + "learning_rate": 0.00026721675386330725, + "loss": 0.0237, "step": 43320 }, { - "epoch": 0.47, - "learning_rate": 0.0002297366543426088, - "loss": 0.0181, + "epoch": 0.22, + "learning_rate": 0.0002672091861702933, + "loss": 0.0194, "step": 43330 }, { - "epoch": 0.47, - "learning_rate": 0.0002297204384770059, - "loss": 0.0207, + "epoch": 0.22, + "learning_rate": 0.00026720161847727927, + "loss": 0.0216, "step": 43340 }, { - "epoch": 0.47, - "learning_rate": 0.00022970422261140295, - "loss": 0.0183, + "epoch": 0.22, + "learning_rate": 0.00026719405078426525, + "loss": 0.0227, "step": 43350 }, { - "epoch": 0.47, - "learning_rate": 0.00022968800674580007, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.00026718648309125123, + "loss": 0.0219, "step": 43360 }, { - "epoch": 0.47, - "learning_rate": 0.00022967179088019717, - "loss": 0.0168, + "epoch": 0.22, + "learning_rate": 0.0002671789153982372, + "loss": 0.0226, "step": 43370 }, { - "epoch": 0.47, - "learning_rate": 0.00022965557501459429, - "loss": 0.0167, + "epoch": 0.22, + "learning_rate": 0.0002671713477052232, + "loss": 0.0236, "step": 43380 }, { - "epoch": 0.47, - "learning_rate": 0.00022963935914899135, - "loss": 0.0237, + "epoch": 0.22, + "learning_rate": 0.0002671637800122092, + "loss": 0.0223, "step": 43390 }, { - "epoch": 0.47, - "learning_rate": 0.00022962314328338844, - "loss": 0.0192, + "epoch": 0.22, + "learning_rate": 0.00026715621231919516, + "loss": 0.0216, "step": 43400 }, { - "epoch": 0.47, - "learning_rate": 0.00022960692741778554, - "loss": 0.0178, + "epoch": 0.22, + "learning_rate": 0.00026714864462618114, + "loss": 0.0199, "step": 43410 }, { - "epoch": 0.47, - "learning_rate": 0.00022959071155218266, - "loss": 0.0197, + "epoch": 0.22, + "learning_rate": 0.0002671410769331671, + "loss": 0.0257, "step": 43420 }, { - "epoch": 0.47, - "learning_rate": 0.00022957449568657972, - "loss": 0.0192, + "epoch": 0.22, + "learning_rate": 0.00026713350924015316, + "loss": 0.0252, "step": 43430 }, { - "epoch": 0.47, - "learning_rate": 0.00022955827982097681, - "loss": 0.018, + "epoch": 0.22, + "learning_rate": 0.00026712594154713914, + "loss": 0.023, "step": 43440 }, { - "epoch": 0.47, - "learning_rate": 0.00022954206395537393, - "loss": 0.0187, + "epoch": 0.22, + "learning_rate": 0.0002671183738541251, + "loss": 0.0199, "step": 43450 }, { - "epoch": 0.47, - "learning_rate": 0.00022952584808977103, - "loss": 0.0201, + "epoch": 0.22, + "learning_rate": 0.0002671108061611111, + "loss": 0.0217, "step": 43460 }, { - "epoch": 0.47, - "learning_rate": 0.0002295096322241681, - "loss": 0.0164, + "epoch": 0.22, + "learning_rate": 0.0002671032384680971, + "loss": 0.0195, "step": 43470 }, { - "epoch": 0.47, - "learning_rate": 0.00022949341635856519, - "loss": 0.0255, + "epoch": 0.22, + "learning_rate": 0.00026709567077508306, + "loss": 0.0232, "step": 43480 }, { - "epoch": 0.47, - "learning_rate": 0.0002294772004929623, - "loss": 0.0187, + "epoch": 0.22, + "learning_rate": 0.00026708810308206905, + "loss": 0.0198, "step": 43490 }, { - "epoch": 0.47, - "learning_rate": 0.0002294609846273594, - "loss": 0.0187, + "epoch": 0.22, + "learning_rate": 0.0002670805353890551, + "loss": 0.0285, "step": 43500 }, { - "epoch": 0.47, - "learning_rate": 0.00022944476876175646, - "loss": 0.0181, + "epoch": 0.22, + "learning_rate": 0.00026707296769604106, + "loss": 0.0255, "step": 43510 }, { - "epoch": 0.47, - "learning_rate": 0.00022942855289615358, - "loss": 0.0193, + "epoch": 0.22, + "learning_rate": 0.00026706540000302704, + "loss": 0.0238, "step": 43520 }, { - "epoch": 0.47, - "learning_rate": 0.00022941233703055068, - "loss": 0.0188, + "epoch": 0.22, + "learning_rate": 0.000267057832310013, + "loss": 0.022, "step": 43530 }, { - "epoch": 0.47, - "learning_rate": 0.00022939612116494777, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.000267050264616999, + "loss": 0.0227, "step": 43540 }, { - "epoch": 0.47, - "learning_rate": 0.00022937990529934483, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.000267042696923985, + "loss": 0.0226, "step": 43550 }, { - "epoch": 0.47, - "learning_rate": 0.00022936368943374195, - "loss": 0.018, + "epoch": 0.22, + "learning_rate": 0.000267035129230971, + "loss": 0.0207, "step": 43560 }, { - "epoch": 0.47, - "learning_rate": 0.00022934747356813905, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.000267027561537957, + "loss": 0.0234, "step": 43570 }, { - "epoch": 0.47, - "learning_rate": 0.00022933125770253614, - "loss": 0.0167, + "epoch": 0.22, + "learning_rate": 0.000267019993844943, + "loss": 0.0204, "step": 43580 }, { - "epoch": 0.47, - "learning_rate": 0.00022931504183693323, - "loss": 0.0161, + "epoch": 0.22, + "learning_rate": 0.00026701242615192897, + "loss": 0.0212, "step": 43590 }, { - "epoch": 0.47, - "learning_rate": 0.00022929882597133033, - "loss": 0.0156, + "epoch": 0.22, + "learning_rate": 0.00026700485845891495, + "loss": 0.022, "step": 43600 }, { - "epoch": 0.47, - "learning_rate": 0.00022928261010572742, - "loss": 0.0164, + "epoch": 0.22, + "learning_rate": 0.00026699729076590093, + "loss": 0.0504, "step": 43610 }, { - "epoch": 0.47, - "learning_rate": 0.00022926639424012454, - "loss": 0.0177, + "epoch": 0.22, + "learning_rate": 0.00026698972307288697, + "loss": 0.0199, "step": 43620 }, { - "epoch": 0.47, - "learning_rate": 0.0002292501783745216, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.00026698215537987295, + "loss": 0.0281, "step": 43630 }, { - "epoch": 0.47, - "learning_rate": 0.0002292339625089187, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.00026697458768685893, + "loss": 0.0217, "step": 43640 }, { - "epoch": 0.47, - "learning_rate": 0.00022921774664331582, - "loss": 0.0275, + "epoch": 0.22, + "learning_rate": 0.0002669670199938449, + "loss": 0.0236, "step": 43650 }, { - "epoch": 0.47, - "learning_rate": 0.0002292015307777129, - "loss": 0.0258, + "epoch": 0.22, + "learning_rate": 0.0002669594523008309, + "loss": 0.0211, "step": 43660 }, { - "epoch": 0.47, - "learning_rate": 0.00022918531491210997, - "loss": 0.0386, + "epoch": 0.22, + "learning_rate": 0.0002669518846078169, + "loss": 0.0208, "step": 43670 }, { - "epoch": 0.47, - "learning_rate": 0.00022916909904650707, - "loss": 0.0334, + "epoch": 0.22, + "learning_rate": 0.00026694431691480286, + "loss": 0.0253, "step": 43680 }, { - "epoch": 0.47, - "learning_rate": 0.0002291528831809042, - "loss": 0.0205, + "epoch": 0.22, + "learning_rate": 0.0002669367492217889, + "loss": 0.0202, "step": 43690 }, { - "epoch": 0.47, - "learning_rate": 0.00022913666731530128, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.0002669291815287749, + "loss": 0.0228, "step": 43700 }, { - "epoch": 0.47, - "learning_rate": 0.00022912045144969835, - "loss": 0.0203, + "epoch": 0.22, + "learning_rate": 0.00026692161383576085, + "loss": 0.0259, "step": 43710 }, { - "epoch": 0.47, - "learning_rate": 0.00022910423558409547, - "loss": 0.0175, + "epoch": 0.22, + "learning_rate": 0.00026691404614274684, + "loss": 0.0252, "step": 43720 }, { - "epoch": 0.47, - "learning_rate": 0.00022908801971849256, - "loss": 0.0232, + "epoch": 0.22, + "learning_rate": 0.0002669064784497328, + "loss": 0.0236, "step": 43730 }, { - "epoch": 0.47, - "learning_rate": 0.00022907180385288965, - "loss": 0.0187, + "epoch": 0.22, + "learning_rate": 0.0002668989107567188, + "loss": 0.0253, "step": 43740 }, { - "epoch": 0.47, - "learning_rate": 0.00022905558798728672, - "loss": 0.0187, + "epoch": 0.22, + "learning_rate": 0.00026689134306370483, + "loss": 0.0205, "step": 43750 }, { - "epoch": 0.47, - "learning_rate": 0.00022903937212168384, - "loss": 0.0142, + "epoch": 0.22, + "learning_rate": 0.0002668837753706908, + "loss": 0.0192, "step": 43760 }, { - "epoch": 0.47, - "learning_rate": 0.00022902315625608093, - "loss": 0.0209, + "epoch": 0.22, + "learning_rate": 0.0002668762076776768, + "loss": 0.0189, "step": 43770 }, { - "epoch": 0.47, - "learning_rate": 0.00022900694039047802, - "loss": 0.0231, + "epoch": 0.22, + "learning_rate": 0.0002668686399846628, + "loss": 0.0208, "step": 43780 }, { - "epoch": 0.47, - "learning_rate": 0.00022899072452487511, - "loss": 0.0214, + "epoch": 0.22, + "learning_rate": 0.00026686107229164876, + "loss": 0.021, "step": 43790 }, { - "epoch": 0.47, - "learning_rate": 0.0002289745086592722, - "loss": 0.0171, + "epoch": 0.22, + "learning_rate": 0.00026685350459863474, + "loss": 0.0204, "step": 43800 }, { - "epoch": 0.47, - "learning_rate": 0.0002289582927936693, - "loss": 0.0223, + "epoch": 0.22, + "learning_rate": 0.0002668459369056207, + "loss": 0.021, "step": 43810 }, { - "epoch": 0.47, - "learning_rate": 0.00022894207692806642, - "loss": 0.022, + "epoch": 0.22, + "learning_rate": 0.00026683836921260676, + "loss": 0.0225, "step": 43820 }, { - "epoch": 0.47, - "learning_rate": 0.00022892586106246349, - "loss": 0.0252, + "epoch": 0.22, + "learning_rate": 0.00026683080151959274, + "loss": 0.0263, "step": 43830 }, { - "epoch": 0.47, - "learning_rate": 0.00022890964519686058, - "loss": 0.0202, + "epoch": 0.22, + "learning_rate": 0.0002668232338265787, + "loss": 0.0205, "step": 43840 }, { - "epoch": 0.47, - "learning_rate": 0.00022889342933125767, - "loss": 0.0213, + "epoch": 0.22, + "learning_rate": 0.0002668156661335647, + "loss": 0.0266, "step": 43850 }, { - "epoch": 0.47, - "learning_rate": 0.0002288772134656548, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.0002668080984405507, + "loss": 0.0246, "step": 43860 }, { - "epoch": 0.47, - "learning_rate": 0.00022886099760005186, - "loss": 0.0249, + "epoch": 0.22, + "learning_rate": 0.00026680053074753667, + "loss": 0.023, "step": 43870 }, { - "epoch": 0.47, - "learning_rate": 0.00022884478173444895, - "loss": 0.019, + "epoch": 0.22, + "learning_rate": 0.0002667929630545227, + "loss": 0.0242, "step": 43880 }, { - "epoch": 0.47, - "learning_rate": 0.00022882856586884607, - "loss": 0.0218, + "epoch": 0.22, + "learning_rate": 0.0002667853953615087, + "loss": 0.0225, "step": 43890 }, { - "epoch": 0.47, - "learning_rate": 0.00022881235000324316, - "loss": 0.0225, + "epoch": 0.22, + "learning_rate": 0.00026677782766849466, + "loss": 0.0233, "step": 43900 }, { - "epoch": 0.47, - "learning_rate": 0.00022879613413764025, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.00026677025997548065, + "loss": 0.0208, "step": 43910 }, { - "epoch": 0.47, - "learning_rate": 0.00022877991827203732, - "loss": 0.0228, + "epoch": 0.22, + "learning_rate": 0.00026676269228246663, + "loss": 0.0248, "step": 43920 }, { - "epoch": 0.47, - "learning_rate": 0.00022876370240643444, - "loss": 0.0191, + "epoch": 0.22, + "learning_rate": 0.0002667551245894526, + "loss": 0.0218, "step": 43930 }, { - "epoch": 0.48, - "learning_rate": 0.00022874748654083153, + "epoch": 0.22, + "learning_rate": 0.00026674755689643864, "loss": 0.02, "step": 43940 }, { - "epoch": 0.48, - "learning_rate": 0.00022873127067522865, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.0002667399892034246, + "loss": 0.0161, "step": 43950 }, { - "epoch": 0.48, - "learning_rate": 0.00022871505480962572, - "loss": 0.0217, + "epoch": 0.22, + "learning_rate": 0.0002667324215104106, + "loss": 0.0226, "step": 43960 }, { - "epoch": 0.48, - "learning_rate": 0.0002286988389440228, - "loss": 0.0395, + "epoch": 0.22, + "learning_rate": 0.0002667248538173966, + "loss": 0.0182, "step": 43970 }, { - "epoch": 0.48, - "learning_rate": 0.0002286826230784199, - "loss": 0.0245, + "epoch": 0.22, + "learning_rate": 0.00026671728612438257, + "loss": 0.0228, "step": 43980 }, { - "epoch": 0.48, - "learning_rate": 0.00022866640721281702, - "loss": 0.0205, + "epoch": 0.22, + "learning_rate": 0.00026670971843136855, + "loss": 0.0189, "step": 43990 }, { - "epoch": 0.48, - "learning_rate": 0.0002286501913472141, - "loss": 0.0219, + "epoch": 0.22, + "learning_rate": 0.00026670215073835453, + "loss": 0.0206, "step": 44000 }, { - "epoch": 0.48, - "eval_cer": 0.9215529925977656, - "eval_loss": 0.0145536158233881, - "eval_runtime": 121.7531, - "eval_samples_per_second": 16.427, - "eval_steps_per_second": 4.107, + "epoch": 0.22, + "eval_cer": 0.914452788772905, + "eval_loss": 0.01625337265431881, + "eval_runtime": 117.269, + "eval_samples_per_second": 17.055, + "eval_steps_per_second": 4.264, "step": 44000 }, { - "epoch": 0.48, - "learning_rate": 0.00022863397548161118, - "loss": 0.0175, + "epoch": 0.22, + "learning_rate": 0.00026669458304534057, + "loss": 0.0252, "step": 44010 }, { - "epoch": 0.48, - "learning_rate": 0.0002286177596160083, - "loss": 0.0204, + "epoch": 0.22, + "learning_rate": 0.00026668701535232655, + "loss": 0.026, "step": 44020 }, { - "epoch": 0.48, - "learning_rate": 0.0002286015437504054, - "loss": 0.0216, + "epoch": 0.22, + "learning_rate": 0.00026667944765931253, + "loss": 0.0212, "step": 44030 }, { - "epoch": 0.48, - "learning_rate": 0.00022858532788480246, - "loss": 0.023, + "epoch": 0.22, + "learning_rate": 0.0002666718799662985, + "loss": 0.0205, "step": 44040 }, { - "epoch": 0.48, - "learning_rate": 0.00022856911201919955, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.0002666643122732845, + "loss": 0.0271, "step": 44050 }, { - "epoch": 0.48, - "learning_rate": 0.00022855289615359667, - "loss": 0.018, + "epoch": 0.22, + "learning_rate": 0.0002666567445802705, + "loss": 0.0234, "step": 44060 }, { - "epoch": 0.48, - "learning_rate": 0.00022853668028799377, - "loss": 0.0216, + "epoch": 0.22, + "learning_rate": 0.0002666491768872565, + "loss": 0.0242, "step": 44070 }, { - "epoch": 0.48, - "learning_rate": 0.00022852046442239083, - "loss": 0.0212, + "epoch": 0.22, + "learning_rate": 0.0002666416091942425, + "loss": 0.0203, "step": 44080 }, { - "epoch": 0.48, - "learning_rate": 0.00022850424855678795, - "loss": 0.0205, + "epoch": 0.22, + "learning_rate": 0.0002666340415012285, + "loss": 0.0196, "step": 44090 }, { - "epoch": 0.48, - "learning_rate": 0.00022848803269118504, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.00026662647380821446, + "loss": 0.0214, "step": 44100 }, { - "epoch": 0.48, - "learning_rate": 0.00022847181682558214, - "loss": 0.0229, + "epoch": 0.22, + "learning_rate": 0.00026661890611520044, + "loss": 0.0276, "step": 44110 }, { - "epoch": 0.48, - "learning_rate": 0.0002284556009599792, - "loss": 0.0218, + "epoch": 0.22, + "learning_rate": 0.0002666113384221864, + "loss": 0.0215, "step": 44120 }, { - "epoch": 0.48, - "learning_rate": 0.00022843938509437632, - "loss": 0.0147, + "epoch": 0.22, + "learning_rate": 0.00026660377072917245, + "loss": 0.0233, "step": 44130 }, { - "epoch": 0.48, - "learning_rate": 0.00022842316922877341, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.00026659620303615844, + "loss": 0.0246, "step": 44140 }, { - "epoch": 0.48, - "learning_rate": 0.0002284069533631705, - "loss": 0.0221, + "epoch": 0.22, + "learning_rate": 0.0002665886353431444, + "loss": 0.0191, "step": 44150 }, { - "epoch": 0.48, - "learning_rate": 0.0002283907374975676, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.0002665810676501304, + "loss": 0.0241, "step": 44160 }, { - "epoch": 0.48, - "learning_rate": 0.0002283745216319647, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.0002665734999571164, + "loss": 0.0196, "step": 44170 }, { - "epoch": 0.48, - "learning_rate": 0.00022835830576636179, - "loss": 0.02, + "epoch": 0.22, + "learning_rate": 0.00026656593226410236, + "loss": 0.0297, "step": 44180 }, { - "epoch": 0.48, - "learning_rate": 0.0002283420899007589, - "loss": 0.0192, + "epoch": 0.22, + "learning_rate": 0.00026655836457108834, + "loss": 0.0272, "step": 44190 }, { - "epoch": 0.48, - "learning_rate": 0.00022832587403515597, - "loss": 0.0208, + "epoch": 0.22, + "learning_rate": 0.0002665507968780744, + "loss": 0.0298, "step": 44200 }, { - "epoch": 0.48, - "learning_rate": 0.00022830965816955306, - "loss": 0.0195, + "epoch": 0.22, + "learning_rate": 0.00026654322918506036, + "loss": 0.0241, "step": 44210 }, { - "epoch": 0.48, - "learning_rate": 0.00022829344230395016, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.00026653566149204634, + "loss": 0.0249, "step": 44220 }, { - "epoch": 0.48, - "learning_rate": 0.00022827722643834728, - "loss": 0.0191, + "epoch": 0.22, + "learning_rate": 0.0002665280937990323, + "loss": 0.0265, "step": 44230 }, { - "epoch": 0.48, - "learning_rate": 0.00022826101057274434, - "loss": 0.0192, + "epoch": 0.22, + "learning_rate": 0.0002665205261060183, + "loss": 0.021, "step": 44240 }, { - "epoch": 0.48, - "learning_rate": 0.00022824479470714144, - "loss": 0.0199, + "epoch": 0.22, + "learning_rate": 0.0002665129584130043, + "loss": 0.0226, "step": 44250 }, { - "epoch": 0.48, - "learning_rate": 0.00022822857884153855, - "loss": 0.0211, + "epoch": 0.22, + "learning_rate": 0.0002665053907199903, + "loss": 0.023, "step": 44260 }, { - "epoch": 0.48, - "learning_rate": 0.00022821236297593565, - "loss": 0.0216, + "epoch": 0.22, + "learning_rate": 0.0002664978230269763, + "loss": 0.0364, "step": 44270 }, { - "epoch": 0.48, - "learning_rate": 0.0002281961471103327, - "loss": 0.0196, + "epoch": 0.22, + "learning_rate": 0.0002664902553339623, + "loss": 0.0259, "step": 44280 }, { - "epoch": 0.48, - "learning_rate": 0.0002281799312447298, - "loss": 0.0202, + "epoch": 0.22, + "learning_rate": 0.00026648268764094827, + "loss": 0.0238, "step": 44290 }, { - "epoch": 0.48, - "learning_rate": 0.00022816371537912693, - "loss": 0.0211, + "epoch": 0.22, + "learning_rate": 0.00026647511994793425, + "loss": 0.0234, "step": 44300 }, { - "epoch": 0.48, - "learning_rate": 0.00022814749951352402, - "loss": 0.0241, + "epoch": 0.22, + "learning_rate": 0.00026646755225492023, + "loss": 0.0217, "step": 44310 }, { - "epoch": 0.48, - "learning_rate": 0.00022813128364792108, - "loss": 0.0193, + "epoch": 0.22, + "learning_rate": 0.0002664599845619062, + "loss": 0.0233, "step": 44320 }, { - "epoch": 0.48, - "learning_rate": 0.0002281150677823182, - "loss": 0.0216, + "epoch": 0.22, + "learning_rate": 0.00026645241686889225, + "loss": 0.023, "step": 44330 }, { - "epoch": 0.48, - "learning_rate": 0.0002280988519167153, - "loss": 0.0201, + "epoch": 0.22, + "learning_rate": 0.00026644484917587823, + "loss": 0.0219, "step": 44340 }, { - "epoch": 0.48, - "learning_rate": 0.0002280826360511124, - "loss": 0.024, + "epoch": 0.22, + "learning_rate": 0.0002664372814828642, + "loss": 0.0251, "step": 44350 }, { - "epoch": 0.48, - "learning_rate": 0.00022806642018550946, - "loss": 0.021, + "epoch": 0.22, + "learning_rate": 0.0002664297137898502, + "loss": 0.0248, "step": 44360 }, { - "epoch": 0.48, - "learning_rate": 0.00022805020431990658, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.00026642214609683617, + "loss": 0.023, "step": 44370 }, { - "epoch": 0.48, - "learning_rate": 0.00022803398845430367, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.00026641457840382215, + "loss": 0.0293, "step": 44380 }, { - "epoch": 0.48, - "learning_rate": 0.0002280177725887008, - "loss": 0.0221, + "epoch": 0.22, + "learning_rate": 0.0002664070107108082, + "loss": 0.0262, "step": 44390 }, { - "epoch": 0.48, - "learning_rate": 0.00022800155672309785, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.00026639944301779417, + "loss": 0.0255, "step": 44400 }, { - "epoch": 0.48, - "learning_rate": 0.00022798534085749495, - "loss": 0.0195, + "epoch": 0.22, + "learning_rate": 0.00026639187532478015, + "loss": 0.024, "step": 44410 }, { - "epoch": 0.48, - "learning_rate": 0.00022796912499189204, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.00026638430763176613, + "loss": 0.0228, "step": 44420 }, { - "epoch": 0.48, - "learning_rate": 0.00022795290912628916, - "loss": 0.0198, + "epoch": 0.22, + "learning_rate": 0.0002663767399387521, + "loss": 0.0215, "step": 44430 }, { - "epoch": 0.48, - "learning_rate": 0.00022793669326068622, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.0002663691722457381, + "loss": 0.0208, "step": 44440 }, { - "epoch": 0.48, - "learning_rate": 0.00022792047739508332, - "loss": 0.0195, + "epoch": 0.22, + "learning_rate": 0.00026636160455272413, + "loss": 0.0209, "step": 44450 }, { - "epoch": 0.48, - "learning_rate": 0.00022790426152948044, - "loss": 0.0159, + "epoch": 0.22, + "learning_rate": 0.0002663540368597101, + "loss": 0.0235, "step": 44460 }, { - "epoch": 0.48, - "learning_rate": 0.00022788804566387753, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.0002663464691666961, + "loss": 0.026, "step": 44470 }, { - "epoch": 0.48, - "learning_rate": 0.0002278718297982746, - "loss": 0.0195, + "epoch": 0.22, + "learning_rate": 0.0002663389014736821, + "loss": 0.0173, "step": 44480 }, { - "epoch": 0.48, - "learning_rate": 0.0002278556139326717, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.00026633133378066806, + "loss": 0.0225, "step": 44490 }, { - "epoch": 0.48, - "learning_rate": 0.0002278393980670688, - "loss": 0.0205, + "epoch": 0.22, + "learning_rate": 0.00026632376608765404, + "loss": 0.0256, "step": 44500 }, { - "epoch": 0.48, - "learning_rate": 0.0002278231822014659, - "loss": 0.0163, + "epoch": 0.22, + "learning_rate": 0.00026631619839464, + "loss": 0.0221, "step": 44510 }, { - "epoch": 0.48, - "learning_rate": 0.00022780696633586297, - "loss": 0.0203, + "epoch": 0.22, + "learning_rate": 0.00026630863070162606, + "loss": 0.0248, "step": 44520 }, { - "epoch": 0.48, - "learning_rate": 0.00022779075047026009, - "loss": 0.0207, + "epoch": 0.22, + "learning_rate": 0.00026630106300861204, + "loss": 0.0199, "step": 44530 }, { - "epoch": 0.48, - "learning_rate": 0.00022777453460465718, - "loss": 0.0196, + "epoch": 0.22, + "learning_rate": 0.000266293495315598, + "loss": 0.0219, "step": 44540 }, { - "epoch": 0.48, - "learning_rate": 0.00022775831873905427, - "loss": 0.0209, + "epoch": 0.22, + "learning_rate": 0.000266285927622584, + "loss": 0.0223, "step": 44550 }, { - "epoch": 0.48, - "learning_rate": 0.00022774210287345134, - "loss": 0.0239, + "epoch": 0.22, + "learning_rate": 0.00026627835992957, + "loss": 0.0214, "step": 44560 }, { - "epoch": 0.48, - "learning_rate": 0.00022772588700784846, - "loss": 0.0177, + "epoch": 0.22, + "learning_rate": 0.00026627079223655596, + "loss": 0.027, "step": 44570 }, { - "epoch": 0.48, - "learning_rate": 0.00022770967114224555, - "loss": 0.0194, + "epoch": 0.22, + "learning_rate": 0.000266263224543542, + "loss": 0.0207, "step": 44580 }, { - "epoch": 0.48, - "learning_rate": 0.00022769345527664264, - "loss": 0.0195, + "epoch": 0.22, + "learning_rate": 0.000266255656850528, + "loss": 0.0189, "step": 44590 }, { - "epoch": 0.48, - "learning_rate": 0.00022767723941103976, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.00026624808915751396, + "loss": 0.0237, "step": 44600 }, { - "epoch": 0.48, - "learning_rate": 0.00022766102354543683, - "loss": 0.019, + "epoch": 0.23, + "learning_rate": 0.00026624052146449994, + "loss": 0.0242, "step": 44610 }, { - "epoch": 0.48, - "learning_rate": 0.00022764480767983392, - "loss": 0.0165, + "epoch": 0.23, + "learning_rate": 0.0002662329537714859, + "loss": 0.0203, "step": 44620 }, { - "epoch": 0.48, - "learning_rate": 0.00022762859181423104, - "loss": 0.02, + "epoch": 0.23, + "learning_rate": 0.0002662253860784719, + "loss": 0.025, "step": 44630 }, { - "epoch": 0.48, - "learning_rate": 0.00022761237594862813, - "loss": 0.0192, + "epoch": 0.23, + "learning_rate": 0.0002662178183854579, + "loss": 0.0227, "step": 44640 }, { - "epoch": 0.48, - "learning_rate": 0.0002275961600830252, - "loss": 0.0193, + "epoch": 0.23, + "learning_rate": 0.00026621025069244387, + "loss": 0.0208, "step": 44650 }, { - "epoch": 0.48, - "learning_rate": 0.00022757994421742232, - "loss": 0.0187, + "epoch": 0.23, + "learning_rate": 0.00026620268299942985, + "loss": 0.0214, "step": 44660 }, { - "epoch": 0.48, - "learning_rate": 0.0002275637283518194, - "loss": 0.0177, + "epoch": 0.23, + "learning_rate": 0.00026619511530641583, + "loss": 0.0225, "step": 44670 }, { - "epoch": 0.48, - "learning_rate": 0.0002275475124862165, - "loss": 0.0201, + "epoch": 0.23, + "learning_rate": 0.00026618754761340187, + "loss": 0.0193, "step": 44680 }, { - "epoch": 0.48, - "learning_rate": 0.00022753129662061357, - "loss": 0.0209, + "epoch": 0.23, + "learning_rate": 0.00026617997992038785, + "loss": 0.0233, "step": 44690 }, { - "epoch": 0.48, - "learning_rate": 0.0002275150807550107, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.00026617241222737383, + "loss": 0.0205, "step": 44700 }, { - "epoch": 0.48, - "learning_rate": 0.00022749886488940778, - "loss": 0.023, + "epoch": 0.23, + "learning_rate": 0.0002661648445343598, + "loss": 0.0236, "step": 44710 }, { - "epoch": 0.48, - "learning_rate": 0.00022748264902380488, - "loss": 0.0199, + "epoch": 0.23, + "learning_rate": 0.0002661572768413458, + "loss": 0.0216, "step": 44720 }, { - "epoch": 0.48, - "learning_rate": 0.00022746643315820197, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002661497091483318, + "loss": 0.0232, "step": 44730 }, { - "epoch": 0.48, - "learning_rate": 0.00022745021729259906, - "loss": 0.0214, + "epoch": 0.23, + "learning_rate": 0.00026614214145531776, + "loss": 0.0252, "step": 44740 }, { - "epoch": 0.48, - "learning_rate": 0.00022743400142699615, - "loss": 0.0187, + "epoch": 0.23, + "learning_rate": 0.0002661345737623038, + "loss": 0.0228, "step": 44750 }, { - "epoch": 0.48, - "learning_rate": 0.00022741778556139327, - "loss": 0.0157, + "epoch": 0.23, + "learning_rate": 0.0002661270060692898, + "loss": 0.0239, "step": 44760 }, { - "epoch": 0.48, - "learning_rate": 0.00022740156969579034, - "loss": 0.0204, + "epoch": 0.23, + "learning_rate": 0.00026611943837627575, + "loss": 0.0185, "step": 44770 }, { - "epoch": 0.48, - "learning_rate": 0.00022738535383018743, - "loss": 0.0212, + "epoch": 0.23, + "learning_rate": 0.00026611187068326174, + "loss": 0.0217, "step": 44780 }, { - "epoch": 0.48, - "learning_rate": 0.00022736913796458452, - "loss": 0.0212, + "epoch": 0.23, + "learning_rate": 0.0002661043029902477, + "loss": 0.0229, "step": 44790 }, { - "epoch": 0.48, - "learning_rate": 0.00022735292209898164, - "loss": 0.0196, + "epoch": 0.23, + "learning_rate": 0.0002660967352972337, + "loss": 0.0223, "step": 44800 }, { - "epoch": 0.48, - "learning_rate": 0.0002273367062333787, - "loss": 0.0191, + "epoch": 0.23, + "learning_rate": 0.00026608916760421973, + "loss": 0.0278, "step": 44810 }, { - "epoch": 0.48, - "learning_rate": 0.0002273204903677758, - "loss": 0.0232, + "epoch": 0.23, + "learning_rate": 0.0002660815999112057, + "loss": 0.0196, "step": 44820 }, { - "epoch": 0.48, - "learning_rate": 0.00022730427450217292, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.0002660740322181917, + "loss": 0.0175, "step": 44830 }, { - "epoch": 0.48, - "learning_rate": 0.00022728805863657002, - "loss": 0.0199, + "epoch": 0.23, + "learning_rate": 0.0002660664645251777, + "loss": 0.0179, "step": 44840 }, { - "epoch": 0.48, - "learning_rate": 0.00022727184277096708, - "loss": 0.0162, + "epoch": 0.23, + "learning_rate": 0.00026605889683216366, + "loss": 0.0223, "step": 44850 }, { - "epoch": 0.48, - "learning_rate": 0.00022725562690536417, - "loss": 0.0215, + "epoch": 0.23, + "learning_rate": 0.00026605132913914964, + "loss": 0.0259, "step": 44860 }, { - "epoch": 0.49, - "learning_rate": 0.0002272394110397613, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.0002660437614461356, + "loss": 0.0212, "step": 44870 }, { - "epoch": 0.49, - "learning_rate": 0.00022722319517415839, + "epoch": 0.23, + "learning_rate": 0.00026603619375312166, "loss": 0.0186, "step": 44880 }, { - "epoch": 0.49, - "learning_rate": 0.00022720697930855545, - "loss": 0.0215, + "epoch": 0.23, + "learning_rate": 0.00026602862606010764, + "loss": 0.024, "step": 44890 }, { - "epoch": 0.49, - "learning_rate": 0.00022719076344295257, - "loss": 0.0169, + "epoch": 0.23, + "learning_rate": 0.0002660210583670936, + "loss": 0.0233, "step": 44900 }, { - "epoch": 0.49, - "learning_rate": 0.00022717454757734966, - "loss": 0.0204, + "epoch": 0.23, + "learning_rate": 0.0002660134906740796, + "loss": 0.0251, "step": 44910 }, { - "epoch": 0.49, - "learning_rate": 0.00022715833171174676, - "loss": 0.0208, + "epoch": 0.23, + "learning_rate": 0.0002660059229810656, + "loss": 0.0229, "step": 44920 }, { - "epoch": 0.49, - "learning_rate": 0.00022714211584614382, - "loss": 0.0183, + "epoch": 0.23, + "learning_rate": 0.00026599835528805157, + "loss": 0.0251, "step": 44930 }, { - "epoch": 0.49, - "learning_rate": 0.00022712589998054094, - "loss": 0.0188, + "epoch": 0.23, + "learning_rate": 0.0002659907875950376, + "loss": 0.02, "step": 44940 }, { - "epoch": 0.49, - "learning_rate": 0.00022710968411493804, - "loss": 0.0155, + "epoch": 0.23, + "learning_rate": 0.0002659832199020236, + "loss": 0.0213, "step": 44950 }, { - "epoch": 0.49, - "learning_rate": 0.00022709346824933516, - "loss": 0.0175, + "epoch": 0.23, + "learning_rate": 0.00026597565220900956, + "loss": 0.0212, "step": 44960 }, { - "epoch": 0.49, - "learning_rate": 0.00022707725238373222, - "loss": 0.0177, + "epoch": 0.23, + "learning_rate": 0.00026596808451599555, + "loss": 0.0219, "step": 44970 }, { - "epoch": 0.49, - "learning_rate": 0.00022706103651812931, - "loss": 0.0166, + "epoch": 0.23, + "learning_rate": 0.00026596051682298153, + "loss": 0.026, "step": 44980 }, { - "epoch": 0.49, - "learning_rate": 0.0002270448206525264, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.0002659529491299675, + "loss": 0.0202, "step": 44990 }, { - "epoch": 0.49, - "learning_rate": 0.00022702860478692353, - "loss": 0.0161, + "epoch": 0.23, + "learning_rate": 0.00026594538143695354, + "loss": 0.024, "step": 45000 }, { - "epoch": 0.49, - "eval_cer": 0.9215347519356817, - "eval_loss": 0.013409956358373165, - "eval_runtime": 121.5929, - "eval_samples_per_second": 16.448, - "eval_steps_per_second": 4.112, + "epoch": 0.23, + "eval_cer": 0.9144896638256703, + "eval_loss": 0.016492534428834915, + "eval_runtime": 117.0086, + "eval_samples_per_second": 17.093, + "eval_steps_per_second": 4.273, "step": 45000 }, { - "epoch": 0.49, - "learning_rate": 0.0002270123889213206, - "loss": 0.0199, + "epoch": 0.23, + "learning_rate": 0.0002659378137439395, + "loss": 0.0231, "step": 45010 }, { - "epoch": 0.49, - "learning_rate": 0.00022699617305571768, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.0002659302460509255, + "loss": 0.0235, "step": 45020 }, { - "epoch": 0.49, - "learning_rate": 0.0002269799571901148, - "loss": 0.0182, + "epoch": 0.23, + "learning_rate": 0.0002659226783579115, + "loss": 0.0237, "step": 45030 }, { - "epoch": 0.49, - "learning_rate": 0.0002269637413245119, - "loss": 0.0164, + "epoch": 0.23, + "learning_rate": 0.00026591511066489747, + "loss": 0.0202, "step": 45040 }, { - "epoch": 0.49, - "learning_rate": 0.00022694752545890896, - "loss": 0.0169, + "epoch": 0.23, + "learning_rate": 0.00026590754297188345, + "loss": 0.0213, "step": 45050 }, { - "epoch": 0.49, - "learning_rate": 0.00022693130959330606, - "loss": 0.0204, + "epoch": 0.23, + "learning_rate": 0.00026589997527886943, + "loss": 0.019, "step": 45060 }, { - "epoch": 0.49, - "learning_rate": 0.00022691509372770318, - "loss": 0.0177, + "epoch": 0.23, + "learning_rate": 0.00026589240758585547, + "loss": 0.0231, "step": 45070 }, { - "epoch": 0.49, - "learning_rate": 0.00022689887786210027, - "loss": 0.0185, + "epoch": 0.23, + "learning_rate": 0.00026588483989284145, + "loss": 0.0309, "step": 45080 }, { - "epoch": 0.49, - "learning_rate": 0.00022688266199649733, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.00026587727219982743, + "loss": 0.0219, "step": 45090 }, { - "epoch": 0.49, - "learning_rate": 0.00022686644613089445, - "loss": 0.0201, + "epoch": 0.23, + "learning_rate": 0.0002658697045068134, + "loss": 0.0226, "step": 45100 }, { - "epoch": 0.49, - "learning_rate": 0.00022685023026529155, - "loss": 0.0195, + "epoch": 0.23, + "learning_rate": 0.0002658621368137994, + "loss": 0.0203, "step": 45110 }, { - "epoch": 0.49, - "learning_rate": 0.00022683401439968864, - "loss": 0.0185, + "epoch": 0.23, + "learning_rate": 0.0002658545691207854, + "loss": 0.0228, "step": 45120 }, { - "epoch": 0.49, - "learning_rate": 0.0002268177985340857, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.0002658470014277714, + "loss": 0.0229, "step": 45130 }, { - "epoch": 0.49, - "learning_rate": 0.00022680158266848282, - "loss": 0.0163, + "epoch": 0.23, + "learning_rate": 0.0002658394337347574, + "loss": 0.0204, "step": 45140 }, { - "epoch": 0.49, - "learning_rate": 0.00022678536680287992, - "loss": 0.0163, + "epoch": 0.23, + "learning_rate": 0.0002658318660417434, + "loss": 0.0221, "step": 45150 }, { - "epoch": 0.49, - "learning_rate": 0.000226769150937277, - "loss": 0.0193, + "epoch": 0.23, + "learning_rate": 0.00026582429834872936, + "loss": 0.022, "step": 45160 }, { - "epoch": 0.49, - "learning_rate": 0.0002267529350716741, - "loss": 0.0188, + "epoch": 0.23, + "learning_rate": 0.00026581673065571534, + "loss": 0.0216, "step": 45170 }, { - "epoch": 0.49, - "learning_rate": 0.0002267367192060712, - "loss": 0.0184, + "epoch": 0.23, + "learning_rate": 0.0002658091629627013, + "loss": 0.0224, "step": 45180 }, { - "epoch": 0.49, - "learning_rate": 0.0002267205033404683, - "loss": 0.0221, + "epoch": 0.23, + "learning_rate": 0.00026580159526968735, + "loss": 0.0237, "step": 45190 }, { - "epoch": 0.49, - "learning_rate": 0.0002267042874748654, - "loss": 0.0206, + "epoch": 0.23, + "learning_rate": 0.00026579402757667334, + "loss": 0.0245, "step": 45200 }, { - "epoch": 0.49, - "learning_rate": 0.00022668807160926247, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.0002657864598836593, + "loss": 0.023, "step": 45210 }, { - "epoch": 0.49, - "learning_rate": 0.00022667185574365957, - "loss": 0.0188, + "epoch": 0.23, + "learning_rate": 0.0002657788921906453, + "loss": 0.027, "step": 45220 }, { - "epoch": 0.49, - "learning_rate": 0.00022665563987805666, - "loss": 0.0233, + "epoch": 0.23, + "learning_rate": 0.0002657713244976313, + "loss": 0.0214, "step": 45230 }, { - "epoch": 0.49, - "learning_rate": 0.00022663942401245378, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.00026576375680461726, + "loss": 0.0209, "step": 45240 }, { - "epoch": 0.49, - "learning_rate": 0.00022662320814685084, - "loss": 0.021, + "epoch": 0.23, + "learning_rate": 0.00026575618911160324, + "loss": 0.0208, "step": 45250 }, { - "epoch": 0.49, - "learning_rate": 0.00022660699228124794, - "loss": 0.0203, + "epoch": 0.23, + "learning_rate": 0.0002657486214185893, + "loss": 0.0224, "step": 45260 }, { - "epoch": 0.49, - "learning_rate": 0.00022659077641564506, - "loss": 0.0207, + "epoch": 0.23, + "learning_rate": 0.00026574105372557526, + "loss": 0.024, "step": 45270 }, { - "epoch": 0.49, - "learning_rate": 0.00022657456055004215, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.00026573348603256124, + "loss": 0.0253, "step": 45280 }, { - "epoch": 0.49, - "learning_rate": 0.00022655834468443922, - "loss": 0.0168, + "epoch": 0.23, + "learning_rate": 0.0002657259183395472, + "loss": 0.0235, "step": 45290 }, { - "epoch": 0.49, - "learning_rate": 0.0002265421288188363, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.0002657183506465332, + "loss": 0.0219, "step": 45300 }, { - "epoch": 0.49, - "learning_rate": 0.00022652591295323343, - "loss": 0.0161, + "epoch": 0.23, + "learning_rate": 0.0002657107829535192, + "loss": 0.0227, "step": 45310 }, { - "epoch": 0.49, - "learning_rate": 0.00022650969708763052, - "loss": 0.0215, + "epoch": 0.23, + "learning_rate": 0.0002657032152605052, + "loss": 0.0265, "step": 45320 }, { - "epoch": 0.49, - "learning_rate": 0.00022649348122202764, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.0002656956475674912, + "loss": 0.0194, "step": 45330 }, { - "epoch": 0.49, - "learning_rate": 0.0002264772653564247, - "loss": 0.0183, + "epoch": 0.23, + "learning_rate": 0.0002656880798744772, + "loss": 0.0212, "step": 45340 }, { - "epoch": 0.49, - "learning_rate": 0.0002264610494908218, - "loss": 0.0177, + "epoch": 0.23, + "learning_rate": 0.00026568051218146317, + "loss": 0.0228, "step": 45350 }, { - "epoch": 0.49, - "learning_rate": 0.0002264448336252189, - "loss": 0.0173, + "epoch": 0.23, + "learning_rate": 0.00026567294448844915, + "loss": 0.0227, "step": 45360 }, { - "epoch": 0.49, - "learning_rate": 0.000226428617759616, - "loss": 0.0181, + "epoch": 0.23, + "learning_rate": 0.00026566537679543513, + "loss": 0.0268, "step": 45370 }, { - "epoch": 0.49, - "learning_rate": 0.00022641240189401308, - "loss": 0.0181, + "epoch": 0.23, + "learning_rate": 0.0002656578091024211, + "loss": 0.0272, "step": 45380 }, { - "epoch": 0.49, - "learning_rate": 0.00022639618602841017, - "loss": 0.0266, + "epoch": 0.23, + "learning_rate": 0.00026565024140940715, + "loss": 0.021, "step": 45390 }, { - "epoch": 0.49, - "learning_rate": 0.0002263799701628073, - "loss": 0.0196, + "epoch": 0.23, + "learning_rate": 0.00026564267371639313, + "loss": 0.0236, "step": 45400 }, { - "epoch": 0.49, - "learning_rate": 0.00022636375429720438, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.0002656351060233791, + "loss": 0.024, "step": 45410 }, { - "epoch": 0.49, - "learning_rate": 0.00022634753843160145, - "loss": 0.0191, + "epoch": 0.23, + "learning_rate": 0.0002656275383303651, + "loss": 0.022, "step": 45420 }, { - "epoch": 0.49, - "learning_rate": 0.00022633132256599854, - "loss": 0.0219, + "epoch": 0.23, + "learning_rate": 0.00026561997063735107, + "loss": 0.0226, "step": 45430 }, { - "epoch": 0.49, - "learning_rate": 0.00022631510670039566, - "loss": 0.0182, + "epoch": 0.23, + "learning_rate": 0.00026561240294433705, + "loss": 0.0266, "step": 45440 }, { - "epoch": 0.49, - "learning_rate": 0.00022629889083479275, - "loss": 0.0213, + "epoch": 0.23, + "learning_rate": 0.0002656048352513231, + "loss": 0.0282, "step": 45450 }, { - "epoch": 0.49, - "learning_rate": 0.00022628267496918982, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.00026559726755830907, + "loss": 0.0231, "step": 45460 }, { - "epoch": 0.49, - "learning_rate": 0.00022626645910358694, - "loss": 0.0191, + "epoch": 0.23, + "learning_rate": 0.00026558969986529505, + "loss": 0.0223, "step": 45470 }, { - "epoch": 0.49, - "learning_rate": 0.00022625024323798403, - "loss": 0.0182, + "epoch": 0.23, + "learning_rate": 0.00026558213217228103, + "loss": 0.0209, "step": 45480 }, { - "epoch": 0.49, - "learning_rate": 0.00022623402737238112, - "loss": 0.0199, + "epoch": 0.23, + "learning_rate": 0.000265574564479267, + "loss": 0.0216, "step": 45490 }, { - "epoch": 0.49, - "learning_rate": 0.0002262178115067782, - "loss": 0.0197, + "epoch": 0.23, + "learning_rate": 0.000265566996786253, + "loss": 0.0232, "step": 45500 }, { - "epoch": 0.49, - "learning_rate": 0.0002262015956411753, - "loss": 0.0196, + "epoch": 0.23, + "learning_rate": 0.00026555942909323903, + "loss": 0.0253, "step": 45510 }, { - "epoch": 0.49, - "learning_rate": 0.0002261853797755724, - "loss": 0.0203, + "epoch": 0.23, + "learning_rate": 0.000265551861400225, + "loss": 0.0236, "step": 45520 }, { - "epoch": 0.49, - "learning_rate": 0.0002261691639099695, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.000265544293707211, + "loss": 0.0222, "step": 45530 }, { - "epoch": 0.49, - "learning_rate": 0.0002261529480443666, - "loss": 0.017, + "epoch": 0.23, + "learning_rate": 0.000265536726014197, + "loss": 0.0205, "step": 45540 }, { - "epoch": 0.49, - "learning_rate": 0.00022613673217876368, - "loss": 0.0181, + "epoch": 0.23, + "learning_rate": 0.00026552915832118296, + "loss": 0.0195, "step": 45550 }, { - "epoch": 0.49, - "learning_rate": 0.00022612051631316077, - "loss": 0.0201, + "epoch": 0.23, + "learning_rate": 0.00026552159062816894, + "loss": 0.0212, "step": 45560 }, { - "epoch": 0.49, - "learning_rate": 0.0002261043004475579, - "loss": 0.0212, + "epoch": 0.23, + "learning_rate": 0.0002655140229351549, + "loss": 0.0227, "step": 45570 }, { - "epoch": 0.49, - "learning_rate": 0.00022608808458195496, - "loss": 0.0153, + "epoch": 0.23, + "learning_rate": 0.00026550645524214096, + "loss": 0.0243, "step": 45580 }, { - "epoch": 0.49, - "learning_rate": 0.00022607186871635205, - "loss": 0.0192, + "epoch": 0.23, + "learning_rate": 0.00026549888754912694, + "loss": 0.0207, "step": 45590 }, { - "epoch": 0.49, - "learning_rate": 0.00022605565285074915, - "loss": 0.0173, + "epoch": 0.23, + "learning_rate": 0.0002654913198561129, + "loss": 0.0222, "step": 45600 }, { - "epoch": 0.49, - "learning_rate": 0.00022603943698514626, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.0002654837521630989, + "loss": 0.0198, "step": 45610 }, { - "epoch": 0.49, - "learning_rate": 0.00022602322111954333, - "loss": 0.0215, + "epoch": 0.23, + "learning_rate": 0.0002654761844700849, + "loss": 0.0216, "step": 45620 }, { - "epoch": 0.49, - "learning_rate": 0.00022600700525394042, - "loss": 0.0235, + "epoch": 0.23, + "learning_rate": 0.00026546861677707086, + "loss": 0.0186, "step": 45630 }, { - "epoch": 0.49, - "learning_rate": 0.00022599078938833754, - "loss": 0.0201, + "epoch": 0.23, + "learning_rate": 0.0002654610490840569, + "loss": 0.0205, "step": 45640 }, { - "epoch": 0.49, - "learning_rate": 0.00022597457352273464, - "loss": 0.0183, + "epoch": 0.23, + "learning_rate": 0.0002654534813910429, + "loss": 0.0279, "step": 45650 }, { - "epoch": 0.49, - "learning_rate": 0.0002259583576571317, - "loss": 0.0194, + "epoch": 0.23, + "learning_rate": 0.00026544591369802886, + "loss": 0.0211, "step": 45660 }, { - "epoch": 0.49, - "learning_rate": 0.00022594214179152882, - "loss": 0.0201, + "epoch": 0.23, + "learning_rate": 0.00026543834600501484, + "loss": 0.019, "step": 45670 }, { - "epoch": 0.49, - "learning_rate": 0.00022592592592592591, - "loss": 0.0193, + "epoch": 0.23, + "learning_rate": 0.0002654307783120008, + "loss": 0.0247, "step": 45680 }, { - "epoch": 0.49, - "learning_rate": 0.000225909710060323, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.0002654232106189868, + "loss": 0.0187, "step": 45690 }, { - "epoch": 0.49, - "learning_rate": 0.00022589349419472007, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.00026541564292597284, + "loss": 0.0231, "step": 45700 }, { - "epoch": 0.49, - "learning_rate": 0.0002258772783291172, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.0002654080752329588, + "loss": 0.0282, "step": 45710 }, { - "epoch": 0.49, - "learning_rate": 0.00022586106246351429, - "loss": 0.0153, + "epoch": 0.23, + "learning_rate": 0.0002654005075399448, + "loss": 0.0182, "step": 45720 }, { - "epoch": 0.49, - "learning_rate": 0.00022584484659791138, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.0002653929398469308, + "loss": 0.0236, "step": 45730 }, { - "epoch": 0.49, - "learning_rate": 0.00022582863073230847, - "loss": 0.0163, + "epoch": 0.23, + "learning_rate": 0.00026538537215391677, + "loss": 0.0195, "step": 45740 }, { - "epoch": 0.49, - "learning_rate": 0.00022581241486670556, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.00026537780446090275, + "loss": 0.0247, "step": 45750 }, { - "epoch": 0.49, - "learning_rate": 0.00022579619900110266, - "loss": 0.0162, + "epoch": 0.23, + "learning_rate": 0.00026537023676788873, + "loss": 0.0208, "step": 45760 }, { - "epoch": 0.49, - "learning_rate": 0.00022577998313549978, - "loss": 0.0202, + "epoch": 0.23, + "learning_rate": 0.00026536266907487477, + "loss": 0.0218, "step": 45770 }, { - "epoch": 0.49, - "learning_rate": 0.00022576376726989684, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.00026535510138186075, + "loss": 0.0249, "step": 45780 }, { - "epoch": 0.5, - "learning_rate": 0.00022574755140429393, - "loss": 0.0211, + "epoch": 0.23, + "learning_rate": 0.00026534753368884673, + "loss": 0.0209, "step": 45790 }, { - "epoch": 0.5, - "learning_rate": 0.00022573133553869103, - "loss": 0.0197, + "epoch": 0.23, + "learning_rate": 0.0002653399659958327, + "loss": 0.023, "step": 45800 }, { - "epoch": 0.5, - "learning_rate": 0.00022571511967308815, - "loss": 0.02, + "epoch": 0.23, + "learning_rate": 0.0002653323983028187, + "loss": 0.0184, "step": 45810 }, { - "epoch": 0.5, - "learning_rate": 0.0002256989038074852, - "loss": 0.0177, + "epoch": 0.23, + "learning_rate": 0.0002653248306098047, + "loss": 0.0246, "step": 45820 }, { - "epoch": 0.5, - "learning_rate": 0.0002256826879418823, - "loss": 0.0183, + "epoch": 0.23, + "learning_rate": 0.0002653172629167907, + "loss": 0.0245, "step": 45830 }, { - "epoch": 0.5, - "learning_rate": 0.00022566647207627943, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002653096952237767, + "loss": 0.0209, "step": 45840 }, { - "epoch": 0.5, - "learning_rate": 0.00022565025621067652, - "loss": 0.0185, + "epoch": 0.23, + "learning_rate": 0.00026530212753076267, + "loss": 0.0254, "step": 45850 }, { - "epoch": 0.5, - "learning_rate": 0.00022563404034507358, - "loss": 0.0257, + "epoch": 0.23, + "learning_rate": 0.00026529455983774865, + "loss": 0.0221, "step": 45860 }, { - "epoch": 0.5, - "learning_rate": 0.00022561782447947068, - "loss": 0.0202, + "epoch": 0.23, + "learning_rate": 0.00026528699214473463, + "loss": 0.0208, "step": 45870 }, { - "epoch": 0.5, - "learning_rate": 0.0002256016086138678, - "loss": 0.0186, + "epoch": 0.23, + "learning_rate": 0.0002652794244517206, + "loss": 0.0242, "step": 45880 }, { - "epoch": 0.5, - "learning_rate": 0.0002255853927482649, - "loss": 0.0203, + "epoch": 0.23, + "learning_rate": 0.0002652718567587066, + "loss": 0.0208, "step": 45890 }, { - "epoch": 0.5, - "learning_rate": 0.00022556917688266195, - "loss": 0.0203, + "epoch": 0.23, + "learning_rate": 0.0002652642890656926, + "loss": 0.0223, "step": 45900 }, { - "epoch": 0.5, - "learning_rate": 0.00022555296101705907, - "loss": 0.0194, + "epoch": 0.23, + "learning_rate": 0.00026525672137267856, + "loss": 0.0214, "step": 45910 }, { - "epoch": 0.5, - "learning_rate": 0.00022553674515145617, - "loss": 0.0217, + "epoch": 0.23, + "learning_rate": 0.00026524915367966454, + "loss": 0.0258, "step": 45920 }, { - "epoch": 0.5, - "learning_rate": 0.00022552052928585326, - "loss": 0.0186, + "epoch": 0.23, + "learning_rate": 0.0002652415859866506, + "loss": 0.0216, "step": 45930 }, { - "epoch": 0.5, - "learning_rate": 0.00022550431342025033, - "loss": 0.0192, + "epoch": 0.23, + "learning_rate": 0.00026523401829363656, + "loss": 0.0246, "step": 45940 }, { - "epoch": 0.5, - "learning_rate": 0.00022548809755464745, - "loss": 0.0229, + "epoch": 0.23, + "learning_rate": 0.00026522645060062254, + "loss": 0.0233, "step": 45950 }, { - "epoch": 0.5, - "learning_rate": 0.00022547188168904454, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.0002652188829076085, + "loss": 0.0182, "step": 45960 }, { - "epoch": 0.5, - "learning_rate": 0.00022545566582344166, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002652113152145945, + "loss": 0.0225, "step": 45970 }, { - "epoch": 0.5, - "learning_rate": 0.00022543944995783872, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.0002652037475215805, + "loss": 0.0192, "step": 45980 }, { - "epoch": 0.5, - "learning_rate": 0.00022542323409223582, - "loss": 0.021, + "epoch": 0.23, + "learning_rate": 0.00026519617982856647, + "loss": 0.0246, "step": 45990 }, { - "epoch": 0.5, - "learning_rate": 0.0002254070182266329, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.0002651886121355525, + "loss": 0.0228, "step": 46000 }, { - "epoch": 0.5, - "eval_cer": 0.9215503867888964, - "eval_loss": 0.01366225816309452, - "eval_runtime": 121.4419, - "eval_samples_per_second": 16.469, - "eval_steps_per_second": 4.117, + "epoch": 0.23, + "eval_cer": 0.9144877230334195, + "eval_loss": 0.016304470598697662, + "eval_runtime": 117.0909, + "eval_samples_per_second": 17.081, + "eval_steps_per_second": 4.27, "step": 46000 }, { - "epoch": 0.5, - "learning_rate": 0.00022539080236103003, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.0002651810444425385, + "loss": 0.0214, "step": 46010 }, { - "epoch": 0.5, - "learning_rate": 0.0002253745864954271, - "loss": 0.0161, + "epoch": 0.23, + "learning_rate": 0.00026517347674952447, + "loss": 0.0216, "step": 46020 }, { - "epoch": 0.5, - "learning_rate": 0.0002253583706298242, - "loss": 0.0206, + "epoch": 0.23, + "learning_rate": 0.00026516590905651045, + "loss": 0.0235, "step": 46030 }, { - "epoch": 0.5, - "learning_rate": 0.0002253421547642213, - "loss": 0.0199, + "epoch": 0.23, + "learning_rate": 0.00026515834136349643, + "loss": 0.0227, "step": 46040 }, { - "epoch": 0.5, - "learning_rate": 0.0002253259388986184, - "loss": 0.0169, + "epoch": 0.23, + "learning_rate": 0.0002651507736704824, + "loss": 0.0207, "step": 46050 }, { - "epoch": 0.5, - "learning_rate": 0.0002253097230330155, - "loss": 0.0192, + "epoch": 0.23, + "learning_rate": 0.00026514320597746845, + "loss": 0.0197, "step": 46060 }, { - "epoch": 0.5, - "learning_rate": 0.00022529350716741256, - "loss": 0.0192, + "epoch": 0.23, + "learning_rate": 0.0002651356382844544, + "loss": 0.0191, "step": 46070 }, { - "epoch": 0.5, - "learning_rate": 0.00022527729130180968, - "loss": 0.019, + "epoch": 0.23, + "learning_rate": 0.0002651280705914404, + "loss": 0.0204, "step": 46080 }, { - "epoch": 0.5, - "learning_rate": 0.00022526107543620677, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.0002651205028984264, + "loss": 0.0198, "step": 46090 }, { - "epoch": 0.5, - "learning_rate": 0.00022524485957060386, - "loss": 0.0202, + "epoch": 0.23, + "learning_rate": 0.00026511293520541237, + "loss": 0.0197, "step": 46100 }, { - "epoch": 0.5, - "learning_rate": 0.00022522864370500096, - "loss": 0.0198, + "epoch": 0.23, + "learning_rate": 0.00026510536751239835, + "loss": 0.0199, "step": 46110 }, { - "epoch": 0.5, - "learning_rate": 0.00022521242783939805, - "loss": 0.0194, + "epoch": 0.23, + "learning_rate": 0.00026509779981938433, + "loss": 0.023, "step": 46120 }, { - "epoch": 0.5, - "learning_rate": 0.00022519621197379514, - "loss": 0.0219, + "epoch": 0.23, + "learning_rate": 0.00026509023212637037, + "loss": 0.0263, "step": 46130 }, { - "epoch": 0.5, - "learning_rate": 0.00022517999610819226, - "loss": 0.0175, + "epoch": 0.23, + "learning_rate": 0.00026508266443335635, + "loss": 0.0235, "step": 46140 }, { - "epoch": 0.5, - "learning_rate": 0.00022516378024258933, - "loss": 0.0191, + "epoch": 0.23, + "learning_rate": 0.00026507509674034233, + "loss": 0.026, "step": 46150 }, { - "epoch": 0.5, - "learning_rate": 0.00022514756437698642, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002650675290473283, + "loss": 0.0229, "step": 46160 }, { - "epoch": 0.5, - "learning_rate": 0.0002251313485113835, - "loss": 0.015, + "epoch": 0.23, + "learning_rate": 0.0002650599613543143, + "loss": 0.0249, "step": 46170 }, { - "epoch": 0.5, - "learning_rate": 0.00022511513264578063, - "loss": 0.0188, + "epoch": 0.23, + "learning_rate": 0.0002650523936613003, + "loss": 0.0269, "step": 46180 }, { - "epoch": 0.5, - "learning_rate": 0.0002250989167801777, - "loss": 0.0182, + "epoch": 0.23, + "learning_rate": 0.0002650448259682863, + "loss": 0.0199, "step": 46190 }, { - "epoch": 0.5, - "learning_rate": 0.0002250827009145748, - "loss": 0.0201, + "epoch": 0.23, + "learning_rate": 0.0002650372582752723, + "loss": 0.0235, "step": 46200 }, { - "epoch": 0.5, - "learning_rate": 0.0002250664850489719, - "loss": 0.0209, + "epoch": 0.23, + "learning_rate": 0.0002650296905822583, + "loss": 0.0305, "step": 46210 }, { - "epoch": 0.5, - "learning_rate": 0.000225050269183369, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.00026502212288924426, + "loss": 0.0246, "step": 46220 }, { - "epoch": 0.5, - "learning_rate": 0.00022503405331776607, - "loss": 0.017, + "epoch": 0.23, + "learning_rate": 0.00026501455519623024, + "loss": 0.0207, "step": 46230 }, { - "epoch": 0.5, - "learning_rate": 0.00022501783745216316, - "loss": 0.0195, + "epoch": 0.23, + "learning_rate": 0.0002650069875032162, + "loss": 0.0205, "step": 46240 }, { - "epoch": 0.5, - "learning_rate": 0.00022500162158656028, - "loss": 0.0169, + "epoch": 0.23, + "learning_rate": 0.00026499941981020226, + "loss": 0.0233, "step": 46250 }, { - "epoch": 0.5, - "learning_rate": 0.00022498540572095737, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.00026499185211718824, + "loss": 0.0228, "step": 46260 }, { - "epoch": 0.5, - "learning_rate": 0.00022496918985535444, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.0002649842844241742, + "loss": 0.0191, "step": 46270 }, { - "epoch": 0.5, - "learning_rate": 0.00022495297398975156, - "loss": 0.0162, + "epoch": 0.23, + "learning_rate": 0.0002649767167311602, + "loss": 0.0205, "step": 46280 }, { - "epoch": 0.5, - "learning_rate": 0.00022493675812414865, - "loss": 0.0168, + "epoch": 0.23, + "learning_rate": 0.0002649691490381462, + "loss": 0.0187, "step": 46290 }, { - "epoch": 0.5, - "learning_rate": 0.00022492054225854575, - "loss": 0.0219, + "epoch": 0.23, + "learning_rate": 0.00026496158134513216, + "loss": 0.0212, "step": 46300 }, { - "epoch": 0.5, - "learning_rate": 0.0002249043263929428, - "loss": 0.019, + "epoch": 0.23, + "learning_rate": 0.00026495401365211814, + "loss": 0.0185, "step": 46310 }, { - "epoch": 0.5, - "learning_rate": 0.00022488811052733993, - "loss": 0.0209, + "epoch": 0.23, + "learning_rate": 0.0002649464459591042, + "loss": 0.0228, "step": 46320 }, { - "epoch": 0.5, - "learning_rate": 0.00022487189466173702, - "loss": 0.0198, + "epoch": 0.23, + "learning_rate": 0.00026493887826609016, + "loss": 0.0214, "step": 46330 }, { - "epoch": 0.5, - "learning_rate": 0.00022485567879613414, - "loss": 0.0229, + "epoch": 0.23, + "learning_rate": 0.00026493131057307614, + "loss": 0.0189, "step": 46340 }, { - "epoch": 0.5, - "learning_rate": 0.0002248394629305312, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.0002649237428800621, + "loss": 0.0188, "step": 46350 }, { - "epoch": 0.5, - "learning_rate": 0.0002248232470649283, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002649161751870481, + "loss": 0.0262, "step": 46360 }, { - "epoch": 0.5, - "learning_rate": 0.0002248070311993254, - "loss": 0.0219, + "epoch": 0.23, + "learning_rate": 0.0002649086074940341, + "loss": 0.0203, "step": 46370 }, { - "epoch": 0.5, - "learning_rate": 0.00022479081533372251, - "loss": 0.0213, + "epoch": 0.23, + "learning_rate": 0.0002649010398010201, + "loss": 0.0235, "step": 46380 }, { - "epoch": 0.5, - "learning_rate": 0.00022477459946811958, - "loss": 0.0199, + "epoch": 0.23, + "learning_rate": 0.0002648934721080061, + "loss": 0.0184, "step": 46390 }, { - "epoch": 0.5, - "learning_rate": 0.00022475838360251667, - "loss": 0.0202, + "epoch": 0.23, + "learning_rate": 0.0002648859044149921, + "loss": 0.0214, "step": 46400 }, { - "epoch": 0.5, - "learning_rate": 0.0002247421677369138, - "loss": 0.0328, + "epoch": 0.23, + "learning_rate": 0.00026487833672197807, + "loss": 0.0194, "step": 46410 }, { - "epoch": 0.5, - "learning_rate": 0.00022472595187131089, - "loss": 0.0231, + "epoch": 0.23, + "learning_rate": 0.00026487076902896405, + "loss": 0.0244, "step": 46420 }, { - "epoch": 0.5, - "learning_rate": 0.00022470973600570795, - "loss": 0.0206, + "epoch": 0.23, + "learning_rate": 0.00026486320133595003, + "loss": 0.022, "step": 46430 }, { - "epoch": 0.5, - "learning_rate": 0.00022469352014010504, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.00026485563364293607, + "loss": 0.0233, "step": 46440 }, { - "epoch": 0.5, - "learning_rate": 0.00022467730427450216, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.00026484806594992205, + "loss": 0.0217, "step": 46450 }, { - "epoch": 0.5, - "learning_rate": 0.00022466108840889926, - "loss": 0.014, + "epoch": 0.23, + "learning_rate": 0.00026484049825690803, + "loss": 0.0219, "step": 46460 }, { - "epoch": 0.5, - "learning_rate": 0.00022464487254329632, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.000264832930563894, + "loss": 0.0162, "step": 46470 }, { - "epoch": 0.5, - "learning_rate": 0.00022462865667769344, - "loss": 0.0186, + "epoch": 0.23, + "learning_rate": 0.00026482536287088, + "loss": 0.0231, "step": 46480 }, { - "epoch": 0.5, - "learning_rate": 0.00022461244081209053, - "loss": 0.0181, + "epoch": 0.23, + "learning_rate": 0.00026481779517786597, + "loss": 0.0209, "step": 46490 }, { - "epoch": 0.5, - "learning_rate": 0.00022459622494648763, - "loss": 0.019, + "epoch": 0.23, + "learning_rate": 0.00026481022748485195, + "loss": 0.0207, "step": 46500 }, { - "epoch": 0.5, - "learning_rate": 0.0002245800090808847, - "loss": 0.019, + "epoch": 0.23, + "learning_rate": 0.000264802659791838, + "loss": 0.0205, "step": 46510 }, { - "epoch": 0.5, - "learning_rate": 0.0002245637932152818, - "loss": 0.0232, + "epoch": 0.23, + "learning_rate": 0.00026479509209882397, + "loss": 0.022, "step": 46520 }, { - "epoch": 0.5, - "learning_rate": 0.0002245475773496789, - "loss": 0.0207, + "epoch": 0.23, + "learning_rate": 0.00026478752440580995, + "loss": 0.0227, "step": 46530 }, { - "epoch": 0.5, - "learning_rate": 0.000224531361484076, - "loss": 0.0199, + "epoch": 0.23, + "learning_rate": 0.00026477995671279593, + "loss": 0.0235, "step": 46540 }, { - "epoch": 0.5, - "learning_rate": 0.0002245151456184731, - "loss": 0.0177, + "epoch": 0.23, + "learning_rate": 0.0002647723890197819, + "loss": 0.0246, "step": 46550 }, { - "epoch": 0.5, - "learning_rate": 0.00022449892975287018, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.0002647648213267679, + "loss": 0.0276, "step": 46560 }, { - "epoch": 0.5, - "learning_rate": 0.00022448271388726728, - "loss": 0.0259, + "epoch": 0.23, + "learning_rate": 0.00026475725363375393, + "loss": 0.022, "step": 46570 }, { - "epoch": 0.5, - "learning_rate": 0.0002244664980216644, - "loss": 0.0185, + "epoch": 0.24, + "learning_rate": 0.0002647496859407399, + "loss": 0.0196, "step": 46580 }, { - "epoch": 0.5, - "learning_rate": 0.00022445028215606146, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.0002647421182477259, + "loss": 0.0196, "step": 46590 }, { - "epoch": 0.5, - "learning_rate": 0.00022443406629045855, - "loss": 0.0315, + "epoch": 0.24, + "learning_rate": 0.0002647345505547119, + "loss": 0.0203, "step": 46600 }, { - "epoch": 0.5, - "learning_rate": 0.00022441785042485565, - "loss": 0.0219, + "epoch": 0.24, + "learning_rate": 0.00026472698286169786, + "loss": 0.0207, "step": 46610 }, { - "epoch": 0.5, - "learning_rate": 0.00022440163455925277, - "loss": 0.0223, + "epoch": 0.24, + "learning_rate": 0.00026471941516868384, + "loss": 0.0217, "step": 46620 }, { - "epoch": 0.5, - "learning_rate": 0.00022438541869364983, - "loss": 0.0226, + "epoch": 0.24, + "learning_rate": 0.0002647118474756698, + "loss": 0.0185, "step": 46630 }, { - "epoch": 0.5, - "learning_rate": 0.00022436920282804693, - "loss": 0.0226, + "epoch": 0.24, + "learning_rate": 0.00026470427978265586, + "loss": 0.0215, "step": 46640 }, { - "epoch": 0.5, - "learning_rate": 0.00022435298696244405, - "loss": 0.0219, + "epoch": 0.24, + "learning_rate": 0.00026469671208964184, + "loss": 0.0194, "step": 46650 }, { - "epoch": 0.5, - "learning_rate": 0.00022433677109684114, - "loss": 0.0183, + "epoch": 0.24, + "learning_rate": 0.0002646891443966278, + "loss": 0.0238, "step": 46660 }, { - "epoch": 0.5, - "learning_rate": 0.0002243205552312382, - "loss": 0.0176, + "epoch": 0.24, + "learning_rate": 0.0002646815767036138, + "loss": 0.0205, "step": 46670 }, { - "epoch": 0.5, - "learning_rate": 0.00022430433936563532, - "loss": 0.021, + "epoch": 0.24, + "learning_rate": 0.0002646740090105998, + "loss": 0.0214, "step": 46680 }, { - "epoch": 0.5, - "learning_rate": 0.00022428812350003242, - "loss": 0.0206, + "epoch": 0.24, + "learning_rate": 0.00026466644131758576, + "loss": 0.0189, "step": 46690 }, { - "epoch": 0.5, - "learning_rate": 0.0002242719076344295, - "loss": 0.016, + "epoch": 0.24, + "learning_rate": 0.0002646588736245718, + "loss": 0.0191, "step": 46700 }, { - "epoch": 0.5, - "learning_rate": 0.00022425569176882658, - "loss": 0.0217, + "epoch": 0.24, + "learning_rate": 0.0002646513059315578, + "loss": 0.0238, "step": 46710 }, { - "epoch": 0.51, - "learning_rate": 0.0002242394759032237, - "loss": 0.0183, + "epoch": 0.24, + "learning_rate": 0.00026464373823854376, + "loss": 0.0209, "step": 46720 }, { - "epoch": 0.51, - "learning_rate": 0.0002242232600376208, - "loss": 0.0177, + "epoch": 0.24, + "learning_rate": 0.00026463617054552974, + "loss": 0.023, "step": 46730 }, { - "epoch": 0.51, - "learning_rate": 0.00022420704417201788, - "loss": 0.0179, + "epoch": 0.24, + "learning_rate": 0.0002646286028525157, + "loss": 0.0222, "step": 46740 }, { - "epoch": 0.51, - "learning_rate": 0.00022419082830641497, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.0002646210351595017, + "loss": 0.0259, "step": 46750 }, { - "epoch": 0.51, - "learning_rate": 0.00022417461244081207, - "loss": 0.0158, + "epoch": 0.24, + "learning_rate": 0.00026461346746648774, + "loss": 0.0206, "step": 46760 }, { - "epoch": 0.51, - "learning_rate": 0.00022415839657520916, - "loss": 0.0208, + "epoch": 0.24, + "learning_rate": 0.0002646058997734737, + "loss": 0.0267, "step": 46770 }, { - "epoch": 0.51, - "learning_rate": 0.00022414218070960628, - "loss": 0.0206, + "epoch": 0.24, + "learning_rate": 0.0002645983320804597, + "loss": 0.0238, "step": 46780 }, { - "epoch": 0.51, - "learning_rate": 0.00022412596484400337, - "loss": 0.0248, + "epoch": 0.24, + "learning_rate": 0.0002645907643874457, + "loss": 0.026, "step": 46790 }, { - "epoch": 0.51, - "learning_rate": 0.00022410974897840044, - "loss": 0.0181, + "epoch": 0.24, + "learning_rate": 0.00026458319669443167, + "loss": 0.023, "step": 46800 }, { - "epoch": 0.51, - "learning_rate": 0.00022409353311279753, - "loss": 0.0205, + "epoch": 0.24, + "learning_rate": 0.00026457562900141765, + "loss": 0.0181, "step": 46810 }, { - "epoch": 0.51, - "learning_rate": 0.00022407731724719465, - "loss": 0.0183, + "epoch": 0.24, + "learning_rate": 0.00026456806130840363, + "loss": 0.023, "step": 46820 }, { - "epoch": 0.51, - "learning_rate": 0.00022406110138159174, - "loss": 0.02, + "epoch": 0.24, + "learning_rate": 0.00026456049361538967, + "loss": 0.0237, "step": 46830 }, { - "epoch": 0.51, - "learning_rate": 0.0002240448855159888, - "loss": 0.0215, + "epoch": 0.24, + "learning_rate": 0.00026455292592237565, + "loss": 0.0209, "step": 46840 }, { - "epoch": 0.51, - "learning_rate": 0.00022402866965038593, - "loss": 0.0177, + "epoch": 0.24, + "learning_rate": 0.00026454535822936163, + "loss": 0.0234, "step": 46850 }, { - "epoch": 0.51, - "learning_rate": 0.00022401245378478302, - "loss": 0.0167, + "epoch": 0.24, + "learning_rate": 0.0002645377905363476, + "loss": 0.0178, "step": 46860 }, { - "epoch": 0.51, - "learning_rate": 0.0002239962379191801, - "loss": 0.016, + "epoch": 0.24, + "learning_rate": 0.0002645302228433336, + "loss": 0.0219, "step": 46870 }, { - "epoch": 0.51, - "learning_rate": 0.00022398002205357718, - "loss": 0.0157, + "epoch": 0.24, + "learning_rate": 0.0002645226551503196, + "loss": 0.0225, "step": 46880 }, { - "epoch": 0.51, - "learning_rate": 0.0002239638061879743, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.0002645150874573056, + "loss": 0.0207, "step": 46890 }, { - "epoch": 0.51, - "learning_rate": 0.0002239475903223714, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.0002645075197642916, + "loss": 0.0211, "step": 46900 }, { - "epoch": 0.51, - "learning_rate": 0.00022393137445676848, - "loss": 0.0183, + "epoch": 0.24, + "learning_rate": 0.00026449995207127757, + "loss": 0.0274, "step": 46910 }, { - "epoch": 0.51, - "learning_rate": 0.00022391515859116558, - "loss": 0.0173, + "epoch": 0.24, + "learning_rate": 0.00026449238437826355, + "loss": 0.0229, "step": 46920 }, { - "epoch": 0.51, - "learning_rate": 0.00022389894272556267, - "loss": 0.0195, + "epoch": 0.24, + "learning_rate": 0.00026448481668524954, + "loss": 0.0243, "step": 46930 }, { - "epoch": 0.51, - "learning_rate": 0.00022388272685995976, - "loss": 0.0193, + "epoch": 0.24, + "learning_rate": 0.0002644772489922355, + "loss": 0.0228, "step": 46940 }, { - "epoch": 0.51, - "learning_rate": 0.00022386651099435688, - "loss": 0.0201, + "epoch": 0.24, + "learning_rate": 0.00026446968129922155, + "loss": 0.0171, "step": 46950 }, { - "epoch": 0.51, - "learning_rate": 0.00022385029512875395, - "loss": 0.0161, + "epoch": 0.24, + "learning_rate": 0.00026446211360620753, + "loss": 0.0219, "step": 46960 }, { - "epoch": 0.51, - "learning_rate": 0.00022383407926315104, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.0002644545459131935, + "loss": 0.0197, "step": 46970 }, { - "epoch": 0.51, - "learning_rate": 0.00022381786339754816, - "loss": 0.0193, + "epoch": 0.24, + "learning_rate": 0.0002644469782201795, + "loss": 0.0285, "step": 46980 }, { - "epoch": 0.51, - "learning_rate": 0.00022380164753194525, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.0002644394105271655, + "loss": 0.0208, "step": 46990 }, { - "epoch": 0.51, - "learning_rate": 0.00022378543166634232, - "loss": 0.0199, + "epoch": 0.24, + "learning_rate": 0.00026443184283415146, + "loss": 0.0222, "step": 47000 }, { - "epoch": 0.51, - "eval_cer": 0.9215434379652454, - "eval_loss": 0.013291054405272007, - "eval_runtime": 121.5822, - "eval_samples_per_second": 16.45, - "eval_steps_per_second": 4.112, + "epoch": 0.24, + "eval_cer": 0.9145042197675514, + "eval_loss": 0.01637718454003334, + "eval_runtime": 117.1859, + "eval_samples_per_second": 17.067, + "eval_steps_per_second": 4.267, "step": 47000 }, { - "epoch": 0.51, - "learning_rate": 0.0002237692158007394, - "loss": 0.02, + "epoch": 0.24, + "learning_rate": 0.00026442427514113744, + "loss": 0.0188, "step": 47010 }, { - "epoch": 0.51, - "learning_rate": 0.00022375299993513653, - "loss": 0.0203, + "epoch": 0.24, + "learning_rate": 0.0002644167074481235, + "loss": 0.0246, "step": 47020 }, { - "epoch": 0.51, - "learning_rate": 0.00022373678406953362, - "loss": 0.0192, + "epoch": 0.24, + "learning_rate": 0.00026440913975510946, + "loss": 0.0251, "step": 47030 }, { - "epoch": 0.51, - "learning_rate": 0.0002237205682039307, - "loss": 0.0214, + "epoch": 0.24, + "learning_rate": 0.00026440157206209544, + "loss": 0.0211, "step": 47040 }, { - "epoch": 0.51, - "learning_rate": 0.0002237043523383278, - "loss": 0.0159, + "epoch": 0.24, + "learning_rate": 0.0002643940043690814, + "loss": 0.0213, "step": 47050 }, { - "epoch": 0.51, - "learning_rate": 0.0002236881364727249, - "loss": 0.0195, + "epoch": 0.24, + "learning_rate": 0.0002643864366760674, + "loss": 0.0222, "step": 47060 }, { - "epoch": 0.51, - "learning_rate": 0.000223671920607122, - "loss": 0.0229, + "epoch": 0.24, + "learning_rate": 0.0002643788689830534, + "loss": 0.0188, "step": 47070 }, { - "epoch": 0.51, - "learning_rate": 0.00022365570474151906, - "loss": 0.0148, + "epoch": 0.24, + "learning_rate": 0.0002643713012900394, + "loss": 0.0238, "step": 47080 }, { - "epoch": 0.51, - "learning_rate": 0.00022363948887591618, - "loss": 0.0208, + "epoch": 0.24, + "learning_rate": 0.0002643637335970254, + "loss": 0.0224, "step": 47090 }, { - "epoch": 0.51, - "learning_rate": 0.00022362327301031327, - "loss": 0.0177, + "epoch": 0.24, + "learning_rate": 0.0002643561659040114, + "loss": 0.0182, "step": 47100 }, { - "epoch": 0.51, - "learning_rate": 0.00022360705714471037, - "loss": 0.0182, + "epoch": 0.24, + "learning_rate": 0.00026434859821099736, + "loss": 0.0235, "step": 47110 }, { - "epoch": 0.51, - "learning_rate": 0.00022359084127910746, - "loss": 0.0186, + "epoch": 0.24, + "learning_rate": 0.00026434103051798335, + "loss": 0.0206, "step": 47120 }, { - "epoch": 0.51, - "learning_rate": 0.00022357462541350455, - "loss": 0.017, + "epoch": 0.24, + "learning_rate": 0.0002643334628249693, + "loss": 0.0196, "step": 47130 }, { - "epoch": 0.51, - "learning_rate": 0.00022355840954790164, - "loss": 0.0192, + "epoch": 0.24, + "learning_rate": 0.0002643258951319553, + "loss": 0.0266, "step": 47140 }, { - "epoch": 0.51, - "learning_rate": 0.00022354219368229876, - "loss": 0.0179, + "epoch": 0.24, + "learning_rate": 0.0002643183274389413, + "loss": 0.0225, "step": 47150 }, { - "epoch": 0.51, - "learning_rate": 0.00022352597781669583, - "loss": 0.0178, + "epoch": 0.24, + "learning_rate": 0.00026431075974592727, + "loss": 0.0224, "step": 47160 }, { - "epoch": 0.51, - "learning_rate": 0.00022350976195109292, - "loss": 0.021, + "epoch": 0.24, + "learning_rate": 0.00026430319205291325, + "loss": 0.0199, "step": 47170 }, { - "epoch": 0.51, - "learning_rate": 0.00022349354608549002, - "loss": 0.02, + "epoch": 0.24, + "learning_rate": 0.00026429562435989923, + "loss": 0.0187, "step": 47180 }, { - "epoch": 0.51, - "learning_rate": 0.00022347733021988714, - "loss": 0.0223, + "epoch": 0.24, + "learning_rate": 0.00026428805666688527, + "loss": 0.0233, "step": 47190 }, { - "epoch": 0.51, - "learning_rate": 0.0002234611143542842, - "loss": 0.0199, + "epoch": 0.24, + "learning_rate": 0.00026428048897387125, + "loss": 0.0248, "step": 47200 }, { - "epoch": 0.51, - "learning_rate": 0.0002234448984886813, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.00026427292128085723, + "loss": 0.0197, "step": 47210 }, { - "epoch": 0.51, - "learning_rate": 0.0002234286826230784, - "loss": 0.0197, + "epoch": 0.24, + "learning_rate": 0.0002642653535878432, + "loss": 0.027, "step": 47220 }, { - "epoch": 0.51, - "learning_rate": 0.0002234124667574755, - "loss": 0.0179, + "epoch": 0.24, + "learning_rate": 0.0002642577858948292, + "loss": 0.0225, "step": 47230 }, { - "epoch": 0.51, - "learning_rate": 0.00022339625089187257, - "loss": 0.0216, + "epoch": 0.24, + "learning_rate": 0.0002642502182018152, + "loss": 0.0343, "step": 47240 }, { - "epoch": 0.51, - "learning_rate": 0.00022338003502626966, - "loss": 0.02, + "epoch": 0.24, + "learning_rate": 0.0002642426505088012, + "loss": 0.0245, "step": 47250 }, { - "epoch": 0.51, - "learning_rate": 0.00022336381916066678, - "loss": 0.0207, + "epoch": 0.24, + "learning_rate": 0.0002642350828157872, + "loss": 0.0214, "step": 47260 }, { - "epoch": 0.51, - "learning_rate": 0.00022334760329506388, - "loss": 0.0184, + "epoch": 0.24, + "learning_rate": 0.0002642275151227732, + "loss": 0.0239, "step": 47270 }, { - "epoch": 0.51, - "learning_rate": 0.00022333138742946094, - "loss": 0.0201, + "epoch": 0.24, + "learning_rate": 0.00026421994742975916, + "loss": 0.0241, "step": 47280 }, { - "epoch": 0.51, - "learning_rate": 0.00022331517156385806, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.00026421237973674514, + "loss": 0.0199, "step": 47290 }, { - "epoch": 0.51, - "learning_rate": 0.00022329895569825516, - "loss": 0.0194, + "epoch": 0.24, + "learning_rate": 0.0002642048120437311, + "loss": 0.0254, "step": 47300 }, { - "epoch": 0.51, - "learning_rate": 0.00022328273983265225, - "loss": 0.0154, + "epoch": 0.24, + "learning_rate": 0.00026419724435071716, + "loss": 0.0212, "step": 47310 }, { - "epoch": 0.51, - "learning_rate": 0.00022326652396704931, - "loss": 0.0196, + "epoch": 0.24, + "learning_rate": 0.00026418967665770314, + "loss": 0.019, "step": 47320 }, { - "epoch": 0.51, - "learning_rate": 0.00022325030810144643, - "loss": 0.0167, + "epoch": 0.24, + "learning_rate": 0.0002641821089646891, + "loss": 0.0199, "step": 47330 }, { - "epoch": 0.51, - "learning_rate": 0.00022323409223584353, - "loss": 0.019, + "epoch": 0.24, + "learning_rate": 0.0002641745412716751, + "loss": 0.0228, "step": 47340 }, { - "epoch": 0.51, - "learning_rate": 0.00022321787637024065, + "epoch": 0.24, + "learning_rate": 0.0002641669735786611, "loss": 0.0224, "step": 47350 }, { - "epoch": 0.51, - "learning_rate": 0.0002232016605046377, - "loss": 0.0185, + "epoch": 0.24, + "learning_rate": 0.00026415940588564706, + "loss": 0.0274, "step": 47360 }, { - "epoch": 0.51, - "learning_rate": 0.0002231854446390348, - "loss": 0.0181, + "epoch": 0.24, + "learning_rate": 0.00026415183819263304, + "loss": 0.0212, "step": 47370 }, { - "epoch": 0.51, - "learning_rate": 0.0002231692287734319, - "loss": 0.0184, + "epoch": 0.24, + "learning_rate": 0.0002641442704996191, + "loss": 0.0212, "step": 47380 }, { - "epoch": 0.51, - "learning_rate": 0.00022315301290782902, - "loss": 0.0169, + "epoch": 0.24, + "learning_rate": 0.00026413670280660506, + "loss": 0.0193, "step": 47390 }, { - "epoch": 0.51, - "learning_rate": 0.00022313679704222608, - "loss": 0.0173, + "epoch": 0.24, + "learning_rate": 0.00026412913511359104, + "loss": 0.0199, "step": 47400 }, { - "epoch": 0.51, - "learning_rate": 0.00022312058117662318, - "loss": 0.0203, + "epoch": 0.24, + "learning_rate": 0.000264121567420577, + "loss": 0.0196, "step": 47410 }, { - "epoch": 0.51, - "learning_rate": 0.0002231043653110203, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.000264113999727563, + "loss": 0.024, "step": 47420 }, { - "epoch": 0.51, - "learning_rate": 0.0002230881494454174, - "loss": 0.0185, + "epoch": 0.24, + "learning_rate": 0.000264106432034549, + "loss": 0.0214, "step": 47430 }, { - "epoch": 0.51, - "learning_rate": 0.00022307193357981445, - "loss": 0.0195, + "epoch": 0.24, + "learning_rate": 0.000264098864341535, + "loss": 0.0207, "step": 47440 }, { - "epoch": 0.51, - "learning_rate": 0.00022305571771421155, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.000264091296648521, + "loss": 0.0191, "step": 47450 }, { - "epoch": 0.51, - "learning_rate": 0.00022303950184860867, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.000264083728955507, + "loss": 0.0182, "step": 47460 }, { - "epoch": 0.51, - "learning_rate": 0.00022302328598300576, - "loss": 0.0154, + "epoch": 0.24, + "learning_rate": 0.00026407616126249297, + "loss": 0.0216, "step": 47470 }, { - "epoch": 0.51, - "learning_rate": 0.00022300707011740285, - "loss": 0.0207, + "epoch": 0.24, + "learning_rate": 0.00026406859356947895, + "loss": 0.02, "step": 47480 }, { - "epoch": 0.51, - "learning_rate": 0.00022299085425179994, - "loss": 0.0223, + "epoch": 0.24, + "learning_rate": 0.00026406102587646493, + "loss": 0.0159, "step": 47490 }, { - "epoch": 0.51, - "learning_rate": 0.00022297463838619704, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.00026405345818345097, + "loss": 0.0212, "step": 47500 }, { - "epoch": 0.51, - "learning_rate": 0.00022295842252059413, - "loss": 0.0192, + "epoch": 0.24, + "learning_rate": 0.00026404589049043695, + "loss": 0.0226, "step": 47510 }, { - "epoch": 0.51, - "learning_rate": 0.00022294220665499125, + "epoch": 0.24, + "learning_rate": 0.00026403832279742293, "loss": 0.0201, "step": 47520 }, { - "epoch": 0.51, - "learning_rate": 0.00022292599078938832, - "loss": 0.0191, + "epoch": 0.24, + "learning_rate": 0.0002640307551044089, + "loss": 0.0164, "step": 47530 }, { - "epoch": 0.51, - "learning_rate": 0.0002229097749237854, - "loss": 0.0179, + "epoch": 0.24, + "learning_rate": 0.0002640231874113949, + "loss": 0.0229, "step": 47540 }, { - "epoch": 0.51, - "learning_rate": 0.0002228935590581825, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.00026401561971838087, + "loss": 0.0247, "step": 47550 }, { - "epoch": 0.51, - "learning_rate": 0.00022287734319257962, - "loss": 0.0181, + "epoch": 0.24, + "learning_rate": 0.00026400805202536685, + "loss": 0.0194, "step": 47560 }, { - "epoch": 0.51, - "learning_rate": 0.0002228611273269767, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.0002640004843323529, + "loss": 0.0219, "step": 47570 }, { - "epoch": 0.51, - "learning_rate": 0.00022284491146137378, - "loss": 0.0204, + "epoch": 0.24, + "learning_rate": 0.00026399291663933887, + "loss": 0.0188, "step": 47580 }, { - "epoch": 0.51, - "learning_rate": 0.0002228286955957709, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.00026398534894632485, + "loss": 0.0244, "step": 47590 }, { - "epoch": 0.51, - "learning_rate": 0.000222812479730168, - "loss": 0.0154, + "epoch": 0.24, + "learning_rate": 0.00026397778125331083, + "loss": 0.0197, "step": 47600 }, { - "epoch": 0.51, - "learning_rate": 0.00022279626386456506, - "loss": 0.0195, + "epoch": 0.24, + "learning_rate": 0.0002639702135602968, + "loss": 0.0221, "step": 47610 }, { - "epoch": 0.51, - "learning_rate": 0.00022278004799896215, - "loss": 0.0177, + "epoch": 0.24, + "learning_rate": 0.0002639626458672828, + "loss": 0.0216, "step": 47620 }, { - "epoch": 0.51, - "learning_rate": 0.00022276383213335927, - "loss": 0.0163, + "epoch": 0.24, + "learning_rate": 0.00026395507817426883, + "loss": 0.0227, "step": 47630 }, { - "epoch": 0.52, - "learning_rate": 0.00022274761626775636, - "loss": 0.0176, + "epoch": 0.24, + "learning_rate": 0.0002639475104812548, + "loss": 0.0247, "step": 47640 }, { - "epoch": 0.52, - "learning_rate": 0.00022273140040215343, - "loss": 0.0158, + "epoch": 0.24, + "learning_rate": 0.0002639399427882408, + "loss": 0.0204, "step": 47650 }, { - "epoch": 0.52, - "learning_rate": 0.00022271518453655055, - "loss": 0.0206, + "epoch": 0.24, + "learning_rate": 0.0002639323750952268, + "loss": 0.026, "step": 47660 }, { - "epoch": 0.52, - "learning_rate": 0.00022269896867094764, - "loss": 0.0177, + "epoch": 0.24, + "learning_rate": 0.00026392480740221276, + "loss": 0.0216, "step": 47670 }, { - "epoch": 0.52, - "learning_rate": 0.00022268275280534473, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.00026391723970919874, + "loss": 0.022, "step": 47680 }, { - "epoch": 0.52, - "learning_rate": 0.0002226665369397418, - "loss": 0.0192, + "epoch": 0.24, + "learning_rate": 0.0002639096720161847, + "loss": 0.0216, "step": 47690 }, { - "epoch": 0.52, - "learning_rate": 0.00022265032107413892, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.00026390210432317076, + "loss": 0.0209, "step": 47700 }, { - "epoch": 0.52, - "learning_rate": 0.000222634105208536, - "loss": 0.0179, + "epoch": 0.24, + "learning_rate": 0.00026389453663015674, + "loss": 0.0277, "step": 47710 }, { - "epoch": 0.52, - "learning_rate": 0.00022261788934293313, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.0002638869689371427, + "loss": 0.0262, "step": 47720 }, { - "epoch": 0.52, - "learning_rate": 0.0002226016734773302, - "loss": 0.0177, + "epoch": 0.24, + "learning_rate": 0.0002638794012441287, + "loss": 0.0212, "step": 47730 }, { - "epoch": 0.52, - "learning_rate": 0.0002225854576117273, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.0002638718335511147, + "loss": 0.0265, "step": 47740 }, { - "epoch": 0.52, - "learning_rate": 0.00022256924174612438, - "loss": 0.0217, + "epoch": 0.24, + "learning_rate": 0.00026386426585810066, + "loss": 0.0204, "step": 47750 }, { - "epoch": 0.52, - "learning_rate": 0.0002225530258805215, - "loss": 0.0154, + "epoch": 0.24, + "learning_rate": 0.0002638566981650867, + "loss": 0.0244, "step": 47760 }, { - "epoch": 0.52, - "learning_rate": 0.00022253681001491857, - "loss": 0.0178, + "epoch": 0.24, + "learning_rate": 0.0002638491304720727, + "loss": 0.0235, "step": 47770 }, { - "epoch": 0.52, - "learning_rate": 0.00022252059414931566, - "loss": 0.0208, + "epoch": 0.24, + "learning_rate": 0.00026384156277905866, + "loss": 0.0228, "step": 47780 }, { - "epoch": 0.52, - "learning_rate": 0.00022250437828371278, - "loss": 0.0176, + "epoch": 0.24, + "learning_rate": 0.00026383399508604464, + "loss": 0.0228, "step": 47790 }, { - "epoch": 0.52, - "learning_rate": 0.00022248816241810987, - "loss": 0.0226, + "epoch": 0.24, + "learning_rate": 0.0002638264273930306, + "loss": 0.0253, "step": 47800 }, { - "epoch": 0.52, - "learning_rate": 0.00022247194655250694, - "loss": 0.0192, + "epoch": 0.24, + "learning_rate": 0.0002638188597000166, + "loss": 0.0205, "step": 47810 }, { - "epoch": 0.52, - "learning_rate": 0.00022245573068690403, - "loss": 0.018, + "epoch": 0.24, + "learning_rate": 0.00026381129200700264, + "loss": 0.0226, "step": 47820 }, { - "epoch": 0.52, - "learning_rate": 0.00022243951482130115, - "loss": 0.0163, + "epoch": 0.24, + "learning_rate": 0.0002638037243139886, + "loss": 0.0198, "step": 47830 }, { - "epoch": 0.52, - "learning_rate": 0.00022242329895569824, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.0002637961566209746, + "loss": 0.0209, "step": 47840 }, { - "epoch": 0.52, - "learning_rate": 0.0002224070830900953, - "loss": 0.0208, + "epoch": 0.24, + "learning_rate": 0.0002637885889279606, + "loss": 0.0246, "step": 47850 }, { - "epoch": 0.52, - "learning_rate": 0.00022239086722449243, - "loss": 0.0186, + "epoch": 0.24, + "learning_rate": 0.00026378102123494657, + "loss": 0.0185, "step": 47860 }, { - "epoch": 0.52, - "learning_rate": 0.00022237465135888952, - "loss": 0.0159, + "epoch": 0.24, + "learning_rate": 0.00026377345354193255, + "loss": 0.0212, "step": 47870 }, { - "epoch": 0.52, - "learning_rate": 0.00022235843549328662, - "loss": 0.0173, + "epoch": 0.24, + "learning_rate": 0.00026376588584891853, + "loss": 0.0234, "step": 47880 }, { - "epoch": 0.52, - "learning_rate": 0.00022234221962768368, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.00026375831815590457, + "loss": 0.0225, "step": 47890 }, { - "epoch": 0.52, - "learning_rate": 0.0002223260037620808, - "loss": 0.0189, + "epoch": 0.24, + "learning_rate": 0.00026375075046289055, + "loss": 0.0246, "step": 47900 }, { - "epoch": 0.52, - "learning_rate": 0.0002223097878964779, - "loss": 0.0193, + "epoch": 0.24, + "learning_rate": 0.00026374318276987653, + "loss": 0.0237, "step": 47910 }, { - "epoch": 0.52, - "learning_rate": 0.000222293572030875, - "loss": 0.0196, + "epoch": 0.24, + "learning_rate": 0.0002637356150768625, + "loss": 0.0229, "step": 47920 }, { - "epoch": 0.52, - "learning_rate": 0.00022227735616527208, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.0002637280473838485, + "loss": 0.0238, "step": 47930 }, { - "epoch": 0.52, - "learning_rate": 0.00022226114029966917, - "loss": 0.0222, + "epoch": 0.24, + "learning_rate": 0.0002637204796908345, + "loss": 0.023, "step": 47940 }, { - "epoch": 0.52, - "learning_rate": 0.00022224492443406627, - "loss": 0.0184, + "epoch": 0.24, + "learning_rate": 0.0002637129119978205, + "loss": 0.0245, "step": 47950 }, { - "epoch": 0.52, - "learning_rate": 0.00022222870856846338, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.0002637053443048065, + "loss": 0.024, "step": 47960 }, { - "epoch": 0.52, - "learning_rate": 0.00022221249270286045, - "loss": 0.0181, + "epoch": 0.24, + "learning_rate": 0.00026369777661179247, + "loss": 0.0206, "step": 47970 }, { - "epoch": 0.52, - "learning_rate": 0.00022219627683725754, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.00026369020891877845, + "loss": 0.0229, "step": 47980 }, { - "epoch": 0.52, - "learning_rate": 0.00022218006097165466, - "loss": 0.0218, + "epoch": 0.24, + "learning_rate": 0.00026368264122576444, + "loss": 0.0198, "step": 47990 }, { - "epoch": 0.52, - "learning_rate": 0.00022216384510605176, - "loss": 0.0211, + "epoch": 0.24, + "learning_rate": 0.0002636750735327504, + "loss": 0.0226, "step": 48000 }, { - "epoch": 0.52, - "eval_cer": 0.9215460437741146, - "eval_loss": 0.013234671205282211, - "eval_runtime": 121.4322, - "eval_samples_per_second": 16.47, - "eval_steps_per_second": 4.118, + "epoch": 0.24, + "eval_cer": 0.9144945158062973, + "eval_loss": 0.015514707192778587, + "eval_runtime": 117.0856, + "eval_samples_per_second": 17.082, + "eval_steps_per_second": 4.27, "step": 48000 }, { - "epoch": 0.52, - "learning_rate": 0.00022214762924044882, - "loss": 0.0167, + "epoch": 0.24, + "learning_rate": 0.00026366750583973645, + "loss": 0.0243, "step": 48010 }, { - "epoch": 0.52, - "learning_rate": 0.00022213141337484591, - "loss": 0.0182, + "epoch": 0.24, + "learning_rate": 0.00026365993814672243, + "loss": 0.0214, "step": 48020 }, { - "epoch": 0.52, - "learning_rate": 0.00022211519750924303, - "loss": 0.0195, + "epoch": 0.24, + "learning_rate": 0.0002636523704537084, + "loss": 0.0243, "step": 48030 }, { - "epoch": 0.52, - "learning_rate": 0.00022209898164364013, - "loss": 0.0179, + "epoch": 0.24, + "learning_rate": 0.0002636448027606944, + "loss": 0.0254, "step": 48040 }, { - "epoch": 0.52, - "learning_rate": 0.0002220827657780372, - "loss": 0.0152, + "epoch": 0.24, + "learning_rate": 0.0002636372350676804, + "loss": 0.023, "step": 48050 }, { - "epoch": 0.52, - "learning_rate": 0.0002220665499124343, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.00026362966737466636, + "loss": 0.0218, "step": 48060 }, { - "epoch": 0.52, - "learning_rate": 0.0002220503340468314, - "loss": 0.018, + "epoch": 0.24, + "learning_rate": 0.00026362209968165234, + "loss": 0.0228, "step": 48070 }, { - "epoch": 0.52, - "learning_rate": 0.0002220341181812285, - "loss": 0.0173, + "epoch": 0.24, + "learning_rate": 0.0002636145319886384, + "loss": 0.0219, "step": 48080 }, { - "epoch": 0.52, - "learning_rate": 0.00022201790231562556, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.00026360696429562436, + "loss": 0.0156, "step": 48090 }, { - "epoch": 0.52, - "learning_rate": 0.00022200168645002268, - "loss": 0.0184, + "epoch": 0.24, + "learning_rate": 0.00026359939660261034, + "loss": 0.0239, "step": 48100 }, { - "epoch": 0.52, - "learning_rate": 0.00022198547058441978, - "loss": 0.0182, + "epoch": 0.24, + "learning_rate": 0.0002635918289095963, + "loss": 0.0257, "step": 48110 }, { - "epoch": 0.52, - "learning_rate": 0.00022196925471881687, - "loss": 0.0173, + "epoch": 0.24, + "learning_rate": 0.0002635842612165823, + "loss": 0.0211, "step": 48120 }, { - "epoch": 0.52, - "learning_rate": 0.00022195303885321396, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.0002635766935235683, + "loss": 0.0273, "step": 48130 }, { - "epoch": 0.52, - "learning_rate": 0.00022193682298761105, - "loss": 0.0181, + "epoch": 0.24, + "learning_rate": 0.0002635691258305543, + "loss": 0.0219, "step": 48140 }, { - "epoch": 0.52, - "learning_rate": 0.00022192060712200815, - "loss": 0.0169, + "epoch": 0.24, + "learning_rate": 0.0002635615581375403, + "loss": 0.0251, "step": 48150 }, { - "epoch": 0.52, - "learning_rate": 0.00022190439125640527, - "loss": 0.0201, + "epoch": 0.24, + "learning_rate": 0.0002635539904445263, + "loss": 0.0212, "step": 48160 }, { - "epoch": 0.52, - "learning_rate": 0.00022188817539080233, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.00026354642275151226, + "loss": 0.0205, "step": 48170 }, { - "epoch": 0.52, - "learning_rate": 0.00022187195952519943, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.00026353885505849825, + "loss": 0.0199, "step": 48180 }, { - "epoch": 0.52, - "learning_rate": 0.00022185574365959652, - "loss": 0.0211, + "epoch": 0.24, + "learning_rate": 0.0002635312873654842, + "loss": 0.0203, "step": 48190 }, { - "epoch": 0.52, - "learning_rate": 0.00022183952779399364, - "loss": 0.0175, + "epoch": 0.24, + "learning_rate": 0.0002635237196724702, + "loss": 0.0216, "step": 48200 }, { - "epoch": 0.52, - "learning_rate": 0.00022182331192839073, - "loss": 0.0199, + "epoch": 0.24, + "learning_rate": 0.00026351615197945624, + "loss": 0.0198, "step": 48210 }, { - "epoch": 0.52, - "learning_rate": 0.0002218070960627878, - "loss": 0.02, + "epoch": 0.24, + "learning_rate": 0.0002635085842864422, + "loss": 0.0235, "step": 48220 }, { - "epoch": 0.52, - "learning_rate": 0.00022179088019718492, - "loss": 0.0225, + "epoch": 0.24, + "learning_rate": 0.0002635010165934282, + "loss": 0.0244, "step": 48230 }, { - "epoch": 0.52, - "learning_rate": 0.000221774664331582, - "loss": 0.0186, + "epoch": 0.24, + "learning_rate": 0.0002634934489004142, + "loss": 0.0211, "step": 48240 }, { - "epoch": 0.52, - "learning_rate": 0.0002217584484659791, - "loss": 0.0184, + "epoch": 0.24, + "learning_rate": 0.00026348588120740017, + "loss": 0.0189, "step": 48250 }, { - "epoch": 0.52, - "learning_rate": 0.00022174223260037617, - "loss": 0.0179, + "epoch": 0.24, + "learning_rate": 0.00026347831351438615, + "loss": 0.0228, "step": 48260 }, { - "epoch": 0.52, - "learning_rate": 0.0002217260167347733, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.0002634707458213722, + "loss": 0.0208, "step": 48270 }, { - "epoch": 0.52, - "learning_rate": 0.00022170980086917038, - "loss": 0.0215, + "epoch": 0.24, + "learning_rate": 0.00026346317812835817, + "loss": 0.024, "step": 48280 }, { - "epoch": 0.52, - "learning_rate": 0.0002216935850035675, - "loss": 0.0155, + "epoch": 0.24, + "learning_rate": 0.00026345561043534415, + "loss": 0.0229, "step": 48290 }, { - "epoch": 0.52, - "learning_rate": 0.00022167736913796457, - "loss": 0.0175, + "epoch": 0.24, + "learning_rate": 0.00026344804274233013, + "loss": 0.0207, "step": 48300 }, { - "epoch": 0.52, - "learning_rate": 0.00022166115327236166, - "loss": 0.0176, + "epoch": 0.24, + "learning_rate": 0.0002634404750493161, + "loss": 0.0215, "step": 48310 }, { - "epoch": 0.52, - "learning_rate": 0.00022164493740675875, - "loss": 0.016, + "epoch": 0.24, + "learning_rate": 0.0002634329073563021, + "loss": 0.0354, "step": 48320 }, { - "epoch": 0.52, - "learning_rate": 0.00022162872154115587, - "loss": 0.0175, + "epoch": 0.24, + "learning_rate": 0.00026342533966328813, + "loss": 0.0351, "step": 48330 }, { - "epoch": 0.52, - "learning_rate": 0.00022161250567555294, - "loss": 0.0191, + "epoch": 0.24, + "learning_rate": 0.0002634177719702741, + "loss": 0.0239, "step": 48340 }, { - "epoch": 0.52, - "learning_rate": 0.00022159628980995003, - "loss": 0.0193, + "epoch": 0.24, + "learning_rate": 0.0002634102042772601, + "loss": 0.0199, "step": 48350 }, { - "epoch": 0.52, - "learning_rate": 0.00022158007394434715, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.0002634026365842461, + "loss": 0.0196, "step": 48360 }, { - "epoch": 0.52, - "learning_rate": 0.00022156385807874424, - "loss": 0.0208, + "epoch": 0.24, + "learning_rate": 0.00026339506889123206, + "loss": 0.0282, "step": 48370 }, { - "epoch": 0.52, - "learning_rate": 0.0002215476422131413, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.00026338750119821804, + "loss": 0.0207, "step": 48380 }, { - "epoch": 0.52, - "learning_rate": 0.0002215314263475384, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.000263379933505204, + "loss": 0.0238, "step": 48390 }, { - "epoch": 0.52, - "learning_rate": 0.00022151521048193552, - "loss": 0.016, + "epoch": 0.24, + "learning_rate": 0.00026337236581219, + "loss": 0.0243, "step": 48400 }, { - "epoch": 0.52, - "learning_rate": 0.0002214989946163326, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.000263364798119176, + "loss": 0.0196, "step": 48410 }, { - "epoch": 0.52, - "learning_rate": 0.00022148277875072968, - "loss": 0.0199, + "epoch": 0.24, + "learning_rate": 0.00026335723042616196, + "loss": 0.0195, "step": 48420 }, { - "epoch": 0.52, - "learning_rate": 0.0002214665628851268, - "loss": 0.0221, + "epoch": 0.24, + "learning_rate": 0.00026334966273314794, + "loss": 0.0169, "step": 48430 }, { - "epoch": 0.52, - "learning_rate": 0.0002214503470195239, - "loss": 0.0197, + "epoch": 0.24, + "learning_rate": 0.000263342095040134, + "loss": 0.0239, "step": 48440 }, { - "epoch": 0.52, - "learning_rate": 0.00022143413115392098, - "loss": 0.0204, + "epoch": 0.24, + "learning_rate": 0.00026333452734711996, + "loss": 0.0218, "step": 48450 }, { - "epoch": 0.52, - "learning_rate": 0.00022141791528831805, - "loss": 0.0205, + "epoch": 0.24, + "learning_rate": 0.00026332695965410594, + "loss": 0.0185, "step": 48460 }, { - "epoch": 0.52, - "learning_rate": 0.00022140169942271517, - "loss": 0.0201, + "epoch": 0.24, + "learning_rate": 0.0002633193919610919, + "loss": 0.0182, "step": 48470 }, { - "epoch": 0.52, - "learning_rate": 0.00022138548355711226, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.0002633118242680779, + "loss": 0.0219, "step": 48480 }, { - "epoch": 0.52, - "learning_rate": 0.00022136926769150935, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.0002633042565750639, + "loss": 0.0188, "step": 48490 }, { - "epoch": 0.52, - "learning_rate": 0.00022135305182590645, - "loss": 0.0157, + "epoch": 0.24, + "learning_rate": 0.0002632966888820499, + "loss": 0.0259, "step": 48500 }, { - "epoch": 0.52, - "learning_rate": 0.00022133683596030354, - "loss": 0.0208, + "epoch": 0.24, + "learning_rate": 0.0002632891211890359, + "loss": 0.0259, "step": 48510 }, { - "epoch": 0.52, - "learning_rate": 0.00022132062009470063, - "loss": 0.0159, + "epoch": 0.24, + "learning_rate": 0.0002632815534960219, + "loss": 0.0211, "step": 48520 }, { - "epoch": 0.52, - "learning_rate": 0.00022130440422909775, - "loss": 0.02, + "epoch": 0.24, + "learning_rate": 0.00026327398580300787, + "loss": 0.0176, "step": 48530 }, { - "epoch": 0.52, - "learning_rate": 0.00022128818836349482, - "loss": 0.0197, + "epoch": 0.24, + "learning_rate": 0.00026326641810999385, + "loss": 0.0215, "step": 48540 }, { - "epoch": 0.52, - "learning_rate": 0.0002212719724978919, - "loss": 0.0206, + "epoch": 0.24, + "learning_rate": 0.00026325885041697983, + "loss": 0.0193, "step": 48550 }, { - "epoch": 0.52, - "learning_rate": 0.000221255756632289, - "loss": 0.0189, + "epoch": 0.24, + "learning_rate": 0.00026325128272396587, + "loss": 0.0211, "step": 48560 }, { - "epoch": 0.53, - "learning_rate": 0.00022123954076668612, - "loss": 0.0193, + "epoch": 0.25, + "learning_rate": 0.00026324371503095185, + "loss": 0.0204, "step": 48570 }, { - "epoch": 0.53, - "learning_rate": 0.0002212233249010832, - "loss": 0.0186, + "epoch": 0.25, + "learning_rate": 0.00026323614733793783, + "loss": 0.0194, "step": 48580 }, { - "epoch": 0.53, - "learning_rate": 0.00022120710903548028, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.0002632285796449238, + "loss": 0.0161, "step": 48590 }, { - "epoch": 0.53, - "learning_rate": 0.0002211908931698774, - "loss": 0.0204, + "epoch": 0.25, + "learning_rate": 0.0002632210119519098, + "loss": 0.0273, "step": 48600 }, { - "epoch": 0.53, - "learning_rate": 0.0002211746773042745, - "loss": 0.0209, + "epoch": 0.25, + "learning_rate": 0.00026321344425889577, + "loss": 0.0227, "step": 48610 }, { - "epoch": 0.53, - "learning_rate": 0.00022115846143867156, - "loss": 0.0204, + "epoch": 0.25, + "learning_rate": 0.00026320587656588175, + "loss": 0.0217, "step": 48620 }, { - "epoch": 0.53, - "learning_rate": 0.00022114224557306865, - "loss": 0.0162, + "epoch": 0.25, + "learning_rate": 0.0002631983088728678, + "loss": 0.0256, "step": 48630 }, { - "epoch": 0.53, - "learning_rate": 0.00022112602970746577, - "loss": 0.0148, + "epoch": 0.25, + "learning_rate": 0.00026319074117985377, + "loss": 0.0195, "step": 48640 }, { - "epoch": 0.53, - "learning_rate": 0.00022110981384186287, - "loss": 0.0186, + "epoch": 0.25, + "learning_rate": 0.00026318317348683975, + "loss": 0.0206, "step": 48650 }, { - "epoch": 0.53, - "learning_rate": 0.00022109359797625993, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.00026317560579382573, + "loss": 0.0203, "step": 48660 }, { - "epoch": 0.53, - "learning_rate": 0.00022107738211065705, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.0002631680381008117, + "loss": 0.0292, "step": 48670 }, { - "epoch": 0.53, - "learning_rate": 0.00022106116624505414, - "loss": 0.0219, + "epoch": 0.25, + "learning_rate": 0.0002631604704077977, + "loss": 0.0227, "step": 48680 }, { - "epoch": 0.53, - "learning_rate": 0.00022104495037945124, - "loss": 0.0183, + "epoch": 0.25, + "learning_rate": 0.00026315290271478373, + "loss": 0.0221, "step": 48690 }, { - "epoch": 0.53, - "learning_rate": 0.0002210287345138483, - "loss": 0.0172, + "epoch": 0.25, + "learning_rate": 0.0002631453350217697, + "loss": 0.0199, "step": 48700 }, { - "epoch": 0.53, - "learning_rate": 0.00022101251864824542, - "loss": 0.0185, + "epoch": 0.25, + "learning_rate": 0.0002631377673287557, + "loss": 0.0205, "step": 48710 }, { - "epoch": 0.53, - "learning_rate": 0.00022099630278264251, - "loss": 0.0207, + "epoch": 0.25, + "learning_rate": 0.0002631301996357417, + "loss": 0.0198, "step": 48720 }, { - "epoch": 0.53, - "learning_rate": 0.00022098008691703963, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.00026312263194272766, + "loss": 0.0239, "step": 48730 }, { - "epoch": 0.53, - "learning_rate": 0.0002209638710514367, + "epoch": 0.25, + "learning_rate": 0.00026311506424971364, "loss": 0.0193, "step": 48740 }, { - "epoch": 0.53, - "learning_rate": 0.0002209476551858338, - "loss": 0.0191, + "epoch": 0.25, + "learning_rate": 0.0002631074965566996, + "loss": 0.0203, "step": 48750 }, { - "epoch": 0.53, - "learning_rate": 0.00022093143932023089, - "loss": 0.0204, + "epoch": 0.25, + "learning_rate": 0.00026309992886368566, + "loss": 0.0259, "step": 48760 }, { - "epoch": 0.53, - "learning_rate": 0.000220915223454628, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.00026309236117067164, + "loss": 0.0228, "step": 48770 }, { - "epoch": 0.53, - "learning_rate": 0.00022089900758902507, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.0002630847934776576, + "loss": 0.0207, "step": 48780 }, { - "epoch": 0.53, - "learning_rate": 0.00022088279172342216, - "loss": 0.018, + "epoch": 0.25, + "learning_rate": 0.0002630772257846436, + "loss": 0.0235, "step": 48790 }, { - "epoch": 0.53, - "learning_rate": 0.00022086657585781928, - "loss": 0.0158, + "epoch": 0.25, + "learning_rate": 0.0002630696580916296, + "loss": 0.0219, "step": 48800 }, { - "epoch": 0.53, - "learning_rate": 0.00022085035999221638, - "loss": 0.0204, + "epoch": 0.25, + "learning_rate": 0.00026306209039861556, + "loss": 0.0228, "step": 48810 }, { - "epoch": 0.53, - "learning_rate": 0.00022083414412661344, - "loss": 0.0198, + "epoch": 0.25, + "learning_rate": 0.0002630545227056016, + "loss": 0.021, "step": 48820 }, { - "epoch": 0.53, - "learning_rate": 0.00022081792826101053, - "loss": 0.0206, + "epoch": 0.25, + "learning_rate": 0.0002630469550125876, + "loss": 0.0212, "step": 48830 }, { - "epoch": 0.53, - "learning_rate": 0.00022080171239540765, - "loss": 0.016, + "epoch": 0.25, + "learning_rate": 0.00026303938731957356, + "loss": 0.0202, "step": 48840 }, { - "epoch": 0.53, - "learning_rate": 0.00022078549652980475, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.00026303181962655954, + "loss": 0.0193, "step": 48850 }, { - "epoch": 0.53, - "learning_rate": 0.0002207692806642018, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.0002630242519335455, + "loss": 0.0174, "step": 48860 }, { - "epoch": 0.53, - "learning_rate": 0.00022075306479859893, - "loss": 0.0186, + "epoch": 0.25, + "learning_rate": 0.0002630166842405315, + "loss": 0.0211, "step": 48870 }, { - "epoch": 0.53, - "learning_rate": 0.00022073684893299603, - "loss": 0.0168, + "epoch": 0.25, + "learning_rate": 0.00026300911654751754, + "loss": 0.0255, "step": 48880 }, { - "epoch": 0.53, - "learning_rate": 0.00022072063306739312, - "loss": 0.0247, + "epoch": 0.25, + "learning_rate": 0.0002630015488545035, + "loss": 0.0251, "step": 48890 }, { - "epoch": 0.53, - "learning_rate": 0.00022070441720179018, - "loss": 0.0187, + "epoch": 0.25, + "learning_rate": 0.0002629939811614895, + "loss": 0.0213, "step": 48900 }, { - "epoch": 0.53, - "learning_rate": 0.0002206882013361873, - "loss": 0.0187, + "epoch": 0.25, + "learning_rate": 0.0002629864134684755, + "loss": 0.0236, "step": 48910 }, { - "epoch": 0.53, - "learning_rate": 0.0002206719854705844, - "loss": 0.0197, + "epoch": 0.25, + "learning_rate": 0.00026297884577546147, + "loss": 0.0214, "step": 48920 }, { - "epoch": 0.53, - "learning_rate": 0.0002206557696049815, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.00026297127808244745, + "loss": 0.0194, "step": 48930 }, { - "epoch": 0.53, - "learning_rate": 0.0002206395537393786, - "loss": 0.02, + "epoch": 0.25, + "learning_rate": 0.00026296371038943343, + "loss": 0.0219, "step": 48940 }, { - "epoch": 0.53, - "learning_rate": 0.00022062333787377567, - "loss": 0.0209, + "epoch": 0.25, + "learning_rate": 0.00026295614269641947, + "loss": 0.0216, "step": 48950 }, { - "epoch": 0.53, - "learning_rate": 0.00022060712200817277, - "loss": 0.0193, + "epoch": 0.25, + "learning_rate": 0.00026294857500340545, + "loss": 0.0219, "step": 48960 }, { - "epoch": 0.53, - "learning_rate": 0.0002205909061425699, - "loss": 0.0298, + "epoch": 0.25, + "learning_rate": 0.00026294100731039143, + "loss": 0.0237, "step": 48970 }, { - "epoch": 0.53, - "learning_rate": 0.00022057469027696698, - "loss": 0.0256, + "epoch": 0.25, + "learning_rate": 0.0002629334396173774, + "loss": 0.0216, "step": 48980 }, { - "epoch": 0.53, - "learning_rate": 0.00022055847441136405, - "loss": 0.022, + "epoch": 0.25, + "learning_rate": 0.0002629258719243634, + "loss": 0.0226, "step": 48990 }, { - "epoch": 0.53, - "learning_rate": 0.00022054225854576117, - "loss": 0.0184, + "epoch": 0.25, + "learning_rate": 0.0002629183042313494, + "loss": 0.0171, "step": 49000 }, { - "epoch": 0.53, - "eval_cer": 0.921567758848024, - "eval_loss": 0.013597916811704636, - "eval_runtime": 121.4697, - "eval_samples_per_second": 16.465, - "eval_steps_per_second": 4.116, + "epoch": 0.25, + "eval_cer": 0.914452788772905, + "eval_loss": 0.01547841913998127, + "eval_runtime": 116.9106, + "eval_samples_per_second": 17.107, + "eval_steps_per_second": 4.277, "step": 49000 }, { - "epoch": 0.53, - "learning_rate": 0.00022052604268015826, - "loss": 0.0191, + "epoch": 0.25, + "learning_rate": 0.0002629107365383354, + "loss": 0.0207, "step": 49010 }, { - "epoch": 0.53, - "learning_rate": 0.00022050982681455535, - "loss": 0.0179, + "epoch": 0.25, + "learning_rate": 0.0002629031688453214, + "loss": 0.0196, "step": 49020 }, { - "epoch": 0.53, - "learning_rate": 0.00022049361094895242, - "loss": 0.0198, + "epoch": 0.25, + "learning_rate": 0.0002628956011523074, + "loss": 0.0228, "step": 49030 }, { - "epoch": 0.53, - "learning_rate": 0.00022047739508334954, - "loss": 0.0202, + "epoch": 0.25, + "learning_rate": 0.00026288803345929335, + "loss": 0.0224, "step": 49040 }, { - "epoch": 0.53, - "learning_rate": 0.00022046117921774663, - "loss": 0.016, + "epoch": 0.25, + "learning_rate": 0.00026288046576627934, + "loss": 0.0213, "step": 49050 }, { - "epoch": 0.53, - "learning_rate": 0.00022044496335214372, - "loss": 0.0199, + "epoch": 0.25, + "learning_rate": 0.0002628728980732653, + "loss": 0.02, "step": 49060 }, { - "epoch": 0.53, - "learning_rate": 0.00022042874748654081, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.00026286533038025135, + "loss": 0.0183, "step": 49070 }, { - "epoch": 0.53, - "learning_rate": 0.0002204125316209379, - "loss": 0.0186, + "epoch": 0.25, + "learning_rate": 0.00026285776268723733, + "loss": 0.023, "step": 49080 }, { - "epoch": 0.53, - "learning_rate": 0.000220396315755335, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.0002628501949942233, + "loss": 0.0184, "step": 49090 }, { - "epoch": 0.53, - "learning_rate": 0.00022038009988973212, - "loss": 0.0179, + "epoch": 0.25, + "learning_rate": 0.0002628426273012093, + "loss": 0.0265, "step": 49100 }, { - "epoch": 0.53, - "learning_rate": 0.00022036388402412919, - "loss": 0.0206, + "epoch": 0.25, + "learning_rate": 0.0002628350596081953, + "loss": 0.023, "step": 49110 }, { - "epoch": 0.53, - "learning_rate": 0.00022034766815852628, - "loss": 0.0158, + "epoch": 0.25, + "learning_rate": 0.00026282749191518126, + "loss": 0.0267, "step": 49120 }, { - "epoch": 0.53, - "learning_rate": 0.00022033145229292337, - "loss": 0.0193, + "epoch": 0.25, + "learning_rate": 0.00026281992422216724, + "loss": 0.021, "step": 49130 }, { - "epoch": 0.53, - "learning_rate": 0.0002203152364273205, - "loss": 0.0181, + "epoch": 0.25, + "learning_rate": 0.0002628123565291533, + "loss": 0.0201, "step": 49140 }, { - "epoch": 0.53, - "learning_rate": 0.00022029902056171756, - "loss": 0.0187, + "epoch": 0.25, + "learning_rate": 0.00026280478883613926, + "loss": 0.023, "step": 49150 }, { - "epoch": 0.53, - "learning_rate": 0.00022028280469611465, - "loss": 0.0197, + "epoch": 0.25, + "learning_rate": 0.00026279722114312524, + "loss": 0.0224, "step": 49160 }, { - "epoch": 0.53, - "learning_rate": 0.00022026658883051177, - "loss": 0.0192, + "epoch": 0.25, + "learning_rate": 0.0002627896534501112, + "loss": 0.0228, "step": 49170 }, { - "epoch": 0.53, - "learning_rate": 0.00022025037296490886, - "loss": 0.0181, + "epoch": 0.25, + "learning_rate": 0.0002627820857570972, + "loss": 0.022, "step": 49180 }, { - "epoch": 0.53, - "learning_rate": 0.00022023415709930593, - "loss": 0.0214, + "epoch": 0.25, + "learning_rate": 0.0002627745180640832, + "loss": 0.0164, "step": 49190 }, { - "epoch": 0.53, - "learning_rate": 0.00022021794123370302, - "loss": 0.0175, + "epoch": 0.25, + "learning_rate": 0.0002627669503710692, + "loss": 0.018, "step": 49200 }, { - "epoch": 0.53, - "learning_rate": 0.00022020172536810014, - "loss": 0.0159, + "epoch": 0.25, + "learning_rate": 0.0002627593826780552, + "loss": 0.0173, "step": 49210 }, { - "epoch": 0.53, - "learning_rate": 0.00022018550950249723, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.0002627518149850412, + "loss": 0.0205, "step": 49220 }, { - "epoch": 0.53, - "learning_rate": 0.0002201692936368943, - "loss": 0.0173, + "epoch": 0.25, + "learning_rate": 0.00026274424729202716, + "loss": 0.0234, "step": 49230 }, { - "epoch": 0.53, - "learning_rate": 0.00022015307777129142, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.00026273667959901315, + "loss": 0.0218, "step": 49240 }, { - "epoch": 0.53, - "learning_rate": 0.0002201368619056885, - "loss": 0.0174, + "epoch": 0.25, + "learning_rate": 0.00026272911190599913, + "loss": 0.0169, "step": 49250 }, { - "epoch": 0.53, - "learning_rate": 0.0002201206460400856, - "loss": 0.0207, + "epoch": 0.25, + "learning_rate": 0.0002627215442129851, + "loss": 0.0187, "step": 49260 }, { - "epoch": 0.53, - "learning_rate": 0.00022010443017448267, - "loss": 0.0235, + "epoch": 0.25, + "learning_rate": 0.00026271397651997114, + "loss": 0.0195, "step": 49270 }, { - "epoch": 0.53, - "learning_rate": 0.0002200882143088798, - "loss": 0.019, + "epoch": 0.25, + "learning_rate": 0.0002627064088269571, + "loss": 0.0175, "step": 49280 }, { - "epoch": 0.53, - "learning_rate": 0.00022007199844327688, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.0002626988411339431, + "loss": 0.0215, "step": 49290 }, { - "epoch": 0.53, - "learning_rate": 0.000220055782577674, - "loss": 0.0196, + "epoch": 0.25, + "learning_rate": 0.0002626912734409291, + "loss": 0.0204, "step": 49300 }, { - "epoch": 0.53, - "learning_rate": 0.00022003956671207107, - "loss": 0.0227, + "epoch": 0.25, + "learning_rate": 0.00026268370574791507, + "loss": 0.0264, "step": 49310 }, { - "epoch": 0.53, - "learning_rate": 0.00022002335084646816, - "loss": 0.0186, + "epoch": 0.25, + "learning_rate": 0.00026267613805490105, + "loss": 0.0278, "step": 49320 }, { - "epoch": 0.53, - "learning_rate": 0.00022000713498086525, - "loss": 0.0188, + "epoch": 0.25, + "learning_rate": 0.0002626685703618871, + "loss": 0.0248, "step": 49330 }, { - "epoch": 0.53, - "learning_rate": 0.00021999091911526237, - "loss": 0.0201, + "epoch": 0.25, + "learning_rate": 0.00026266100266887307, + "loss": 0.0231, "step": 49340 }, { - "epoch": 0.53, - "learning_rate": 0.00021997470324965944, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.00026265343497585905, + "loss": 0.0239, "step": 49350 }, { - "epoch": 0.53, - "learning_rate": 0.00021995848738405653, - "loss": 0.0241, + "epoch": 0.25, + "learning_rate": 0.00026264586728284503, + "loss": 0.0204, "step": 49360 }, { - "epoch": 0.53, - "learning_rate": 0.00021994227151845365, - "loss": 0.0227, + "epoch": 0.25, + "learning_rate": 0.000262638299589831, + "loss": 0.021, "step": 49370 }, { - "epoch": 0.53, - "learning_rate": 0.00021992605565285074, - "loss": 0.0157, + "epoch": 0.25, + "learning_rate": 0.000262630731896817, + "loss": 0.0216, "step": 49380 }, { - "epoch": 0.53, - "learning_rate": 0.0002199098397872478, - "loss": 0.0149, + "epoch": 0.25, + "learning_rate": 0.00026262316420380303, + "loss": 0.022, "step": 49390 }, { - "epoch": 0.53, - "learning_rate": 0.0002198936239216449, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.000262615596510789, + "loss": 0.02, "step": 49400 }, { - "epoch": 0.53, - "learning_rate": 0.00021987740805604202, - "loss": 0.0238, + "epoch": 0.25, + "learning_rate": 0.000262608028817775, + "loss": 0.0201, "step": 49410 }, { - "epoch": 0.53, - "learning_rate": 0.00021986119219043912, - "loss": 0.0172, + "epoch": 0.25, + "learning_rate": 0.000262600461124761, + "loss": 0.0203, "step": 49420 }, { - "epoch": 0.53, - "learning_rate": 0.00021984497632483618, - "loss": 0.0191, + "epoch": 0.25, + "learning_rate": 0.00026259289343174696, + "loss": 0.0205, "step": 49430 }, { - "epoch": 0.53, - "learning_rate": 0.0002198287604592333, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.00026258532573873294, + "loss": 0.0223, "step": 49440 }, { - "epoch": 0.53, - "learning_rate": 0.0002198125445936304, - "loss": 0.0158, + "epoch": 0.25, + "learning_rate": 0.0002625777580457189, + "loss": 0.0216, "step": 49450 }, { - "epoch": 0.53, - "learning_rate": 0.00021979632872802749, - "loss": 0.0169, + "epoch": 0.25, + "learning_rate": 0.00026257019035270495, + "loss": 0.0212, "step": 49460 }, { - "epoch": 0.53, - "learning_rate": 0.00021978011286242455, - "loss": 0.0189, + "epoch": 0.25, + "learning_rate": 0.00026256262265969094, + "loss": 0.0207, "step": 49470 }, { - "epoch": 0.53, - "learning_rate": 0.00021976389699682167, - "loss": 0.0164, + "epoch": 0.25, + "learning_rate": 0.0002625550549666769, + "loss": 0.0235, "step": 49480 }, { - "epoch": 0.54, - "learning_rate": 0.00021974768113121876, - "loss": 0.0204, + "epoch": 0.25, + "learning_rate": 0.0002625474872736629, + "loss": 0.0181, "step": 49490 }, { - "epoch": 0.54, - "learning_rate": 0.00021973146526561586, - "loss": 0.0191, + "epoch": 0.25, + "learning_rate": 0.0002625399195806489, + "loss": 0.0182, "step": 49500 }, { - "epoch": 0.54, - "learning_rate": 0.00021971524940001295, - "loss": 0.0214, + "epoch": 0.25, + "learning_rate": 0.00026253235188763486, + "loss": 0.0221, "step": 49510 }, { - "epoch": 0.54, - "learning_rate": 0.00021969903353441004, - "loss": 0.0211, + "epoch": 0.25, + "learning_rate": 0.0002625247841946209, + "loss": 0.0301, "step": 49520 }, { - "epoch": 0.54, - "learning_rate": 0.00021968281766880714, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.0002625172165016069, + "loss": 0.0225, "step": 49530 }, { - "epoch": 0.54, - "learning_rate": 0.00021966660180320426, - "loss": 0.02, + "epoch": 0.25, + "learning_rate": 0.00026250964880859286, + "loss": 0.0241, "step": 49540 }, { - "epoch": 0.54, - "learning_rate": 0.00021965038593760132, - "loss": 0.0175, + "epoch": 0.25, + "learning_rate": 0.00026250208111557884, + "loss": 0.0226, "step": 49550 }, { - "epoch": 0.54, - "learning_rate": 0.00021963417007199841, - "loss": 0.0213, + "epoch": 0.25, + "learning_rate": 0.0002624945134225648, + "loss": 0.0236, "step": 49560 }, { - "epoch": 0.54, - "learning_rate": 0.0002196179542063955, - "loss": 0.0212, + "epoch": 0.25, + "learning_rate": 0.0002624869457295508, + "loss": 0.0215, "step": 49570 }, { - "epoch": 0.54, - "learning_rate": 0.00021960173834079263, - "loss": 0.0168, + "epoch": 0.25, + "learning_rate": 0.00026247937803653684, + "loss": 0.0232, "step": 49580 }, { - "epoch": 0.54, - "learning_rate": 0.0002195855224751897, - "loss": 0.0204, + "epoch": 0.25, + "learning_rate": 0.0002624718103435228, + "loss": 0.02, "step": 49590 }, { - "epoch": 0.54, - "learning_rate": 0.00021956930660958678, - "loss": 0.0174, + "epoch": 0.25, + "learning_rate": 0.0002624642426505088, + "loss": 0.0189, "step": 49600 }, { - "epoch": 0.54, - "learning_rate": 0.0002195530907439839, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.0002624566749574948, + "loss": 0.0234, "step": 49610 }, { - "epoch": 0.54, - "learning_rate": 0.000219536874878381, - "loss": 0.0193, + "epoch": 0.25, + "learning_rate": 0.00026244910726448077, + "loss": 0.0208, "step": 49620 }, { - "epoch": 0.54, - "learning_rate": 0.00021952065901277806, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.00026244153957146675, + "loss": 0.0176, "step": 49630 }, { - "epoch": 0.54, - "learning_rate": 0.00021950444314717516, - "loss": 0.0185, + "epoch": 0.25, + "learning_rate": 0.00026243397187845273, + "loss": 0.0277, "step": 49640 }, { - "epoch": 0.54, - "learning_rate": 0.00021948822728157228, - "loss": 0.0172, + "epoch": 0.25, + "learning_rate": 0.0002624264041854387, + "loss": 0.0259, "step": 49650 }, { - "epoch": 0.54, - "learning_rate": 0.00021947201141596937, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.0002624188364924247, + "loss": 0.0293, "step": 49660 }, { - "epoch": 0.54, - "learning_rate": 0.0002194557955503665, - "loss": 0.019, + "epoch": 0.25, + "learning_rate": 0.0002624112687994107, + "loss": 0.0237, "step": 49670 }, { - "epoch": 0.54, - "learning_rate": 0.00021943957968476355, - "loss": 0.0192, + "epoch": 0.25, + "learning_rate": 0.00026240370110639665, + "loss": 0.0198, "step": 49680 }, { - "epoch": 0.54, - "learning_rate": 0.00021942336381916065, - "loss": 0.0197, + "epoch": 0.25, + "learning_rate": 0.0002623961334133827, + "loss": 0.0218, "step": 49690 }, { - "epoch": 0.54, - "learning_rate": 0.00021940714795355774, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.00026238856572036867, + "loss": 0.0217, "step": 49700 }, { - "epoch": 0.54, - "learning_rate": 0.00021939093208795486, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.00026238099802735465, + "loss": 0.0206, "step": 49710 }, { - "epoch": 0.54, - "learning_rate": 0.00021937471622235192, - "loss": 0.0172, + "epoch": 0.25, + "learning_rate": 0.00026237343033434063, + "loss": 0.0174, "step": 49720 }, { - "epoch": 0.54, - "learning_rate": 0.00021935850035674902, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.0002623658626413266, + "loss": 0.0238, "step": 49730 }, { - "epoch": 0.54, - "learning_rate": 0.00021934228449114614, - "loss": 0.0167, + "epoch": 0.25, + "learning_rate": 0.0002623582949483126, + "loss": 0.0251, "step": 49740 }, { - "epoch": 0.54, - "learning_rate": 0.00021932606862554323, - "loss": 0.0191, + "epoch": 0.25, + "learning_rate": 0.00026235072725529863, + "loss": 0.0189, "step": 49750 }, { - "epoch": 0.54, - "learning_rate": 0.0002193098527599403, - "loss": 0.0176, + "epoch": 0.25, + "learning_rate": 0.0002623431595622846, + "loss": 0.019, "step": 49760 }, { - "epoch": 0.54, - "learning_rate": 0.0002192936368943374, - "loss": 0.0168, + "epoch": 0.25, + "learning_rate": 0.0002623355918692706, + "loss": 0.0216, "step": 49770 }, { - "epoch": 0.54, - "learning_rate": 0.0002192774210287345, - "loss": 0.0167, + "epoch": 0.25, + "learning_rate": 0.0002623280241762566, + "loss": 0.0211, "step": 49780 }, { - "epoch": 0.54, - "learning_rate": 0.0002192612051631316, - "loss": 0.0189, + "epoch": 0.25, + "learning_rate": 0.00026232045648324256, + "loss": 0.0243, "step": 49790 }, { - "epoch": 0.54, - "learning_rate": 0.00021924498929752867, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.00026231288879022854, + "loss": 0.0228, "step": 49800 }, { - "epoch": 0.54, - "learning_rate": 0.00021922877343192579, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.0002623053210972146, + "loss": 0.0223, "step": 49810 }, { - "epoch": 0.54, - "learning_rate": 0.00021921255756632288, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.00026229775340420056, + "loss": 0.0203, "step": 49820 }, { - "epoch": 0.54, - "learning_rate": 0.00021919634170071997, - "loss": 0.0226, + "epoch": 0.25, + "learning_rate": 0.00026229018571118654, + "loss": 0.0194, "step": 49830 }, { - "epoch": 0.54, - "learning_rate": 0.00021918012583511704, - "loss": 0.0217, + "epoch": 0.25, + "learning_rate": 0.0002622826180181725, + "loss": 0.0225, "step": 49840 }, { - "epoch": 0.54, - "learning_rate": 0.00021916390996951416, - "loss": 0.0209, + "epoch": 0.25, + "learning_rate": 0.0002622750503251585, + "loss": 0.0241, "step": 49850 }, { - "epoch": 0.54, - "learning_rate": 0.00021914769410391125, - "loss": 0.0174, + "epoch": 0.25, + "learning_rate": 0.0002622674826321445, + "loss": 0.0213, "step": 49860 }, { - "epoch": 0.54, - "learning_rate": 0.00021913147823830834, - "loss": 0.016, + "epoch": 0.25, + "learning_rate": 0.00026225991493913046, + "loss": 0.0197, "step": 49870 }, { - "epoch": 0.54, - "learning_rate": 0.00021911526237270544, - "loss": 0.0164, + "epoch": 0.25, + "learning_rate": 0.0002622523472461165, + "loss": 0.0223, "step": 49880 }, { - "epoch": 0.54, - "learning_rate": 0.00021909904650710253, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.0002622447795531025, + "loss": 0.0208, "step": 49890 }, { - "epoch": 0.54, - "learning_rate": 0.00021908283064149962, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.00026223721186008846, + "loss": 0.0244, "step": 49900 }, { - "epoch": 0.54, - "learning_rate": 0.00021906661477589674, - "loss": 0.0174, + "epoch": 0.25, + "learning_rate": 0.00026222964416707444, + "loss": 0.0235, "step": 49910 }, { - "epoch": 0.54, - "learning_rate": 0.0002190503989102938, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.0002622220764740604, + "loss": 0.0244, "step": 49920 }, { - "epoch": 0.54, - "learning_rate": 0.0002190341830446909, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.0002622145087810464, + "loss": 0.0262, "step": 49930 }, { - "epoch": 0.54, - "learning_rate": 0.000219017967179088, - "loss": 0.0185, + "epoch": 0.25, + "learning_rate": 0.00026220694108803244, + "loss": 0.0229, "step": 49940 }, { - "epoch": 0.54, - "learning_rate": 0.0002190017513134851, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.0002621993733950184, + "loss": 0.0204, "step": 49950 }, { - "epoch": 0.54, - "learning_rate": 0.00021898553544788218, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.0002621918057020044, + "loss": 0.0185, "step": 49960 }, { - "epoch": 0.54, - "learning_rate": 0.00021896931958227927, - "loss": 0.0163, + "epoch": 0.25, + "learning_rate": 0.0002621842380089904, + "loss": 0.0206, "step": 49970 }, { - "epoch": 0.54, - "learning_rate": 0.0002189531037166764, - "loss": 0.0167, + "epoch": 0.25, + "learning_rate": 0.00026217667031597637, + "loss": 0.0246, "step": 49980 }, { - "epoch": 0.54, - "learning_rate": 0.00021893688785107348, - "loss": 0.0218, + "epoch": 0.25, + "learning_rate": 0.00026216910262296235, + "loss": 0.0191, "step": 49990 }, { - "epoch": 0.54, - "learning_rate": 0.00021892067198547055, - "loss": 0.0191, + "epoch": 0.25, + "learning_rate": 0.00026216153492994833, + "loss": 0.0225, "step": 50000 }, { - "epoch": 0.54, - "eval_cer": 0.9215842623041952, - "eval_loss": 0.012915155850350857, - "eval_runtime": 121.4472, - "eval_samples_per_second": 16.468, - "eval_steps_per_second": 4.117, + "epoch": 0.25, + "eval_cer": 0.9144683151109114, + "eval_loss": 0.015245326794683933, + "eval_runtime": 117.0207, + "eval_samples_per_second": 17.091, + "eval_steps_per_second": 4.273, "step": 50000 }, { - "epoch": 0.54, - "learning_rate": 0.00021890445611986767, - "loss": 0.0204, + "epoch": 0.25, + "learning_rate": 0.00026215396723693437, + "loss": 0.0215, "step": 50010 }, { - "epoch": 0.54, - "learning_rate": 0.00021888824025426476, - "loss": 0.0174, + "epoch": 0.25, + "learning_rate": 0.00026214639954392035, + "loss": 0.0214, "step": 50020 }, { - "epoch": 0.54, - "learning_rate": 0.00021887202438866185, - "loss": 0.0203, + "epoch": 0.25, + "learning_rate": 0.00026213883185090633, + "loss": 0.0212, "step": 50030 }, { - "epoch": 0.54, - "learning_rate": 0.00021885580852305892, - "loss": 0.0191, + "epoch": 0.25, + "learning_rate": 0.0002621312641578923, + "loss": 0.0178, "step": 50040 }, { - "epoch": 0.54, - "learning_rate": 0.00021883959265745604, - "loss": 0.0184, + "epoch": 0.25, + "learning_rate": 0.0002621236964648783, + "loss": 0.023, "step": 50050 }, { - "epoch": 0.54, - "learning_rate": 0.00021882337679185313, - "loss": 0.016, + "epoch": 0.25, + "learning_rate": 0.0002621161287718643, + "loss": 0.0211, "step": 50060 }, { - "epoch": 0.54, - "learning_rate": 0.00021880716092625022, - "loss": 0.0182, + "epoch": 0.25, + "learning_rate": 0.0002621085610788503, + "loss": 0.0221, "step": 50070 }, { - "epoch": 0.54, - "learning_rate": 0.00021879094506064732, - "loss": 0.0141, + "epoch": 0.25, + "learning_rate": 0.0002621009933858363, + "loss": 0.0188, "step": 50080 }, { - "epoch": 0.54, - "learning_rate": 0.0002187747291950444, - "loss": 0.0184, + "epoch": 0.25, + "learning_rate": 0.0002620934256928223, + "loss": 0.0233, "step": 50090 }, { - "epoch": 0.54, - "learning_rate": 0.0002187585133294415, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.00026208585799980825, + "loss": 0.0258, "step": 50100 }, { - "epoch": 0.54, - "learning_rate": 0.00021874229746383862, - "loss": 0.0196, + "epoch": 0.25, + "learning_rate": 0.00026207829030679424, + "loss": 0.0252, "step": 50110 }, { - "epoch": 0.54, - "learning_rate": 0.0002187260815982357, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.0002620707226137802, + "loss": 0.0217, "step": 50120 }, { - "epoch": 0.54, - "learning_rate": 0.00021870986573263278, - "loss": 0.0215, + "epoch": 0.25, + "learning_rate": 0.00026206315492076625, + "loss": 0.0236, "step": 50130 }, { - "epoch": 0.54, - "learning_rate": 0.00021869364986702987, - "loss": 0.0177, + "epoch": 0.25, + "learning_rate": 0.00026205558722775223, + "loss": 0.0214, "step": 50140 }, { - "epoch": 0.54, - "learning_rate": 0.000218677434001427, - "loss": 0.0229, + "epoch": 0.25, + "learning_rate": 0.0002620480195347382, + "loss": 0.0196, "step": 50150 }, { - "epoch": 0.54, - "learning_rate": 0.00021866121813582406, - "loss": 0.0169, + "epoch": 0.25, + "learning_rate": 0.0002620404518417242, + "loss": 0.0211, "step": 50160 }, { - "epoch": 0.54, - "learning_rate": 0.00021864500227022115, - "loss": 0.0163, + "epoch": 0.25, + "learning_rate": 0.0002620328841487102, + "loss": 0.0217, "step": 50170 }, { - "epoch": 0.54, - "learning_rate": 0.00021862878640461827, - "loss": 0.0187, + "epoch": 0.25, + "learning_rate": 0.00026202531645569616, + "loss": 0.0216, "step": 50180 }, { - "epoch": 0.54, - "learning_rate": 0.00021861257053901536, - "loss": 0.0169, + "epoch": 0.25, + "learning_rate": 0.00026201774876268214, + "loss": 0.0212, "step": 50190 }, { - "epoch": 0.54, - "learning_rate": 0.00021859635467341243, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.0002620101810696682, + "loss": 0.0194, "step": 50200 }, { - "epoch": 0.54, - "learning_rate": 0.00021858013880780952, - "loss": 0.0177, + "epoch": 0.25, + "learning_rate": 0.00026200261337665416, + "loss": 0.0253, "step": 50210 }, { - "epoch": 0.54, - "learning_rate": 0.00021856392294220664, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.00026199504568364014, + "loss": 0.0251, "step": 50220 }, { - "epoch": 0.54, - "learning_rate": 0.00021854770707660374, - "loss": 0.0144, + "epoch": 0.25, + "learning_rate": 0.0002619874779906261, + "loss": 0.02, "step": 50230 }, { - "epoch": 0.54, - "learning_rate": 0.0002185314912110008, - "loss": 0.0227, + "epoch": 0.25, + "learning_rate": 0.0002619799102976121, + "loss": 0.0204, "step": 50240 }, { - "epoch": 0.54, - "learning_rate": 0.00021851527534539792, - "loss": 0.0183, + "epoch": 0.25, + "learning_rate": 0.0002619723426045981, + "loss": 0.0262, "step": 50250 }, { - "epoch": 0.54, - "learning_rate": 0.00021849905947979501, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.0002619647749115841, + "loss": 0.0199, "step": 50260 }, { - "epoch": 0.54, - "learning_rate": 0.0002184828436141921, - "loss": 0.0199, + "epoch": 0.25, + "learning_rate": 0.0002619572072185701, + "loss": 0.0235, "step": 50270 }, { - "epoch": 0.54, - "learning_rate": 0.00021846662774858917, - "loss": 0.016, + "epoch": 0.25, + "learning_rate": 0.0002619496395255561, + "loss": 0.0206, "step": 50280 }, { - "epoch": 0.54, - "learning_rate": 0.0002184504118829863, - "loss": 0.016, + "epoch": 0.25, + "learning_rate": 0.00026194207183254206, + "loss": 0.0196, "step": 50290 }, { - "epoch": 0.54, - "learning_rate": 0.00021843419601738339, - "loss": 0.0188, + "epoch": 0.25, + "learning_rate": 0.00026193450413952805, + "loss": 0.019, "step": 50300 }, { - "epoch": 0.54, - "learning_rate": 0.0002184179801517805, - "loss": 0.0154, + "epoch": 0.25, + "learning_rate": 0.00026192693644651403, + "loss": 0.0215, "step": 50310 }, { - "epoch": 0.54, - "learning_rate": 0.00021840176428617757, - "loss": 0.0222, + "epoch": 0.25, + "learning_rate": 0.00026191936875350006, + "loss": 0.0218, "step": 50320 }, { - "epoch": 0.54, - "learning_rate": 0.00021838554842057466, - "loss": 0.0194, + "epoch": 0.25, + "learning_rate": 0.00026191180106048604, + "loss": 0.0237, "step": 50330 }, { - "epoch": 0.54, - "learning_rate": 0.00021836933255497176, - "loss": 0.0159, + "epoch": 0.25, + "learning_rate": 0.000261904233367472, + "loss": 0.0252, "step": 50340 }, { - "epoch": 0.54, - "learning_rate": 0.00021835311668936888, - "loss": 0.0183, + "epoch": 0.25, + "learning_rate": 0.000261896665674458, + "loss": 0.0229, "step": 50350 }, { - "epoch": 0.54, - "learning_rate": 0.00021833690082376597, - "loss": 0.0167, + "epoch": 0.25, + "learning_rate": 0.000261889097981444, + "loss": 0.0208, "step": 50360 }, { - "epoch": 0.54, - "learning_rate": 0.00021832068495816303, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.00026188153028842997, + "loss": 0.021, "step": 50370 }, { - "epoch": 0.54, - "learning_rate": 0.00021830446909256015, - "loss": 0.0144, + "epoch": 0.25, + "learning_rate": 0.00026187396259541595, + "loss": 0.0233, "step": 50380 }, { - "epoch": 0.54, - "learning_rate": 0.00021828825322695725, - "loss": 0.0199, + "epoch": 0.25, + "learning_rate": 0.000261866394902402, + "loss": 0.0215, "step": 50390 }, { - "epoch": 0.54, - "learning_rate": 0.00021827203736135434, - "loss": 0.0172, + "epoch": 0.25, + "learning_rate": 0.00026185882720938797, + "loss": 0.0213, "step": 50400 }, { - "epoch": 0.54, - "learning_rate": 0.0002182558214957514, - "loss": 0.0214, + "epoch": 0.25, + "learning_rate": 0.00026185125951637395, + "loss": 0.0197, "step": 50410 }, { - "epoch": 0.55, - "learning_rate": 0.00021823960563014853, - "loss": 0.0189, + "epoch": 0.25, + "learning_rate": 0.00026184369182335993, + "loss": 0.0214, "step": 50420 }, { - "epoch": 0.55, - "learning_rate": 0.00021822338976454562, - "loss": 0.0173, + "epoch": 0.25, + "learning_rate": 0.0002618361241303459, + "loss": 0.0183, "step": 50430 }, { - "epoch": 0.55, - "learning_rate": 0.0002182071738989427, - "loss": 0.0194, + "epoch": 0.25, + "learning_rate": 0.0002618285564373319, + "loss": 0.0213, "step": 50440 }, { - "epoch": 0.55, - "learning_rate": 0.0002181909580333398, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.00026182098874431793, + "loss": 0.0207, "step": 50450 }, { - "epoch": 0.55, - "learning_rate": 0.0002181747421677369, - "loss": 0.0183, + "epoch": 0.25, + "learning_rate": 0.0002618134210513039, + "loss": 0.019, "step": 50460 }, { - "epoch": 0.55, - "learning_rate": 0.000218158526302134, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.0002618058533582899, + "loss": 0.0195, "step": 50470 }, { - "epoch": 0.55, - "learning_rate": 0.0002181423104365311, - "loss": 0.0211, + "epoch": 0.25, + "learning_rate": 0.0002617982856652759, + "loss": 0.0182, "step": 50480 }, { - "epoch": 0.55, - "learning_rate": 0.00021812609457092817, - "loss": 0.0205, + "epoch": 0.25, + "learning_rate": 0.00026179071797226186, + "loss": 0.022, "step": 50490 }, { - "epoch": 0.55, - "learning_rate": 0.00021810987870532527, - "loss": 0.0207, + "epoch": 0.25, + "learning_rate": 0.00026178315027924784, + "loss": 0.0216, "step": 50500 }, { - "epoch": 0.55, - "learning_rate": 0.00021809366283972236, - "loss": 0.0188, + "epoch": 0.25, + "learning_rate": 0.0002617755825862338, + "loss": 0.0211, "step": 50510 }, { - "epoch": 0.55, - "learning_rate": 0.00021807744697411948, - "loss": 0.0188, + "epoch": 0.25, + "learning_rate": 0.00026176801489321985, + "loss": 0.0225, "step": 50520 }, { - "epoch": 0.55, - "learning_rate": 0.00021806123110851655, - "loss": 0.0175, + "epoch": 0.25, + "learning_rate": 0.00026176044720020584, + "loss": 0.0247, "step": 50530 }, { - "epoch": 0.55, - "learning_rate": 0.00021804501524291364, - "loss": 0.0212, + "epoch": 0.25, + "learning_rate": 0.0002617528795071918, + "loss": 0.0167, "step": 50540 }, { - "epoch": 0.55, - "learning_rate": 0.00021802879937731076, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.0002617453118141778, + "loss": 0.0208, "step": 50550 }, { - "epoch": 0.55, - "learning_rate": 0.00021801258351170785, - "loss": 0.021, + "epoch": 0.26, + "learning_rate": 0.0002617377441211638, + "loss": 0.0187, "step": 50560 }, { - "epoch": 0.55, - "learning_rate": 0.00021799636764610492, - "loss": 0.0177, + "epoch": 0.26, + "learning_rate": 0.00026173017642814976, + "loss": 0.0207, "step": 50570 }, { - "epoch": 0.55, - "learning_rate": 0.000217980151780502, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.0002617226087351358, + "loss": 0.0205, "step": 50580 }, { - "epoch": 0.55, - "learning_rate": 0.00021796393591489913, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.0002617150410421218, + "loss": 0.0193, "step": 50590 }, { - "epoch": 0.55, - "learning_rate": 0.00021794772004929622, - "loss": 0.0197, + "epoch": 0.26, + "learning_rate": 0.00026170747334910776, + "loss": 0.0202, "step": 50600 }, { - "epoch": 0.55, - "learning_rate": 0.0002179315041836933, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.00026169990565609374, + "loss": 0.0174, "step": 50610 }, { - "epoch": 0.55, - "learning_rate": 0.0002179152883180904, - "loss": 0.0175, + "epoch": 0.26, + "learning_rate": 0.0002616923379630797, + "loss": 0.0223, "step": 50620 }, { - "epoch": 0.55, - "learning_rate": 0.0002178990724524875, - "loss": 0.0186, + "epoch": 0.26, + "learning_rate": 0.0002616847702700657, + "loss": 0.0233, "step": 50630 }, { - "epoch": 0.55, - "learning_rate": 0.0002178828565868846, - "loss": 0.0174, + "epoch": 0.26, + "learning_rate": 0.00026167720257705174, + "loss": 0.0248, "step": 50640 }, { - "epoch": 0.55, - "learning_rate": 0.00021786664072128166, - "loss": 0.0211, + "epoch": 0.26, + "learning_rate": 0.0002616696348840377, + "loss": 0.0214, "step": 50650 }, { - "epoch": 0.55, - "learning_rate": 0.00021785042485567878, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.0002616620671910237, + "loss": 0.0205, "step": 50660 }, { - "epoch": 0.55, - "learning_rate": 0.00021783420899007587, - "loss": 0.0202, + "epoch": 0.26, + "learning_rate": 0.0002616544994980097, + "loss": 0.0223, "step": 50670 }, { - "epoch": 0.55, - "learning_rate": 0.000217817993124473, - "loss": 0.0184, + "epoch": 0.26, + "learning_rate": 0.00026164693180499567, + "loss": 0.0222, "step": 50680 }, { - "epoch": 0.55, - "learning_rate": 0.00021780177725887006, - "loss": 0.0174, + "epoch": 0.26, + "learning_rate": 0.00026163936411198165, + "loss": 0.024, "step": 50690 }, { - "epoch": 0.55, - "learning_rate": 0.00021778556139326715, - "loss": 0.0181, + "epoch": 0.26, + "learning_rate": 0.00026163179641896763, + "loss": 0.0229, "step": 50700 }, { - "epoch": 0.55, - "learning_rate": 0.00021776934552766424, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.00026162422872595366, + "loss": 0.022, "step": 50710 }, { - "epoch": 0.55, - "learning_rate": 0.00021775312966206136, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.00026161666103293965, + "loss": 0.021, "step": 50720 }, { - "epoch": 0.55, - "learning_rate": 0.00021773691379645843, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.00026160909333992563, + "loss": 0.0199, "step": 50730 }, { - "epoch": 0.55, - "learning_rate": 0.00021772069793085552, - "loss": 0.0215, + "epoch": 0.26, + "learning_rate": 0.0002616015256469116, + "loss": 0.0206, "step": 50740 }, { - "epoch": 0.55, - "learning_rate": 0.00021770448206525264, - "loss": 0.0183, + "epoch": 0.26, + "learning_rate": 0.0002615939579538976, + "loss": 0.022, "step": 50750 }, { - "epoch": 0.55, - "learning_rate": 0.00021768826619964973, - "loss": 0.0198, + "epoch": 0.26, + "learning_rate": 0.00026158639026088357, + "loss": 0.0206, "step": 50760 }, { - "epoch": 0.55, - "learning_rate": 0.0002176720503340468, - "loss": 0.0157, + "epoch": 0.26, + "learning_rate": 0.0002615788225678696, + "loss": 0.0215, "step": 50770 }, { - "epoch": 0.55, - "learning_rate": 0.0002176558344684439, - "loss": 0.0192, + "epoch": 0.26, + "learning_rate": 0.0002615712548748556, + "loss": 0.0254, "step": 50780 }, { - "epoch": 0.55, - "learning_rate": 0.000217639618602841, - "loss": 0.0194, + "epoch": 0.26, + "learning_rate": 0.00026156368718184157, + "loss": 0.021, "step": 50790 }, { - "epoch": 0.55, - "learning_rate": 0.0002176234027372381, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.00026155611948882755, + "loss": 0.0202, "step": 50800 }, { - "epoch": 0.55, - "learning_rate": 0.00021760718687163517, - "loss": 0.0196, + "epoch": 0.26, + "learning_rate": 0.00026154855179581353, + "loss": 0.0216, "step": 50810 }, { - "epoch": 0.55, - "learning_rate": 0.0002175909710060323, - "loss": 0.0191, + "epoch": 0.26, + "learning_rate": 0.0002615409841027995, + "loss": 0.0244, "step": 50820 }, { - "epoch": 0.55, - "learning_rate": 0.00021757475514042938, - "loss": 0.0192, + "epoch": 0.26, + "learning_rate": 0.00026153341640978555, + "loss": 0.0193, "step": 50830 }, { - "epoch": 0.55, - "learning_rate": 0.00021755853927482647, - "loss": 0.0203, + "epoch": 0.26, + "learning_rate": 0.00026152584871677153, + "loss": 0.0197, "step": 50840 }, { - "epoch": 0.55, - "learning_rate": 0.00021754232340922354, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.0002615182810237575, + "loss": 0.0207, "step": 50850 }, { - "epoch": 0.55, - "learning_rate": 0.00021752610754362066, - "loss": 0.0187, + "epoch": 0.26, + "learning_rate": 0.0002615107133307435, + "loss": 0.021, "step": 50860 }, { - "epoch": 0.55, - "learning_rate": 0.00021750989167801775, - "loss": 0.0172, + "epoch": 0.26, + "learning_rate": 0.0002615031456377295, + "loss": 0.023, "step": 50870 }, { - "epoch": 0.55, - "learning_rate": 0.00021749367581241485, - "loss": 0.0181, + "epoch": 0.26, + "learning_rate": 0.00026149557794471546, + "loss": 0.0209, "step": 50880 }, { - "epoch": 0.55, - "learning_rate": 0.00021747745994681194, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.00026148801025170144, + "loss": 0.022, "step": 50890 }, { - "epoch": 0.55, - "learning_rate": 0.00021746124408120903, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.0002614804425586875, + "loss": 0.0198, "step": 50900 }, { - "epoch": 0.55, - "learning_rate": 0.00021744502821560612, - "loss": 0.019, + "epoch": 0.26, + "learning_rate": 0.0002614728748656734, + "loss": 0.0215, "step": 50910 }, { - "epoch": 0.55, - "learning_rate": 0.00021742881235000324, - "loss": 0.0197, + "epoch": 0.26, + "learning_rate": 0.0002614653071726594, + "loss": 0.023, "step": 50920 }, { - "epoch": 0.55, - "learning_rate": 0.0002174125964844003, - "loss": 0.015, + "epoch": 0.26, + "learning_rate": 0.00026145773947964536, + "loss": 0.0217, "step": 50930 }, { - "epoch": 0.55, - "learning_rate": 0.0002173963806187974, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.0002614501717866314, + "loss": 0.0229, "step": 50940 }, { - "epoch": 0.55, - "learning_rate": 0.0002173801647531945, - "loss": 0.0161, + "epoch": 0.26, + "learning_rate": 0.0002614426040936174, + "loss": 0.0212, "step": 50950 }, { - "epoch": 0.55, - "learning_rate": 0.00021736394888759161, - "loss": 0.0182, + "epoch": 0.26, + "learning_rate": 0.00026143503640060336, + "loss": 0.018, "step": 50960 }, { - "epoch": 0.55, - "learning_rate": 0.00021734773302198868, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.00026142746870758934, + "loss": 0.0183, "step": 50970 }, { - "epoch": 0.55, - "learning_rate": 0.00021733151715638577, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.0002614199010145753, + "loss": 0.018, "step": 50980 }, { - "epoch": 0.55, - "learning_rate": 0.0002173153012907829, - "loss": 0.0201, + "epoch": 0.26, + "learning_rate": 0.0002614123333215613, + "loss": 0.0205, "step": 50990 }, { - "epoch": 0.55, - "learning_rate": 0.00021729908542517999, - "loss": 0.017, + "epoch": 0.26, + "learning_rate": 0.00026140476562854734, + "loss": 0.022, "step": 51000 }, { - "epoch": 0.55, - "eval_cer": 0.921579050686457, - "eval_loss": 0.012746312655508518, - "eval_runtime": 121.6627, - "eval_samples_per_second": 16.439, - "eval_steps_per_second": 4.11, + "epoch": 0.26, + "eval_cer": 0.9144770486760401, + "eval_loss": 0.01605140045285225, + "eval_runtime": 117.035, + "eval_samples_per_second": 17.089, + "eval_steps_per_second": 4.272, "step": 51000 }, { - "epoch": 0.55, - "learning_rate": 0.00021728286955957705, - "loss": 0.0226, + "epoch": 0.26, + "learning_rate": 0.0002613971979355333, + "loss": 0.019, "step": 51010 }, { - "epoch": 0.55, - "learning_rate": 0.00021726665369397417, - "loss": 0.0193, + "epoch": 0.26, + "learning_rate": 0.0002613896302425193, + "loss": 0.0237, "step": 51020 }, { - "epoch": 0.55, - "learning_rate": 0.00021725043782837126, - "loss": 0.0194, + "epoch": 0.26, + "learning_rate": 0.0002613820625495053, + "loss": 0.0232, "step": 51030 }, { - "epoch": 0.55, - "learning_rate": 0.00021723422196276836, - "loss": 0.0167, + "epoch": 0.26, + "learning_rate": 0.00026137449485649127, + "loss": 0.0221, "step": 51040 }, { - "epoch": 0.55, - "learning_rate": 0.00021721800609716542, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.00026136692716347725, + "loss": 0.017, "step": 51050 }, { - "epoch": 0.55, - "learning_rate": 0.00021720179023156254, - "loss": 0.0173, + "epoch": 0.26, + "learning_rate": 0.00026135935947046323, + "loss": 0.0204, "step": 51060 }, { - "epoch": 0.55, - "learning_rate": 0.00021718557436595963, - "loss": 0.0186, + "epoch": 0.26, + "learning_rate": 0.00026135179177744927, + "loss": 0.02, "step": 51070 }, { - "epoch": 0.55, - "learning_rate": 0.00021716935850035673, - "loss": 0.0221, + "epoch": 0.26, + "learning_rate": 0.00026134422408443525, + "loss": 0.0178, "step": 51080 }, { - "epoch": 0.55, - "learning_rate": 0.00021715314263475385, - "loss": 0.0229, + "epoch": 0.26, + "learning_rate": 0.00026133665639142123, + "loss": 0.0212, "step": 51090 }, { - "epoch": 0.55, - "learning_rate": 0.0002171369267691509, - "loss": 0.0208, + "epoch": 0.26, + "learning_rate": 0.0002613290886984072, + "loss": 0.0243, "step": 51100 }, { - "epoch": 0.55, - "learning_rate": 0.000217120710903548, - "loss": 0.017, + "epoch": 0.26, + "learning_rate": 0.0002613215210053932, + "loss": 0.0243, "step": 51110 }, { - "epoch": 0.55, - "learning_rate": 0.00021710449503794513, - "loss": 0.0177, + "epoch": 0.26, + "learning_rate": 0.0002613139533123792, + "loss": 0.0238, "step": 51120 }, { - "epoch": 0.55, - "learning_rate": 0.00021708827917234222, - "loss": 0.0165, + "epoch": 0.26, + "learning_rate": 0.0002613063856193652, + "loss": 0.0265, "step": 51130 }, { - "epoch": 0.55, - "learning_rate": 0.00021707206330673928, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.0002612988179263512, + "loss": 0.0194, "step": 51140 }, { - "epoch": 0.55, - "learning_rate": 0.00021705584744113638, - "loss": 0.0208, + "epoch": 0.26, + "learning_rate": 0.0002612912502333372, + "loss": 0.0224, "step": 51150 }, { - "epoch": 0.55, - "learning_rate": 0.0002170396315755335, - "loss": 0.0175, + "epoch": 0.26, + "learning_rate": 0.00026128368254032315, + "loss": 0.0209, "step": 51160 }, { - "epoch": 0.55, - "learning_rate": 0.0002170234157099306, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.00026127611484730914, + "loss": 0.0192, "step": 51170 }, { - "epoch": 0.55, - "learning_rate": 0.00021700719984432765, - "loss": 0.018, + "epoch": 0.26, + "learning_rate": 0.0002612685471542951, + "loss": 0.0194, "step": 51180 }, { - "epoch": 0.55, - "learning_rate": 0.00021699098397872477, - "loss": 0.0177, + "epoch": 0.26, + "learning_rate": 0.00026126097946128115, + "loss": 0.023, "step": 51190 }, { - "epoch": 0.55, - "learning_rate": 0.00021697476811312187, - "loss": 0.022, + "epoch": 0.26, + "learning_rate": 0.00026125341176826713, + "loss": 0.0234, "step": 51200 }, { - "epoch": 0.55, - "learning_rate": 0.00021695855224751896, - "loss": 0.0152, + "epoch": 0.26, + "learning_rate": 0.0002612458440752531, + "loss": 0.0201, "step": 51210 }, { - "epoch": 0.55, - "learning_rate": 0.00021694233638191603, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.0002612382763822391, + "loss": 0.0248, "step": 51220 }, { - "epoch": 0.55, - "learning_rate": 0.00021692612051631315, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.0002612307086892251, + "loss": 0.0214, "step": 51230 }, { - "epoch": 0.55, - "learning_rate": 0.00021690990465071024, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.00026122314099621106, + "loss": 0.0203, "step": 51240 }, { - "epoch": 0.55, - "learning_rate": 0.00021689368878510733, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.00026121557330319704, + "loss": 0.0187, "step": 51250 }, { - "epoch": 0.55, - "learning_rate": 0.00021687747291950442, - "loss": 0.0183, + "epoch": 0.26, + "learning_rate": 0.0002612080056101831, + "loss": 0.0227, "step": 51260 }, { - "epoch": 0.55, - "learning_rate": 0.00021686125705390152, - "loss": 0.02, + "epoch": 0.26, + "learning_rate": 0.00026120043791716906, + "loss": 0.0194, "step": 51270 }, { - "epoch": 0.55, - "learning_rate": 0.0002168450411882986, - "loss": 0.0192, + "epoch": 0.26, + "learning_rate": 0.00026119287022415504, + "loss": 0.0226, "step": 51280 }, { - "epoch": 0.55, - "learning_rate": 0.00021682882532269573, - "loss": 0.0202, + "epoch": 0.26, + "learning_rate": 0.000261185302531141, + "loss": 0.0201, "step": 51290 }, { - "epoch": 0.55, - "learning_rate": 0.0002168126094570928, - "loss": 0.015, + "epoch": 0.26, + "learning_rate": 0.000261177734838127, + "loss": 0.0182, "step": 51300 }, { - "epoch": 0.55, - "learning_rate": 0.0002167963935914899, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.000261170167145113, + "loss": 0.0282, "step": 51310 }, { - "epoch": 0.55, - "learning_rate": 0.000216780177725887, - "loss": 0.0178, + "epoch": 0.26, + "learning_rate": 0.000261162599452099, + "loss": 0.0208, "step": 51320 }, { - "epoch": 0.55, - "learning_rate": 0.0002167639618602841, - "loss": 0.0185, + "epoch": 0.26, + "learning_rate": 0.000261155031759085, + "loss": 0.0216, "step": 51330 }, { - "epoch": 0.56, - "learning_rate": 0.00021674774599468117, - "loss": 0.0198, + "epoch": 0.26, + "learning_rate": 0.000261147464066071, + "loss": 0.0241, "step": 51340 }, { - "epoch": 0.56, - "learning_rate": 0.00021673153012907826, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.00026113989637305696, + "loss": 0.0197, "step": 51350 }, { - "epoch": 0.56, - "learning_rate": 0.00021671531426347538, - "loss": 0.0182, + "epoch": 0.26, + "learning_rate": 0.00026113232868004295, + "loss": 0.0178, "step": 51360 }, { - "epoch": 0.56, - "learning_rate": 0.00021669909839787247, - "loss": 0.0169, + "epoch": 0.26, + "learning_rate": 0.00026112476098702893, + "loss": 0.0197, "step": 51370 }, { - "epoch": 0.56, - "learning_rate": 0.00021668288253226954, - "loss": 0.0173, + "epoch": 0.26, + "learning_rate": 0.00026111719329401496, + "loss": 0.0244, "step": 51380 }, { - "epoch": 0.56, - "learning_rate": 0.00021666666666666666, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.00026110962560100094, + "loss": 0.0223, "step": 51390 }, { - "epoch": 0.56, - "learning_rate": 0.00021665045080106375, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.0002611020579079869, + "loss": 0.0218, "step": 51400 }, { - "epoch": 0.56, - "learning_rate": 0.00021663423493546084, - "loss": 0.0177, + "epoch": 0.26, + "learning_rate": 0.0002610944902149729, + "loss": 0.0206, "step": 51410 }, { - "epoch": 0.56, - "learning_rate": 0.0002166180190698579, - "loss": 0.0219, + "epoch": 0.26, + "learning_rate": 0.0002610869225219589, + "loss": 0.0204, "step": 51420 }, { - "epoch": 0.56, - "learning_rate": 0.00021660180320425503, - "loss": 0.0199, + "epoch": 0.26, + "learning_rate": 0.00026107935482894487, + "loss": 0.0269, "step": 51430 }, { - "epoch": 0.56, - "learning_rate": 0.00021658558733865212, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.00026107178713593085, + "loss": 0.0278, "step": 51440 }, { - "epoch": 0.56, - "learning_rate": 0.0002165693714730492, - "loss": 0.0192, + "epoch": 0.26, + "learning_rate": 0.0002610642194429169, + "loss": 0.0228, "step": 51450 }, { - "epoch": 0.56, - "learning_rate": 0.0002165531556074463, - "loss": 0.0174, + "epoch": 0.26, + "learning_rate": 0.00026105665174990287, + "loss": 0.0213, "step": 51460 }, { - "epoch": 0.56, - "learning_rate": 0.0002165369397418434, - "loss": 0.0175, + "epoch": 0.26, + "learning_rate": 0.00026104908405688885, + "loss": 0.0199, "step": 51470 }, { - "epoch": 0.56, - "learning_rate": 0.0002165207238762405, - "loss": 0.0185, + "epoch": 0.26, + "learning_rate": 0.00026104151636387483, + "loss": 0.0218, "step": 51480 }, { - "epoch": 0.56, - "learning_rate": 0.0002165045080106376, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.0002610339486708608, + "loss": 0.0202, "step": 51490 }, { - "epoch": 0.56, - "learning_rate": 0.00021648829214503468, - "loss": 0.0194, + "epoch": 0.26, + "learning_rate": 0.0002610263809778468, + "loss": 0.0209, "step": 51500 }, { - "epoch": 0.56, - "learning_rate": 0.00021647207627943177, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.00026101881328483283, + "loss": 0.0213, "step": 51510 }, { - "epoch": 0.56, - "learning_rate": 0.00021645586041382886, - "loss": 0.015, + "epoch": 0.26, + "learning_rate": 0.0002610112455918188, + "loss": 0.0222, "step": 51520 }, { - "epoch": 0.56, - "learning_rate": 0.00021643964454822598, - "loss": 0.0157, + "epoch": 0.26, + "learning_rate": 0.0002610036778988048, + "loss": 0.0191, "step": 51530 }, { - "epoch": 0.56, - "learning_rate": 0.00021642342868262305, - "loss": 0.0185, + "epoch": 0.26, + "learning_rate": 0.0002609961102057908, + "loss": 0.0196, "step": 51540 }, { - "epoch": 0.56, - "learning_rate": 0.00021640721281702014, - "loss": 0.0169, + "epoch": 0.26, + "learning_rate": 0.00026098854251277676, + "loss": 0.0214, "step": 51550 }, { - "epoch": 0.56, - "learning_rate": 0.00021639099695141726, - "loss": 0.0211, + "epoch": 0.26, + "learning_rate": 0.00026098097481976274, + "loss": 0.016, "step": 51560 }, { - "epoch": 0.56, - "learning_rate": 0.00021637478108581435, - "loss": 0.019, + "epoch": 0.26, + "learning_rate": 0.0002609734071267487, + "loss": 0.0207, "step": 51570 }, { - "epoch": 0.56, - "learning_rate": 0.00021635856522021142, - "loss": 0.0183, + "epoch": 0.26, + "learning_rate": 0.00026096583943373475, + "loss": 0.0242, "step": 51580 }, { - "epoch": 0.56, - "learning_rate": 0.0002163423493546085, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.00026095827174072074, + "loss": 0.018, "step": 51590 }, { - "epoch": 0.56, - "learning_rate": 0.00021632613348900563, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.0002609507040477067, + "loss": 0.0201, "step": 51600 }, { - "epoch": 0.56, - "learning_rate": 0.00021630991762340272, - "loss": 0.0195, + "epoch": 0.26, + "learning_rate": 0.0002609431363546927, + "loss": 0.0232, "step": 51610 }, { - "epoch": 0.56, - "learning_rate": 0.0002162937017577998, - "loss": 0.0184, + "epoch": 0.26, + "learning_rate": 0.0002609355686616787, + "loss": 0.0234, "step": 51620 }, { - "epoch": 0.56, - "learning_rate": 0.0002162774858921969, - "loss": 0.021, + "epoch": 0.26, + "learning_rate": 0.00026092800096866466, + "loss": 0.0198, "step": 51630 }, { - "epoch": 0.56, - "learning_rate": 0.000216261270026594, - "loss": 0.0163, + "epoch": 0.26, + "learning_rate": 0.0002609204332756507, + "loss": 0.0238, "step": 51640 }, { - "epoch": 0.56, - "learning_rate": 0.0002162450541609911, - "loss": 0.022, + "epoch": 0.26, + "learning_rate": 0.0002609128655826367, + "loss": 0.0186, "step": 51650 }, { - "epoch": 0.56, - "learning_rate": 0.00021622883829538816, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.00026090529788962266, + "loss": 0.019, "step": 51660 }, { - "epoch": 0.56, - "learning_rate": 0.00021621262242978528, - "loss": 0.0198, + "epoch": 0.26, + "learning_rate": 0.00026089773019660864, + "loss": 0.0186, "step": 51670 }, { - "epoch": 0.56, - "learning_rate": 0.00021619640656418237, - "loss": 0.0169, + "epoch": 0.26, + "learning_rate": 0.0002608901625035946, + "loss": 0.0225, "step": 51680 }, { - "epoch": 0.56, - "learning_rate": 0.0002161801906985795, - "loss": 0.0197, + "epoch": 0.26, + "learning_rate": 0.0002608825948105806, + "loss": 0.0175, "step": 51690 }, { - "epoch": 0.56, - "learning_rate": 0.00021616397483297656, - "loss": 0.0156, + "epoch": 0.26, + "learning_rate": 0.00026087502711756664, + "loss": 0.0212, "step": 51700 }, { - "epoch": 0.56, - "learning_rate": 0.00021614775896737365, - "loss": 0.0193, + "epoch": 0.26, + "learning_rate": 0.0002608674594245526, + "loss": 0.0241, "step": 51710 }, { - "epoch": 0.56, - "learning_rate": 0.00021613154310177074, - "loss": 0.015, + "epoch": 0.26, + "learning_rate": 0.0002608598917315386, + "loss": 0.0191, "step": 51720 }, { - "epoch": 0.56, - "learning_rate": 0.00021611532723616786, - "loss": 0.0154, + "epoch": 0.26, + "learning_rate": 0.0002608523240385246, + "loss": 0.0188, "step": 51730 }, { - "epoch": 0.56, - "learning_rate": 0.00021609911137056493, - "loss": 0.0174, + "epoch": 0.26, + "learning_rate": 0.00026084475634551057, + "loss": 0.0208, "step": 51740 }, { - "epoch": 0.56, - "learning_rate": 0.00021608289550496202, - "loss": 0.0193, + "epoch": 0.26, + "learning_rate": 0.00026083718865249655, + "loss": 0.0202, "step": 51750 }, { - "epoch": 0.56, - "learning_rate": 0.00021606667963935914, - "loss": 0.0192, + "epoch": 0.26, + "learning_rate": 0.00026082962095948253, + "loss": 0.0199, "step": 51760 }, { - "epoch": 0.56, - "learning_rate": 0.00021605046377375624, - "loss": 0.0211, + "epoch": 0.26, + "learning_rate": 0.00026082205326646856, + "loss": 0.0393, "step": 51770 }, { - "epoch": 0.56, - "learning_rate": 0.0002160342479081533, - "loss": 0.0146, + "epoch": 0.26, + "learning_rate": 0.00026081448557345455, + "loss": 0.0419, "step": 51780 }, { - "epoch": 0.56, - "learning_rate": 0.0002160180320425504, - "loss": 0.0188, + "epoch": 0.26, + "learning_rate": 0.00026080691788044053, + "loss": 0.0159, "step": 51790 }, { - "epoch": 0.56, - "learning_rate": 0.0002160018161769475, - "loss": 0.0145, + "epoch": 0.26, + "learning_rate": 0.0002607993501874265, + "loss": 0.0194, "step": 51800 }, { - "epoch": 0.56, - "learning_rate": 0.0002159856003113446, - "loss": 0.0165, + "epoch": 0.26, + "learning_rate": 0.0002607917824944125, + "loss": 0.0199, "step": 51810 }, { - "epoch": 0.56, - "learning_rate": 0.0002159693844457417, - "loss": 0.0174, + "epoch": 0.26, + "learning_rate": 0.00026078421480139847, + "loss": 0.0203, "step": 51820 }, { - "epoch": 0.56, - "learning_rate": 0.0002159531685801388, - "loss": 0.0205, + "epoch": 0.26, + "learning_rate": 0.0002607766471083845, + "loss": 0.0208, "step": 51830 }, { - "epoch": 0.56, - "learning_rate": 0.00021593695271453588, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.0002607690794153705, + "loss": 0.0246, "step": 51840 }, { - "epoch": 0.56, - "learning_rate": 0.00021592073684893298, - "loss": 0.0198, + "epoch": 0.26, + "learning_rate": 0.00026076151172235647, + "loss": 0.0209, "step": 51850 }, { - "epoch": 0.56, - "learning_rate": 0.0002159045209833301, - "loss": 0.0198, + "epoch": 0.26, + "learning_rate": 0.00026075394402934245, + "loss": 0.0238, "step": 51860 }, { - "epoch": 0.56, - "learning_rate": 0.00021588830511772716, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.00026074637633632843, + "loss": 0.0219, "step": 51870 }, { - "epoch": 0.56, - "learning_rate": 0.00021587208925212426, - "loss": 0.0207, + "epoch": 0.26, + "learning_rate": 0.0002607388086433144, + "loss": 0.0247, "step": 51880 }, { - "epoch": 0.56, - "learning_rate": 0.00021585587338652135, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.00026073124095030045, + "loss": 0.0211, "step": 51890 }, { - "epoch": 0.56, - "learning_rate": 0.00021583965752091847, - "loss": 0.0183, + "epoch": 0.26, + "learning_rate": 0.00026072367325728643, + "loss": 0.0167, "step": 51900 }, { - "epoch": 0.56, - "learning_rate": 0.00021582344165531553, - "loss": 0.0172, + "epoch": 0.26, + "learning_rate": 0.0002607161055642724, + "loss": 0.0237, "step": 51910 }, { - "epoch": 0.56, - "learning_rate": 0.00021580722578971263, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.0002607085378712584, + "loss": 0.0207, "step": 51920 }, { - "epoch": 0.56, - "learning_rate": 0.00021579100992410975, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.0002607009701782444, + "loss": 0.0234, "step": 51930 }, { - "epoch": 0.56, - "learning_rate": 0.00021577479405850684, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.00026069340248523036, + "loss": 0.0232, "step": 51940 }, { - "epoch": 0.56, - "learning_rate": 0.0002157585781929039, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.00026068583479221634, + "loss": 0.0213, "step": 51950 }, { - "epoch": 0.56, - "learning_rate": 0.000215742362327301, - "loss": 0.0173, + "epoch": 0.26, + "learning_rate": 0.0002606782670992024, + "loss": 0.0221, "step": 51960 }, { - "epoch": 0.56, - "learning_rate": 0.00021572614646169812, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.00026067069940618836, + "loss": 0.0236, "step": 51970 }, { - "epoch": 0.56, - "learning_rate": 0.0002157099305960952, - "loss": 0.021, + "epoch": 0.26, + "learning_rate": 0.00026066313171317434, + "loss": 0.0219, "step": 51980 }, { - "epoch": 0.56, - "learning_rate": 0.00021569371473049228, - "loss": 0.0174, + "epoch": 0.26, + "learning_rate": 0.0002606555640201603, + "loss": 0.0223, "step": 51990 }, { - "epoch": 0.56, - "learning_rate": 0.0002156774988648894, - "loss": 0.0188, + "epoch": 0.26, + "learning_rate": 0.0002606479963271463, + "loss": 0.0231, "step": 52000 }, { - "epoch": 0.56, - "eval_cer": 0.9215338833327253, - "eval_loss": 0.01269690040498972, - "eval_runtime": 121.7858, - "eval_samples_per_second": 16.422, - "eval_steps_per_second": 4.106, + "epoch": 0.26, + "eval_cer": 0.9145013085791751, + "eval_loss": 0.015823883935809135, + "eval_runtime": 116.6377, + "eval_samples_per_second": 17.147, + "eval_steps_per_second": 4.287, "step": 52000 }, { - "epoch": 0.56, - "learning_rate": 0.0002156612829992865, - "loss": 0.0184, + "epoch": 0.26, + "learning_rate": 0.0002606404286341323, + "loss": 0.0225, "step": 52010 }, { - "epoch": 0.56, - "learning_rate": 0.00021564506713368358, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.0002606328609411183, + "loss": 0.0197, "step": 52020 }, { - "epoch": 0.56, - "learning_rate": 0.00021562885126808067, - "loss": 0.0194, + "epoch": 0.26, + "learning_rate": 0.0002606252932481043, + "loss": 0.0207, "step": 52030 }, { - "epoch": 0.56, - "learning_rate": 0.00021561263540247777, - "loss": 0.0167, + "epoch": 0.26, + "learning_rate": 0.0002606177255550903, + "loss": 0.0181, "step": 52040 }, { - "epoch": 0.56, - "learning_rate": 0.00021559641953687486, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.00026061015786207626, + "loss": 0.0194, "step": 52050 }, { - "epoch": 0.56, - "learning_rate": 0.00021558020367127198, - "loss": 0.0203, + "epoch": 0.26, + "learning_rate": 0.00026060259016906224, + "loss": 0.0248, "step": 52060 }, { - "epoch": 0.56, - "learning_rate": 0.00021556398780566904, - "loss": 0.0203, + "epoch": 0.26, + "learning_rate": 0.0002605950224760482, + "loss": 0.0233, "step": 52070 }, { - "epoch": 0.56, - "learning_rate": 0.00021554777194006614, - "loss": 0.0205, + "epoch": 0.26, + "learning_rate": 0.0002605874547830342, + "loss": 0.0234, "step": 52080 }, { - "epoch": 0.56, - "learning_rate": 0.00021553155607446323, - "loss": 0.0186, + "epoch": 0.26, + "learning_rate": 0.00026057988709002024, + "loss": 0.0198, "step": 52090 }, { - "epoch": 0.56, - "learning_rate": 0.00021551534020886035, - "loss": 0.0261, + "epoch": 0.26, + "learning_rate": 0.0002605723193970062, + "loss": 0.0197, "step": 52100 }, { - "epoch": 0.56, - "learning_rate": 0.00021549912434325742, - "loss": 0.0154, + "epoch": 0.26, + "learning_rate": 0.0002605647517039922, + "loss": 0.0186, "step": 52110 }, { - "epoch": 0.56, - "learning_rate": 0.0002154829084776545, - "loss": 0.0199, + "epoch": 0.26, + "learning_rate": 0.0002605571840109782, + "loss": 0.0216, "step": 52120 }, { - "epoch": 0.56, - "learning_rate": 0.00021546669261205163, - "loss": 0.0178, + "epoch": 0.26, + "learning_rate": 0.00026054961631796417, + "loss": 0.0231, "step": 52130 }, { - "epoch": 0.56, - "learning_rate": 0.00021545047674644872, - "loss": 0.0346, + "epoch": 0.26, + "learning_rate": 0.00026054204862495015, + "loss": 0.0219, "step": 52140 }, { - "epoch": 0.56, - "learning_rate": 0.0002154342608808458, - "loss": 0.0188, + "epoch": 0.26, + "learning_rate": 0.0002605344809319362, + "loss": 0.0209, "step": 52150 }, { - "epoch": 0.56, - "learning_rate": 0.00021541804501524288, - "loss": 0.0178, + "epoch": 0.26, + "learning_rate": 0.00026052691323892217, + "loss": 0.0191, "step": 52160 }, { - "epoch": 0.56, - "learning_rate": 0.00021540182914964, - "loss": 0.017, + "epoch": 0.26, + "learning_rate": 0.0002605193455459081, + "loss": 0.0205, "step": 52170 }, { - "epoch": 0.56, - "learning_rate": 0.0002153856132840371, - "loss": 0.022, + "epoch": 0.26, + "learning_rate": 0.0002605117778528941, + "loss": 0.0268, "step": 52180 }, { - "epoch": 0.56, - "learning_rate": 0.00021536939741843416, - "loss": 0.0169, + "epoch": 0.26, + "learning_rate": 0.0002605042101598801, + "loss": 0.019, "step": 52190 }, { - "epoch": 0.56, - "learning_rate": 0.00021535318155283128, - "loss": 0.0167, + "epoch": 0.26, + "learning_rate": 0.0002604966424668661, + "loss": 0.0191, "step": 52200 }, { - "epoch": 0.56, - "learning_rate": 0.00021533696568722837, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.0002604890747738521, + "loss": 0.0197, "step": 52210 }, { - "epoch": 0.56, - "learning_rate": 0.00021532074982162546, - "loss": 0.0163, + "epoch": 0.26, + "learning_rate": 0.00026048150708083806, + "loss": 0.0232, "step": 52220 }, { - "epoch": 0.56, - "learning_rate": 0.00021530453395602253, - "loss": 0.0206, + "epoch": 0.26, + "learning_rate": 0.00026047393938782404, + "loss": 0.0213, "step": 52230 }, { - "epoch": 0.56, - "learning_rate": 0.00021528831809041965, - "loss": 0.0177, + "epoch": 0.26, + "learning_rate": 0.00026046637169481, + "loss": 0.0238, "step": 52240 }, { - "epoch": 0.56, - "learning_rate": 0.00021527210222481674, - "loss": 0.0202, + "epoch": 0.26, + "learning_rate": 0.00026045880400179605, + "loss": 0.0203, "step": 52250 }, { - "epoch": 0.56, - "learning_rate": 0.00021525588635921383, - "loss": 0.0181, + "epoch": 0.26, + "learning_rate": 0.00026045123630878204, + "loss": 0.0217, "step": 52260 }, { - "epoch": 0.57, - "learning_rate": 0.00021523967049361093, - "loss": 0.0167, + "epoch": 0.26, + "learning_rate": 0.000260443668615768, + "loss": 0.024, "step": 52270 }, { - "epoch": 0.57, - "learning_rate": 0.00021522345462800802, - "loss": 0.0154, + "epoch": 0.26, + "learning_rate": 0.000260436100922754, + "loss": 0.019, "step": 52280 }, { - "epoch": 0.57, - "learning_rate": 0.0002152072387624051, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.00026042853322974, + "loss": 0.0183, "step": 52290 }, { - "epoch": 0.57, - "learning_rate": 0.00021519102289680223, - "loss": 0.0156, + "epoch": 0.26, + "learning_rate": 0.00026042096553672596, + "loss": 0.0207, "step": 52300 }, { - "epoch": 0.57, - "learning_rate": 0.0002151748070311993, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.00026041339784371194, + "loss": 0.0191, "step": 52310 }, { - "epoch": 0.57, - "learning_rate": 0.0002151585911655964, - "loss": 0.0206, + "epoch": 0.26, + "learning_rate": 0.000260405830150698, + "loss": 0.0196, "step": 52320 }, { - "epoch": 0.57, - "learning_rate": 0.0002151423752999935, - "loss": 0.0172, + "epoch": 0.26, + "learning_rate": 0.00026039826245768396, + "loss": 0.0229, "step": 52330 }, { - "epoch": 0.57, - "learning_rate": 0.0002151261594343906, - "loss": 0.0189, + "epoch": 0.26, + "learning_rate": 0.00026039069476466994, + "loss": 0.02, "step": 52340 }, { - "epoch": 0.57, - "learning_rate": 0.00021510994356878767, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.0002603831270716559, + "loss": 0.0205, "step": 52350 }, { - "epoch": 0.57, - "learning_rate": 0.00021509372770318476, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.0002603755593786419, + "loss": 0.0192, "step": 52360 }, { - "epoch": 0.57, - "learning_rate": 0.00021507751183758188, - "loss": 0.0205, + "epoch": 0.26, + "learning_rate": 0.0002603679916856279, + "loss": 0.02, "step": 52370 }, { - "epoch": 0.57, - "learning_rate": 0.00021506129597197897, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.0002603604239926139, + "loss": 0.0292, "step": 52380 }, { - "epoch": 0.57, - "learning_rate": 0.00021504508010637604, - "loss": 0.0423, + "epoch": 0.26, + "learning_rate": 0.0002603528562995999, + "loss": 0.0183, "step": 52390 }, { - "epoch": 0.57, - "learning_rate": 0.00021502886424077316, - "loss": 0.0137, + "epoch": 0.26, + "learning_rate": 0.0002603452886065859, + "loss": 0.0249, "step": 52400 }, { - "epoch": 0.57, - "learning_rate": 0.00021501264837517025, - "loss": 0.0178, + "epoch": 0.26, + "learning_rate": 0.00026033772091357187, + "loss": 0.0192, "step": 52410 }, { - "epoch": 0.57, - "learning_rate": 0.00021499643250956734, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.00026033015322055785, + "loss": 0.0211, "step": 52420 }, { - "epoch": 0.57, - "learning_rate": 0.0002149802166439644, - "loss": 0.0183, + "epoch": 0.26, + "learning_rate": 0.00026032258552754383, + "loss": 0.0222, "step": 52430 }, { - "epoch": 0.57, - "learning_rate": 0.00021496400077836153, - "loss": 0.0189, + "epoch": 0.26, + "learning_rate": 0.00026031501783452986, + "loss": 0.0232, "step": 52440 }, { - "epoch": 0.57, - "learning_rate": 0.00021494778491275862, - "loss": 0.0196, + "epoch": 0.26, + "learning_rate": 0.00026030745014151585, + "loss": 0.0258, "step": 52450 }, { - "epoch": 0.57, - "learning_rate": 0.00021493156904715572, - "loss": 0.0183, + "epoch": 0.26, + "learning_rate": 0.0002602998824485018, + "loss": 0.021, "step": 52460 }, { - "epoch": 0.57, - "learning_rate": 0.0002149153531815528, - "loss": 0.0152, + "epoch": 0.26, + "learning_rate": 0.0002602923147554878, + "loss": 0.0185, "step": 52470 }, { - "epoch": 0.57, - "learning_rate": 0.0002148991373159499, - "loss": 0.0175, + "epoch": 0.26, + "learning_rate": 0.0002602847470624738, + "loss": 0.0182, "step": 52480 }, { - "epoch": 0.57, - "learning_rate": 0.000214882921450347, - "loss": 0.0172, + "epoch": 0.26, + "learning_rate": 0.00026027717936945977, + "loss": 0.0181, "step": 52490 }, { - "epoch": 0.57, - "learning_rate": 0.00021486670558474411, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.00026026961167644575, + "loss": 0.0193, "step": 52500 }, { - "epoch": 0.57, - "learning_rate": 0.0002148504897191412, - "loss": 0.0165, + "epoch": 0.26, + "learning_rate": 0.0002602620439834318, + "loss": 0.0241, "step": 52510 }, { - "epoch": 0.57, - "learning_rate": 0.00021483427385353827, - "loss": 0.0179, + "epoch": 0.26, + "learning_rate": 0.00026025447629041777, + "loss": 0.0183, "step": 52520 }, { - "epoch": 0.57, - "learning_rate": 0.00021481805798793536, - "loss": 0.017, + "epoch": 0.27, + "learning_rate": 0.00026024690859740375, + "loss": 0.0205, "step": 52530 }, { - "epoch": 0.57, - "learning_rate": 0.00021480184212233248, - "loss": 0.017, + "epoch": 0.27, + "learning_rate": 0.00026023934090438973, + "loss": 0.0189, "step": 52540 }, { - "epoch": 0.57, - "learning_rate": 0.00021478562625672958, - "loss": 0.0174, + "epoch": 0.27, + "learning_rate": 0.0002602317732113757, + "loss": 0.0187, "step": 52550 }, { - "epoch": 0.57, - "learning_rate": 0.00021476941039112664, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.0002602242055183617, + "loss": 0.0214, "step": 52560 }, { - "epoch": 0.57, - "learning_rate": 0.00021475319452552376, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.00026021663782534773, + "loss": 0.0204, "step": 52570 }, { - "epoch": 0.57, - "learning_rate": 0.00021473697865992086, - "loss": 0.0181, + "epoch": 0.27, + "learning_rate": 0.0002602090701323337, + "loss": 0.0226, "step": 52580 }, { - "epoch": 0.57, - "learning_rate": 0.00021472076279431795, - "loss": 0.0199, + "epoch": 0.27, + "learning_rate": 0.0002602015024393197, + "loss": 0.0285, "step": 52590 }, { - "epoch": 0.57, - "learning_rate": 0.00021470454692871501, - "loss": 0.014, + "epoch": 0.27, + "learning_rate": 0.0002601939347463057, + "loss": 0.0269, "step": 52600 }, { - "epoch": 0.57, - "learning_rate": 0.00021468833106311213, - "loss": 0.0227, + "epoch": 0.27, + "learning_rate": 0.00026018636705329166, + "loss": 0.0216, "step": 52610 }, { - "epoch": 0.57, - "learning_rate": 0.00021467211519750923, - "loss": 0.0188, + "epoch": 0.27, + "learning_rate": 0.00026017879936027764, + "loss": 0.021, "step": 52620 }, { - "epoch": 0.57, - "learning_rate": 0.00021465589933190635, - "loss": 0.0149, + "epoch": 0.27, + "learning_rate": 0.0002601712316672636, + "loss": 0.0208, "step": 52630 }, { - "epoch": 0.57, - "learning_rate": 0.0002146396834663034, - "loss": 0.0178, + "epoch": 0.27, + "learning_rate": 0.00026016366397424966, + "loss": 0.0242, "step": 52640 }, { - "epoch": 0.57, - "learning_rate": 0.0002146234676007005, - "loss": 0.0188, + "epoch": 0.27, + "learning_rate": 0.00026015609628123564, + "loss": 0.0206, "step": 52650 }, { - "epoch": 0.57, - "learning_rate": 0.0002146072517350976, - "loss": 0.0178, + "epoch": 0.27, + "learning_rate": 0.0002601485285882216, + "loss": 0.0181, "step": 52660 }, { - "epoch": 0.57, - "learning_rate": 0.00021459103586949472, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.0002601409608952076, + "loss": 0.0177, "step": 52670 }, { - "epoch": 0.57, - "learning_rate": 0.00021457482000389178, - "loss": 0.0199, + "epoch": 0.27, + "learning_rate": 0.0002601333932021936, + "loss": 0.0231, "step": 52680 }, { - "epoch": 0.57, - "learning_rate": 0.00021455860413828888, - "loss": 0.0143, + "epoch": 0.27, + "learning_rate": 0.00026012582550917956, + "loss": 0.0209, "step": 52690 }, { - "epoch": 0.57, - "learning_rate": 0.000214542388272686, - "loss": 0.018, + "epoch": 0.27, + "learning_rate": 0.0002601182578161656, + "loss": 0.0232, "step": 52700 }, { - "epoch": 0.57, - "learning_rate": 0.0002145261724070831, - "loss": 0.0189, + "epoch": 0.27, + "learning_rate": 0.0002601106901231516, + "loss": 0.0216, "step": 52710 }, { - "epoch": 0.57, - "learning_rate": 0.00021450995654148015, - "loss": 0.0154, + "epoch": 0.27, + "learning_rate": 0.00026010312243013756, + "loss": 0.0172, "step": 52720 }, { - "epoch": 0.57, - "learning_rate": 0.00021449374067587725, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.00026009555473712354, + "loss": 0.0181, "step": 52730 }, { - "epoch": 0.57, - "learning_rate": 0.00021447752481027437, - "loss": 0.0167, + "epoch": 0.27, + "learning_rate": 0.0002600879870441095, + "loss": 0.0199, "step": 52740 }, { - "epoch": 0.57, - "learning_rate": 0.00021446130894467146, - "loss": 0.0196, + "epoch": 0.27, + "learning_rate": 0.0002600804193510955, + "loss": 0.0209, "step": 52750 }, { - "epoch": 0.57, - "learning_rate": 0.00021444509307906853, - "loss": 0.017, + "epoch": 0.27, + "learning_rate": 0.00026007285165808154, + "loss": 0.0196, "step": 52760 }, { - "epoch": 0.57, - "learning_rate": 0.00021442887721346565, - "loss": 0.019, + "epoch": 0.27, + "learning_rate": 0.0002600652839650675, + "loss": 0.0218, "step": 52770 }, { - "epoch": 0.57, - "learning_rate": 0.00021441266134786274, - "loss": 0.0194, + "epoch": 0.27, + "learning_rate": 0.0002600577162720535, + "loss": 0.0219, "step": 52780 }, { - "epoch": 0.57, - "learning_rate": 0.00021439644548225983, - "loss": 0.0196, + "epoch": 0.27, + "learning_rate": 0.0002600501485790395, + "loss": 0.0209, "step": 52790 }, { - "epoch": 0.57, - "learning_rate": 0.0002143802296166569, - "loss": 0.0162, + "epoch": 0.27, + "learning_rate": 0.00026004258088602547, + "loss": 0.0178, "step": 52800 }, { - "epoch": 0.57, - "learning_rate": 0.00021436401375105402, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.00026003501319301145, + "loss": 0.0203, "step": 52810 }, { - "epoch": 0.57, - "learning_rate": 0.0002143477978854511, - "loss": 0.0162, + "epoch": 0.27, + "learning_rate": 0.00026002744549999743, + "loss": 0.0229, "step": 52820 }, { - "epoch": 0.57, - "learning_rate": 0.0002143315820198482, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.00026001987780698347, + "loss": 0.0202, "step": 52830 }, { - "epoch": 0.57, - "learning_rate": 0.0002143153661542453, - "loss": 0.0183, + "epoch": 0.27, + "learning_rate": 0.00026001231011396945, + "loss": 0.0215, "step": 52840 }, { - "epoch": 0.57, - "learning_rate": 0.0002142991502886424, - "loss": 0.0198, + "epoch": 0.27, + "learning_rate": 0.00026000474242095543, + "loss": 0.019, "step": 52850 }, { - "epoch": 0.57, - "learning_rate": 0.00021428293442303948, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.0002599971747279414, + "loss": 0.0201, "step": 52860 }, { - "epoch": 0.57, - "learning_rate": 0.0002142667185574366, - "loss": 0.0185, + "epoch": 0.27, + "learning_rate": 0.0002599896070349274, + "loss": 0.0209, "step": 52870 }, { - "epoch": 0.57, - "learning_rate": 0.00021425050269183367, - "loss": 0.0188, + "epoch": 0.27, + "learning_rate": 0.00025998203934191337, + "loss": 0.0205, "step": 52880 }, { - "epoch": 0.57, - "learning_rate": 0.00021423428682623076, - "loss": 0.0185, + "epoch": 0.27, + "learning_rate": 0.0002599744716488994, + "loss": 0.023, "step": 52890 }, { - "epoch": 0.57, - "learning_rate": 0.00021421807096062785, - "loss": 0.0185, + "epoch": 0.27, + "learning_rate": 0.0002599669039558854, + "loss": 0.02, "step": 52900 }, { - "epoch": 0.57, - "learning_rate": 0.00021420185509502497, - "loss": 0.0202, + "epoch": 0.27, + "learning_rate": 0.00025995933626287137, + "loss": 0.0205, "step": 52910 }, { - "epoch": 0.57, - "learning_rate": 0.00021418563922942204, - "loss": 0.0205, + "epoch": 0.27, + "learning_rate": 0.00025995176856985735, + "loss": 0.0192, "step": 52920 }, { - "epoch": 0.57, - "learning_rate": 0.00021416942336381913, - "loss": 0.0177, + "epoch": 0.27, + "learning_rate": 0.00025994420087684333, + "loss": 0.022, "step": 52930 }, { - "epoch": 0.57, - "learning_rate": 0.00021415320749821625, - "loss": 0.0171, + "epoch": 0.27, + "learning_rate": 0.0002599366331838293, + "loss": 0.0226, "step": 52940 }, { - "epoch": 0.57, - "learning_rate": 0.00021413699163261334, - "loss": 0.0167, + "epoch": 0.27, + "learning_rate": 0.00025992906549081535, + "loss": 0.0185, "step": 52950 }, { - "epoch": 0.57, - "learning_rate": 0.0002141207757670104, - "loss": 0.0176, + "epoch": 0.27, + "learning_rate": 0.00025992149779780133, + "loss": 0.0218, "step": 52960 }, { - "epoch": 0.57, - "learning_rate": 0.0002141045599014075, - "loss": 0.0201, + "epoch": 0.27, + "learning_rate": 0.0002599139301047873, + "loss": 0.0222, "step": 52970 }, { - "epoch": 0.57, - "learning_rate": 0.00021408834403580462, - "loss": 0.0173, + "epoch": 0.27, + "learning_rate": 0.0002599063624117733, + "loss": 0.0201, "step": 52980 }, { - "epoch": 0.57, - "learning_rate": 0.0002140721281702017, - "loss": 0.0164, + "epoch": 0.27, + "learning_rate": 0.0002598987947187593, + "loss": 0.0221, "step": 52990 }, { - "epoch": 0.57, - "learning_rate": 0.00021405591230459878, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.00025989122702574526, + "loss": 0.0175, "step": 53000 }, { - "epoch": 0.57, - "eval_cer": 0.9215582042155038, - "eval_loss": 0.012771863490343094, - "eval_runtime": 121.4029, - "eval_samples_per_second": 16.474, - "eval_steps_per_second": 4.119, + "epoch": 0.27, + "eval_cer": 0.9145139237288054, + "eval_loss": 0.015266528353095055, + "eval_runtime": 115.681, + "eval_samples_per_second": 17.289, + "eval_steps_per_second": 4.322, "step": 53000 }, { - "epoch": 0.57, - "learning_rate": 0.0002140396964389959, - "loss": 0.0192, + "epoch": 0.27, + "learning_rate": 0.00025988365933273124, + "loss": 0.0195, "step": 53010 }, { - "epoch": 0.57, - "learning_rate": 0.000214023480573393, - "loss": 0.0148, + "epoch": 0.27, + "learning_rate": 0.0002598760916397173, + "loss": 0.0184, "step": 53020 }, { - "epoch": 0.57, - "learning_rate": 0.00021400726470779008, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.00025986852394670326, + "loss": 0.0241, "step": 53030 }, { - "epoch": 0.57, - "learning_rate": 0.00021399104884218718, - "loss": 0.0162, + "epoch": 0.27, + "learning_rate": 0.00025986095625368924, + "loss": 0.0221, "step": 53040 }, { - "epoch": 0.57, - "learning_rate": 0.00021397483297658427, - "loss": 0.0206, + "epoch": 0.27, + "learning_rate": 0.0002598533885606752, + "loss": 0.0205, "step": 53050 }, { - "epoch": 0.57, - "learning_rate": 0.00021395861711098136, - "loss": 0.0181, + "epoch": 0.27, + "learning_rate": 0.0002598458208676612, + "loss": 0.0233, "step": 53060 }, { - "epoch": 0.57, - "learning_rate": 0.00021394240124537848, - "loss": 0.0145, + "epoch": 0.27, + "learning_rate": 0.0002598382531746472, + "loss": 0.0203, "step": 53070 }, { - "epoch": 0.57, - "learning_rate": 0.00021392618537977555, - "loss": 0.0175, + "epoch": 0.27, + "learning_rate": 0.0002598306854816332, + "loss": 0.0199, "step": 53080 }, { - "epoch": 0.57, - "learning_rate": 0.00021390996951417264, - "loss": 0.0183, + "epoch": 0.27, + "learning_rate": 0.0002598231177886192, + "loss": 0.021, "step": 53090 }, { - "epoch": 0.57, - "learning_rate": 0.00021389375364856973, - "loss": 0.0192, + "epoch": 0.27, + "learning_rate": 0.0002598155500956052, + "loss": 0.0176, "step": 53100 }, { - "epoch": 0.57, - "learning_rate": 0.00021387753778296685, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.00025980798240259116, + "loss": 0.0187, "step": 53110 }, { - "epoch": 0.57, - "learning_rate": 0.00021386132191736392, - "loss": 0.02, + "epoch": 0.27, + "learning_rate": 0.00025980041470957714, + "loss": 0.0223, "step": 53120 }, { - "epoch": 0.57, - "learning_rate": 0.000213845106051761, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.0002597928470165631, + "loss": 0.0216, "step": 53130 }, { - "epoch": 0.57, - "learning_rate": 0.00021382889018615813, - "loss": 0.0179, + "epoch": 0.27, + "learning_rate": 0.0002597852793235491, + "loss": 0.0224, "step": 53140 }, { - "epoch": 0.57, - "learning_rate": 0.00021381267432055522, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.00025977771163053514, + "loss": 0.0224, "step": 53150 }, { - "epoch": 0.57, - "learning_rate": 0.0002137964584549523, + "epoch": 0.27, + "learning_rate": 0.0002597701439375211, "loss": 0.0199, "step": 53160 }, { - "epoch": 0.57, - "learning_rate": 0.00021378024258934938, - "loss": 0.0177, + "epoch": 0.27, + "learning_rate": 0.0002597625762445071, + "loss": 0.0199, "step": 53170 }, { - "epoch": 0.57, - "learning_rate": 0.0002137640267237465, - "loss": 0.0192, + "epoch": 0.27, + "learning_rate": 0.0002597550085514931, + "loss": 0.0261, "step": 53180 }, { - "epoch": 0.58, - "learning_rate": 0.0002137478108581436, - "loss": 0.0179, + "epoch": 0.27, + "learning_rate": 0.00025974744085847907, + "loss": 0.0254, "step": 53190 }, { - "epoch": 0.58, - "learning_rate": 0.00021373159499254066, - "loss": 0.015, + "epoch": 0.27, + "learning_rate": 0.00025973987316546505, + "loss": 0.024, "step": 53200 }, { - "epoch": 0.58, - "learning_rate": 0.00021371537912693778, - "loss": 0.017, + "epoch": 0.27, + "learning_rate": 0.0002597323054724511, + "loss": 0.0212, "step": 53210 }, { - "epoch": 0.58, - "learning_rate": 0.00021369916326133487, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.00025972473777943707, + "loss": 0.0167, "step": 53220 }, { - "epoch": 0.58, - "learning_rate": 0.00021368294739573197, - "loss": 0.0199, + "epoch": 0.27, + "learning_rate": 0.00025971717008642305, + "loss": 0.0234, "step": 53230 }, { - "epoch": 0.58, - "learning_rate": 0.00021366673153012909, - "loss": 0.0152, + "epoch": 0.27, + "learning_rate": 0.00025970960239340903, + "loss": 0.0207, "step": 53240 }, { - "epoch": 0.58, - "learning_rate": 0.00021365051566452615, - "loss": 0.0198, + "epoch": 0.27, + "learning_rate": 0.000259702034700395, + "loss": 0.0243, "step": 53250 }, { - "epoch": 0.58, - "learning_rate": 0.00021363429979892324, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.000259694467007381, + "loss": 0.0201, "step": 53260 }, { - "epoch": 0.58, - "learning_rate": 0.00021361808393332034, - "loss": 0.0154, + "epoch": 0.27, + "learning_rate": 0.00025968689931436703, + "loss": 0.019, "step": 53270 }, { - "epoch": 0.58, - "learning_rate": 0.00021360186806771746, - "loss": 0.0175, + "epoch": 0.27, + "learning_rate": 0.000259679331621353, + "loss": 0.0231, "step": 53280 }, { - "epoch": 0.58, - "learning_rate": 0.00021358565220211452, - "loss": 0.0138, + "epoch": 0.27, + "learning_rate": 0.000259671763928339, + "loss": 0.0202, "step": 53290 }, { - "epoch": 0.58, - "learning_rate": 0.00021356943633651161, - "loss": 0.0177, + "epoch": 0.27, + "learning_rate": 0.00025966419623532497, + "loss": 0.022, "step": 53300 }, { - "epoch": 0.58, - "learning_rate": 0.00021355322047090873, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.00025965662854231095, + "loss": 0.021, "step": 53310 }, { - "epoch": 0.58, - "learning_rate": 0.00021353700460530583, - "loss": 0.0133, + "epoch": 0.27, + "learning_rate": 0.00025964906084929694, + "loss": 0.0198, "step": 53320 }, { - "epoch": 0.58, - "learning_rate": 0.0002135207887397029, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.0002596414931562829, + "loss": 0.0193, "step": 53330 }, { - "epoch": 0.58, - "learning_rate": 0.0002135045728741, - "loss": 0.0176, + "epoch": 0.27, + "learning_rate": 0.00025963392546326895, + "loss": 0.0194, "step": 53340 }, { - "epoch": 0.58, - "learning_rate": 0.0002134883570084971, - "loss": 0.0216, + "epoch": 0.27, + "learning_rate": 0.00025962635777025493, + "loss": 0.0188, "step": 53350 }, { - "epoch": 0.58, - "learning_rate": 0.0002134721411428942, - "loss": 0.0189, + "epoch": 0.27, + "learning_rate": 0.0002596187900772409, + "loss": 0.0222, "step": 53360 }, { - "epoch": 0.58, - "learning_rate": 0.00021345592527729126, - "loss": 0.0146, + "epoch": 0.27, + "learning_rate": 0.0002596112223842269, + "loss": 0.0222, "step": 53370 }, { - "epoch": 0.58, - "learning_rate": 0.00021343970941168838, - "loss": 0.019, + "epoch": 0.27, + "learning_rate": 0.0002596036546912129, + "loss": 0.0183, "step": 53380 }, { - "epoch": 0.58, - "learning_rate": 0.00021342349354608548, - "loss": 0.0143, + "epoch": 0.27, + "learning_rate": 0.00025959608699819886, + "loss": 0.0209, "step": 53390 }, { - "epoch": 0.58, - "learning_rate": 0.00021340727768048257, - "loss": 0.0164, + "epoch": 0.27, + "learning_rate": 0.0002595885193051849, + "loss": 0.0216, "step": 53400 }, { - "epoch": 0.58, - "learning_rate": 0.00021339106181487966, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.0002595809516121709, + "loss": 0.0195, "step": 53410 }, { - "epoch": 0.58, - "learning_rate": 0.00021337484594927675, - "loss": 0.0193, + "epoch": 0.27, + "learning_rate": 0.0002595733839191568, + "loss": 0.02, "step": 53420 }, { - "epoch": 0.58, - "learning_rate": 0.00021335863008367385, - "loss": 0.0175, + "epoch": 0.27, + "learning_rate": 0.0002595658162261428, + "loss": 0.0177, "step": 53430 }, { - "epoch": 0.58, - "learning_rate": 0.00021334241421807097, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.0002595582485331288, + "loss": 0.0191, "step": 53440 }, { - "epoch": 0.58, - "learning_rate": 0.00021332619835246803, - "loss": 0.0183, + "epoch": 0.27, + "learning_rate": 0.0002595506808401148, + "loss": 0.0245, "step": 53450 }, { - "epoch": 0.58, - "learning_rate": 0.00021330998248686513, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.0002595431131471008, + "loss": 0.0175, "step": 53460 }, { - "epoch": 0.58, - "learning_rate": 0.00021329376662126222, - "loss": 0.0188, + "epoch": 0.27, + "learning_rate": 0.00025953554545408677, + "loss": 0.0199, "step": 53470 }, { - "epoch": 0.58, - "learning_rate": 0.00021327755075565934, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.00025952797776107275, + "loss": 0.0222, "step": 53480 }, { - "epoch": 0.58, - "learning_rate": 0.0002132613348900564, - "loss": 0.0171, + "epoch": 0.27, + "learning_rate": 0.00025952041006805873, + "loss": 0.0218, "step": 53490 }, { - "epoch": 0.58, - "learning_rate": 0.0002132451190244535, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.00025951284237504476, + "loss": 0.0183, "step": 53500 }, { - "epoch": 0.58, - "learning_rate": 0.00021322890315885062, - "loss": 0.017, + "epoch": 0.27, + "learning_rate": 0.00025950527468203075, + "loss": 0.0208, "step": 53510 }, { - "epoch": 0.58, - "learning_rate": 0.0002132126872932477, - "loss": 0.014, + "epoch": 0.27, + "learning_rate": 0.0002594977069890167, + "loss": 0.0213, "step": 53520 }, { - "epoch": 0.58, - "learning_rate": 0.00021319647142764477, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.0002594901392960027, + "loss": 0.0182, "step": 53530 }, { - "epoch": 0.58, - "learning_rate": 0.00021318025556204187, - "loss": 0.0194, + "epoch": 0.27, + "learning_rate": 0.0002594825716029887, + "loss": 0.0207, "step": 53540 }, { - "epoch": 0.58, - "learning_rate": 0.000213164039696439, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.00025947500390997467, + "loss": 0.0188, "step": 53550 }, { - "epoch": 0.58, - "learning_rate": 0.00021314782383083608, - "loss": 0.0189, + "epoch": 0.27, + "learning_rate": 0.00025946743621696065, + "loss": 0.0212, "step": 53560 }, { - "epoch": 0.58, - "learning_rate": 0.00021313160796523315, - "loss": 0.0189, + "epoch": 0.27, + "learning_rate": 0.0002594598685239467, + "loss": 0.0211, "step": 53570 }, { - "epoch": 0.58, - "learning_rate": 0.00021311539209963027, - "loss": 0.0173, + "epoch": 0.27, + "learning_rate": 0.00025945230083093267, + "loss": 0.0185, "step": 53580 }, { - "epoch": 0.58, - "learning_rate": 0.00021309917623402736, - "loss": 0.0192, + "epoch": 0.27, + "learning_rate": 0.00025944473313791865, + "loss": 0.0217, "step": 53590 }, { - "epoch": 0.58, - "learning_rate": 0.00021308296036842445, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.00025943716544490463, + "loss": 0.0209, "step": 53600 }, { - "epoch": 0.58, - "learning_rate": 0.00021306674450282152, - "loss": 0.0161, + "epoch": 0.27, + "learning_rate": 0.0002594295977518906, + "loss": 0.0213, "step": 53610 }, { - "epoch": 0.58, - "learning_rate": 0.00021305052863721864, - "loss": 0.0152, + "epoch": 0.27, + "learning_rate": 0.0002594220300588766, + "loss": 0.0195, "step": 53620 }, { - "epoch": 0.58, - "learning_rate": 0.00021303431277161573, - "loss": 0.0172, + "epoch": 0.27, + "learning_rate": 0.00025941446236586263, + "loss": 0.0239, "step": 53630 }, { - "epoch": 0.58, - "learning_rate": 0.00021301809690601285, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.0002594068946728486, + "loss": 0.0188, "step": 53640 }, { - "epoch": 0.58, - "learning_rate": 0.00021300188104040991, - "loss": 0.0178, + "epoch": 0.27, + "learning_rate": 0.0002593993269798346, + "loss": 0.0215, "step": 53650 }, { - "epoch": 0.58, - "learning_rate": 0.000212985665174807, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.0002593917592868206, + "loss": 0.0215, "step": 53660 }, { - "epoch": 0.58, - "learning_rate": 0.0002129694493092041, - "loss": 0.0171, + "epoch": 0.27, + "learning_rate": 0.00025938419159380656, + "loss": 0.0234, "step": 53670 }, { - "epoch": 0.58, - "learning_rate": 0.00021295323344360122, - "loss": 0.0177, + "epoch": 0.27, + "learning_rate": 0.00025937662390079254, + "loss": 0.0191, "step": 53680 }, { - "epoch": 0.58, - "learning_rate": 0.00021293701757799829, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.0002593690562077786, + "loss": 0.021, "step": 53690 }, { - "epoch": 0.58, - "learning_rate": 0.00021292080171239538, - "loss": 0.018, + "epoch": 0.27, + "learning_rate": 0.00025936148851476456, + "loss": 0.0237, "step": 53700 }, { - "epoch": 0.58, - "learning_rate": 0.0002129045858467925, - "loss": 0.0213, + "epoch": 0.27, + "learning_rate": 0.00025935392082175054, + "loss": 0.0247, "step": 53710 }, { - "epoch": 0.58, - "learning_rate": 0.0002128883699811896, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.0002593463531287365, + "loss": 0.0222, "step": 53720 }, { - "epoch": 0.58, - "learning_rate": 0.00021287215411558666, - "loss": 0.0185, + "epoch": 0.27, + "learning_rate": 0.0002593387854357225, + "loss": 0.025, "step": 53730 }, { - "epoch": 0.58, - "learning_rate": 0.00021285593824998375, - "loss": 0.0161, + "epoch": 0.27, + "learning_rate": 0.0002593312177427085, + "loss": 0.023, "step": 53740 }, { - "epoch": 0.58, - "learning_rate": 0.00021283972238438087, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.00025932365004969446, + "loss": 0.0198, "step": 53750 }, { - "epoch": 0.58, - "learning_rate": 0.00021282350651877796, - "loss": 0.0179, + "epoch": 0.27, + "learning_rate": 0.0002593160823566805, + "loss": 0.0187, "step": 53760 }, { - "epoch": 0.58, - "learning_rate": 0.00021280729065317503, - "loss": 0.0195, + "epoch": 0.27, + "learning_rate": 0.0002593085146636665, + "loss": 0.0211, "step": 53770 }, { - "epoch": 0.58, - "learning_rate": 0.00021279107478757215, - "loss": 0.0223, + "epoch": 0.27, + "learning_rate": 0.00025930094697065246, + "loss": 0.018, "step": 53780 }, { - "epoch": 0.58, - "learning_rate": 0.00021277485892196924, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.00025929337927763844, + "loss": 0.0223, "step": 53790 }, { - "epoch": 0.58, - "learning_rate": 0.00021275864305636633, - "loss": 0.0207, + "epoch": 0.27, + "learning_rate": 0.0002592858115846244, + "loss": 0.0201, "step": 53800 }, { - "epoch": 0.58, - "learning_rate": 0.0002127424271907634, - "loss": 0.0162, + "epoch": 0.27, + "learning_rate": 0.0002592782438916104, + "loss": 0.0215, "step": 53810 }, { - "epoch": 0.58, - "learning_rate": 0.00021272621132516052, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.00025927067619859644, + "loss": 0.0229, "step": 53820 }, { - "epoch": 0.58, - "learning_rate": 0.0002127099954595576, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.0002592631085055824, + "loss": 0.02, "step": 53830 }, { - "epoch": 0.58, - "learning_rate": 0.0002126937795939547, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.0002592555408125684, + "loss": 0.0187, "step": 53840 }, { - "epoch": 0.58, - "learning_rate": 0.0002126775637283518, - "loss": 0.0205, + "epoch": 0.27, + "learning_rate": 0.0002592479731195544, + "loss": 0.0186, "step": 53850 }, { - "epoch": 0.58, - "learning_rate": 0.0002126613478627489, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.00025924040542654037, + "loss": 0.0216, "step": 53860 }, { - "epoch": 0.58, - "learning_rate": 0.00021264513199714598, - "loss": 0.0154, + "epoch": 0.27, + "learning_rate": 0.00025923283773352635, + "loss": 0.0201, "step": 53870 }, { - "epoch": 0.58, - "learning_rate": 0.0002126289161315431, - "loss": 0.0173, + "epoch": 0.27, + "learning_rate": 0.00025922527004051233, + "loss": 0.0207, "step": 53880 }, { - "epoch": 0.58, - "learning_rate": 0.00021261270026594017, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.00025921770234749837, + "loss": 0.0211, "step": 53890 }, { - "epoch": 0.58, - "learning_rate": 0.00021259648440033726, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.00025921013465448435, + "loss": 0.0197, "step": 53900 }, { - "epoch": 0.58, - "learning_rate": 0.00021258026853473435, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.00025920256696147033, + "loss": 0.0213, "step": 53910 }, { - "epoch": 0.58, - "learning_rate": 0.00021256405266913147, - "loss": 0.0214, + "epoch": 0.27, + "learning_rate": 0.0002591949992684563, + "loss": 0.0166, "step": 53920 }, { - "epoch": 0.58, - "learning_rate": 0.00021254783680352854, - "loss": 0.0175, + "epoch": 0.27, + "learning_rate": 0.0002591874315754423, + "loss": 0.0223, "step": 53930 }, { - "epoch": 0.58, - "learning_rate": 0.00021253162093792563, - "loss": 0.0181, + "epoch": 0.27, + "learning_rate": 0.00025917986388242827, + "loss": 0.0161, "step": 53940 }, { - "epoch": 0.58, - "learning_rate": 0.00021251540507232275, - "loss": 0.0167, + "epoch": 0.27, + "learning_rate": 0.0002591722961894143, + "loss": 0.0202, "step": 53950 }, { - "epoch": 0.58, - "learning_rate": 0.00021249918920671984, - "loss": 0.0184, + "epoch": 0.27, + "learning_rate": 0.0002591647284964003, + "loss": 0.0214, "step": 53960 }, { - "epoch": 0.58, - "learning_rate": 0.00021248297334111694, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.00025915716080338627, + "loss": 0.0167, "step": 53970 }, { - "epoch": 0.58, - "learning_rate": 0.000212466757475514, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.00025914959311037225, + "loss": 0.0202, "step": 53980 }, { - "epoch": 0.58, - "learning_rate": 0.00021245054160991112, - "loss": 0.0177, + "epoch": 0.27, + "learning_rate": 0.00025914202541735823, + "loss": 0.0219, "step": 53990 }, { - "epoch": 0.58, - "learning_rate": 0.00021243432574430822, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.0002591344577243442, + "loss": 0.0209, "step": 54000 }, { - "epoch": 0.58, - "eval_cer": 0.9215590728184603, - "eval_loss": 0.012681106105446815, - "eval_runtime": 121.7214, - "eval_samples_per_second": 16.431, - "eval_steps_per_second": 4.108, + "epoch": 0.27, + "eval_cer": 0.9144857822411687, + "eval_loss": 0.014917539432644844, + "eval_runtime": 115.9864, + "eval_samples_per_second": 17.243, + "eval_steps_per_second": 4.311, "step": 54000 }, { - "epoch": 0.58, - "learning_rate": 0.00021241810987870533, - "loss": 0.0182, + "epoch": 0.27, + "learning_rate": 0.00025912689003133025, + "loss": 0.0213, "step": 54010 }, { - "epoch": 0.58, - "learning_rate": 0.0002124018940131024, - "loss": 0.0187, + "epoch": 0.27, + "learning_rate": 0.00025911932233831623, + "loss": 0.0186, "step": 54020 }, { - "epoch": 0.58, - "learning_rate": 0.0002123856781474995, - "loss": 0.0187, + "epoch": 0.27, + "learning_rate": 0.0002591117546453022, + "loss": 0.0197, "step": 54030 }, { - "epoch": 0.58, - "learning_rate": 0.00021236946228189659, - "loss": 0.0199, + "epoch": 0.27, + "learning_rate": 0.0002591041869522882, + "loss": 0.0207, "step": 54040 }, { - "epoch": 0.58, - "learning_rate": 0.0002123532464162937, - "loss": 0.0162, + "epoch": 0.27, + "learning_rate": 0.0002590966192592742, + "loss": 0.0218, "step": 54050 }, { - "epoch": 0.58, - "learning_rate": 0.00021233703055069077, - "loss": 0.0164, + "epoch": 0.27, + "learning_rate": 0.00025908905156626016, + "loss": 0.022, "step": 54060 }, { - "epoch": 0.58, - "learning_rate": 0.00021232081468508786, - "loss": 0.0174, + "epoch": 0.27, + "learning_rate": 0.00025908148387324614, + "loss": 0.0279, "step": 54070 }, { - "epoch": 0.58, - "learning_rate": 0.00021230459881948498, - "loss": 0.0185, + "epoch": 0.27, + "learning_rate": 0.0002590739161802322, + "loss": 0.0219, "step": 54080 }, { - "epoch": 0.58, - "learning_rate": 0.00021228838295388208, - "loss": 0.0207, + "epoch": 0.27, + "learning_rate": 0.00025906634848721816, + "loss": 0.0769, "step": 54090 }, { - "epoch": 0.58, - "learning_rate": 0.00021227216708827914, - "loss": 0.0186, + "epoch": 0.27, + "learning_rate": 0.00025905878079420414, + "loss": 0.0249, "step": 54100 }, { - "epoch": 0.58, - "learning_rate": 0.00021225595122267624, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.0002590512131011901, + "loss": 0.0208, "step": 54110 }, { - "epoch": 0.59, - "learning_rate": 0.00021223973535707336, - "loss": 0.0168, + "epoch": 0.27, + "learning_rate": 0.0002590436454081761, + "loss": 0.0231, "step": 54120 }, { - "epoch": 0.59, - "learning_rate": 0.00021222351949147045, - "loss": 0.0192, + "epoch": 0.27, + "learning_rate": 0.0002590360777151621, + "loss": 0.025, "step": 54130 }, { - "epoch": 0.59, - "learning_rate": 0.0002122073036258675, - "loss": 0.0167, + "epoch": 0.27, + "learning_rate": 0.0002590285100221481, + "loss": 0.0341, "step": 54140 }, { - "epoch": 0.59, - "learning_rate": 0.00021219108776026463, - "loss": 0.0176, + "epoch": 0.27, + "learning_rate": 0.0002590209423291341, + "loss": 0.0182, "step": 54150 }, { - "epoch": 0.59, - "learning_rate": 0.00021217487189466173, - "loss": 0.0186, + "epoch": 0.27, + "learning_rate": 0.0002590133746361201, + "loss": 0.0226, "step": 54160 }, { - "epoch": 0.59, - "learning_rate": 0.00021215865602905882, - "loss": 0.0185, + "epoch": 0.27, + "learning_rate": 0.00025900580694310606, + "loss": 0.0229, "step": 54170 }, { - "epoch": 0.59, - "learning_rate": 0.00021214244016345588, + "epoch": 0.27, + "learning_rate": 0.00025899823925009204, "loss": 0.0222, "step": 54180 }, { - "epoch": 0.59, - "learning_rate": 0.000212126224297853, - "loss": 0.0182, + "epoch": 0.27, + "learning_rate": 0.000258990671557078, + "loss": 0.0165, "step": 54190 }, { - "epoch": 0.59, - "learning_rate": 0.0002121100084322501, - "loss": 0.0195, + "epoch": 0.27, + "learning_rate": 0.00025898310386406406, + "loss": 0.0272, "step": 54200 }, { - "epoch": 0.59, - "learning_rate": 0.0002120937925666472, - "loss": 0.0179, + "epoch": 0.27, + "learning_rate": 0.00025897553617105004, + "loss": 0.0251, "step": 54210 }, { - "epoch": 0.59, - "learning_rate": 0.00021207757670104428, - "loss": 0.0137, + "epoch": 0.27, + "learning_rate": 0.000258967968478036, + "loss": 0.0219, "step": 54220 }, { - "epoch": 0.59, - "learning_rate": 0.00021206136083544138, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.000258960400785022, + "loss": 0.0223, "step": 54230 }, { - "epoch": 0.59, - "learning_rate": 0.00021204514496983847, - "loss": 0.0199, + "epoch": 0.27, + "learning_rate": 0.000258952833092008, + "loss": 0.0248, "step": 54240 }, { - "epoch": 0.59, - "learning_rate": 0.0002120289291042356, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.00025894526539899397, + "loss": 0.0204, "step": 54250 }, { - "epoch": 0.59, - "learning_rate": 0.00021201271323863265, - "loss": 0.0203, + "epoch": 0.27, + "learning_rate": 0.00025893769770597995, + "loss": 0.0218, "step": 54260 }, { - "epoch": 0.59, - "learning_rate": 0.00021199649737302975, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.000258930130012966, + "loss": 0.0197, "step": 54270 }, { - "epoch": 0.59, - "learning_rate": 0.00021198028150742684, - "loss": 0.0126, + "epoch": 0.27, + "learning_rate": 0.00025892256231995197, + "loss": 0.0206, "step": 54280 }, { - "epoch": 0.59, - "learning_rate": 0.00021196406564182396, - "loss": 0.0142, + "epoch": 0.27, + "learning_rate": 0.00025891499462693795, + "loss": 0.0197, "step": 54290 }, { - "epoch": 0.59, - "learning_rate": 0.00021194784977622102, - "loss": 0.0192, + "epoch": 0.27, + "learning_rate": 0.00025890742693392393, + "loss": 0.019, "step": 54300 }, { - "epoch": 0.59, - "learning_rate": 0.00021193163391061812, - "loss": 0.0189, + "epoch": 0.27, + "learning_rate": 0.0002588998592409099, + "loss": 0.0159, "step": 54310 }, { - "epoch": 0.59, - "learning_rate": 0.00021191541804501524, - "loss": 0.0189, + "epoch": 0.27, + "learning_rate": 0.0002588922915478959, + "loss": 0.0225, "step": 54320 }, { - "epoch": 0.59, - "learning_rate": 0.00021189920217941233, - "loss": 0.0179, + "epoch": 0.27, + "learning_rate": 0.00025888472385488193, + "loss": 0.0188, "step": 54330 }, { - "epoch": 0.59, - "learning_rate": 0.0002118829863138094, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.0002588771561618679, + "loss": 0.0232, "step": 54340 }, { - "epoch": 0.59, - "learning_rate": 0.00021186677044820652, - "loss": 0.017, + "epoch": 0.27, + "learning_rate": 0.0002588695884688539, + "loss": 0.0184, "step": 54350 }, { - "epoch": 0.59, - "learning_rate": 0.0002118505545826036, - "loss": 0.0222, + "epoch": 0.27, + "learning_rate": 0.00025886202077583987, + "loss": 0.0213, "step": 54360 }, { - "epoch": 0.59, - "learning_rate": 0.0002118343387170007, - "loss": 0.0186, + "epoch": 0.27, + "learning_rate": 0.00025885445308282585, + "loss": 0.0231, "step": 54370 }, { - "epoch": 0.59, - "learning_rate": 0.00021181812285139777, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.00025884688538981184, + "loss": 0.02, "step": 54380 }, { - "epoch": 0.59, - "learning_rate": 0.00021180190698579489, - "loss": 0.0186, + "epoch": 0.27, + "learning_rate": 0.0002588393176967978, + "loss": 0.022, "step": 54390 }, { - "epoch": 0.59, - "learning_rate": 0.00021178569112019198, - "loss": 0.0201, + "epoch": 0.27, + "learning_rate": 0.00025883175000378385, + "loss": 0.0253, "step": 54400 }, { - "epoch": 0.59, - "learning_rate": 0.00021176947525458907, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.00025882418231076983, + "loss": 0.025, "step": 54410 }, { - "epoch": 0.59, - "learning_rate": 0.00021175325938898616, - "loss": 0.0175, + "epoch": 0.27, + "learning_rate": 0.0002588166146177558, + "loss": 0.0224, "step": 54420 }, { - "epoch": 0.59, - "learning_rate": 0.00021173704352338326, - "loss": 0.0181, + "epoch": 0.27, + "learning_rate": 0.0002588090469247418, + "loss": 0.0216, "step": 54430 }, { - "epoch": 0.59, - "learning_rate": 0.00021172082765778035, - "loss": 0.014, + "epoch": 0.27, + "learning_rate": 0.0002588014792317278, + "loss": 0.0204, "step": 54440 }, { - "epoch": 0.59, - "learning_rate": 0.00021170461179217747, - "loss": 0.0172, + "epoch": 0.27, + "learning_rate": 0.00025879391153871376, + "loss": 0.0228, "step": 54450 }, { - "epoch": 0.59, - "learning_rate": 0.00021168839592657454, - "loss": 0.0188, + "epoch": 0.27, + "learning_rate": 0.0002587863438456998, + "loss": 0.0173, "step": 54460 }, { - "epoch": 0.59, - "learning_rate": 0.00021167218006097163, - "loss": 0.0175, + "epoch": 0.27, + "learning_rate": 0.0002587787761526858, + "loss": 0.0179, "step": 54470 }, { - "epoch": 0.59, - "learning_rate": 0.00021165596419536872, - "loss": 0.0191, + "epoch": 0.27, + "learning_rate": 0.00025877120845967176, + "loss": 0.0294, "step": 54480 }, { - "epoch": 0.59, - "learning_rate": 0.00021163974832976584, - "loss": 0.014, + "epoch": 0.27, + "learning_rate": 0.00025876364076665774, + "loss": 0.023, "step": 54490 }, { - "epoch": 0.59, - "learning_rate": 0.0002116235324641629, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.0002587560730736437, + "loss": 0.0196, "step": 54500 }, { - "epoch": 0.59, - "learning_rate": 0.00021160731659856, - "loss": 0.0128, + "epoch": 0.28, + "learning_rate": 0.0002587485053806297, + "loss": 0.0192, "step": 54510 }, { - "epoch": 0.59, - "learning_rate": 0.00021159110073295712, - "loss": 0.0141, + "epoch": 0.28, + "learning_rate": 0.00025874093768761574, + "loss": 0.0216, "step": 54520 }, { - "epoch": 0.59, - "learning_rate": 0.0002115748848673542, - "loss": 0.015, + "epoch": 0.28, + "learning_rate": 0.0002587333699946017, + "loss": 0.0189, "step": 54530 }, { - "epoch": 0.59, - "learning_rate": 0.00021155866900175128, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.0002587258023015877, + "loss": 0.022, "step": 54540 }, { - "epoch": 0.59, - "learning_rate": 0.00021154245313614837, - "loss": 0.015, + "epoch": 0.28, + "learning_rate": 0.0002587182346085737, + "loss": 0.0242, "step": 54550 }, { - "epoch": 0.59, - "learning_rate": 0.0002115262372705455, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.00025871066691555966, + "loss": 0.0205, "step": 54560 }, { - "epoch": 0.59, - "learning_rate": 0.00021151002140494258, - "loss": 0.0181, + "epoch": 0.28, + "learning_rate": 0.00025870309922254565, + "loss": 0.0198, "step": 54570 }, { - "epoch": 0.59, - "learning_rate": 0.00021149380553933965, - "loss": 0.0141, + "epoch": 0.28, + "learning_rate": 0.00025869553152953163, + "loss": 0.0218, "step": 54580 }, { - "epoch": 0.59, - "learning_rate": 0.00021147758967373677, - "loss": 0.0238, + "epoch": 0.28, + "learning_rate": 0.00025868796383651766, + "loss": 0.0232, "step": 54590 }, { - "epoch": 0.59, - "learning_rate": 0.00021146137380813386, - "loss": 0.0167, + "epoch": 0.28, + "learning_rate": 0.00025868039614350364, + "loss": 0.0253, "step": 54600 }, { - "epoch": 0.59, - "learning_rate": 0.00021144515794253095, + "epoch": 0.28, + "learning_rate": 0.0002586728284504896, "loss": 0.0187, "step": 54610 }, { - "epoch": 0.59, - "learning_rate": 0.00021142894207692802, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.0002586652607574756, + "loss": 0.0187, "step": 54620 }, { - "epoch": 0.59, - "learning_rate": 0.00021141272621132514, - "loss": 0.0171, + "epoch": 0.28, + "learning_rate": 0.0002586576930644616, + "loss": 0.0231, "step": 54630 }, { - "epoch": 0.59, - "learning_rate": 0.00021139651034572223, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.00025865012537144757, + "loss": 0.0232, "step": 54640 }, { - "epoch": 0.59, - "learning_rate": 0.00021138029448011935, - "loss": 0.0187, + "epoch": 0.28, + "learning_rate": 0.0002586425576784336, + "loss": 0.0191, "step": 54650 }, { - "epoch": 0.59, - "learning_rate": 0.00021136407861451642, - "loss": 0.0158, + "epoch": 0.28, + "learning_rate": 0.0002586349899854196, + "loss": 0.0203, "step": 54660 }, { - "epoch": 0.59, - "learning_rate": 0.0002113478627489135, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.00025862742229240557, + "loss": 0.0224, "step": 54670 }, { - "epoch": 0.59, - "learning_rate": 0.0002113316468833106, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.0002586198545993915, + "loss": 0.0187, "step": 54680 }, { - "epoch": 0.59, - "learning_rate": 0.00021131543101770772, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.00025861228690637753, + "loss": 0.0215, "step": 54690 }, { - "epoch": 0.59, - "learning_rate": 0.00021129921515210482, - "loss": 0.0158, + "epoch": 0.28, + "learning_rate": 0.0002586047192133635, + "loss": 0.0227, "step": 54700 }, { - "epoch": 0.59, - "learning_rate": 0.00021128299928650188, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.0002585971515203495, + "loss": 0.0164, "step": 54710 }, { - "epoch": 0.59, - "learning_rate": 0.000211266783420899, - "loss": 0.02, + "epoch": 0.28, + "learning_rate": 0.0002585895838273355, + "loss": 0.0203, "step": 54720 }, { - "epoch": 0.59, - "learning_rate": 0.0002112505675552961, - "loss": 0.0176, + "epoch": 0.28, + "learning_rate": 0.00025858201613432146, + "loss": 0.0224, "step": 54730 }, { - "epoch": 0.59, - "learning_rate": 0.0002112343516896932, - "loss": 0.0177, + "epoch": 0.28, + "learning_rate": 0.00025857444844130744, + "loss": 0.0213, "step": 54740 }, { - "epoch": 0.59, - "learning_rate": 0.00021121813582409025, - "loss": 0.0151, + "epoch": 0.28, + "learning_rate": 0.0002585668807482935, + "loss": 0.0192, "step": 54750 }, { - "epoch": 0.59, - "learning_rate": 0.00021120191995848737, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.00025855931305527946, + "loss": 0.0183, "step": 54760 }, { - "epoch": 0.59, - "learning_rate": 0.00021118570409288446, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.00025855174536226544, + "loss": 0.0232, "step": 54770 }, { - "epoch": 0.59, - "learning_rate": 0.00021116948822728156, - "loss": 0.02, + "epoch": 0.28, + "learning_rate": 0.0002585441776692514, + "loss": 0.0258, "step": 54780 }, { - "epoch": 0.59, - "learning_rate": 0.00021115327236167865, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.0002585366099762374, + "loss": 0.0201, "step": 54790 }, { - "epoch": 0.59, - "learning_rate": 0.00021113705649607574, - "loss": 0.0157, + "epoch": 0.28, + "learning_rate": 0.0002585290422832234, + "loss": 0.0201, "step": 54800 }, { - "epoch": 0.59, - "learning_rate": 0.00021112084063047284, - "loss": 0.0208, + "epoch": 0.28, + "learning_rate": 0.00025852147459020936, + "loss": 0.0246, "step": 54810 }, { - "epoch": 0.59, - "learning_rate": 0.00021110462476486996, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.0002585139068971954, + "loss": 0.019, "step": 54820 }, { - "epoch": 0.59, - "learning_rate": 0.00021108840889926702, - "loss": 0.0189, + "epoch": 0.28, + "learning_rate": 0.0002585063392041814, + "loss": 0.0237, "step": 54830 }, { - "epoch": 0.59, - "learning_rate": 0.00021107219303366411, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.00025849877151116736, + "loss": 0.0224, "step": 54840 }, { - "epoch": 0.59, - "learning_rate": 0.0002110559771680612, - "loss": 0.0178, + "epoch": 0.28, + "learning_rate": 0.00025849120381815334, + "loss": 0.0289, "step": 54850 }, { - "epoch": 0.59, - "learning_rate": 0.00021103976130245833, - "loss": 0.0164, + "epoch": 0.28, + "learning_rate": 0.0002584836361251393, + "loss": 0.0304, "step": 54860 }, { - "epoch": 0.59, - "learning_rate": 0.0002110235454368554, - "loss": 0.0137, + "epoch": 0.28, + "learning_rate": 0.0002584760684321253, + "loss": 0.0211, "step": 54870 }, { - "epoch": 0.59, - "learning_rate": 0.00021100732957125248, - "loss": 0.0156, + "epoch": 0.28, + "learning_rate": 0.00025846850073911134, + "loss": 0.0244, "step": 54880 }, { - "epoch": 0.59, - "learning_rate": 0.0002109911137056496, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.0002584609330460973, + "loss": 0.0233, "step": 54890 }, { - "epoch": 0.59, - "learning_rate": 0.0002109748978400467, - "loss": 0.0179, + "epoch": 0.28, + "learning_rate": 0.0002584533653530833, + "loss": 0.0176, "step": 54900 }, { - "epoch": 0.59, - "learning_rate": 0.00021095868197444376, - "loss": 0.0172, + "epoch": 0.28, + "learning_rate": 0.0002584457976600693, + "loss": 0.019, "step": 54910 }, { - "epoch": 0.59, - "learning_rate": 0.00021094246610884086, - "loss": 0.0175, + "epoch": 0.28, + "learning_rate": 0.00025843822996705527, + "loss": 0.0249, "step": 54920 }, { - "epoch": 0.59, - "learning_rate": 0.00021092625024323798, - "loss": 0.0188, + "epoch": 0.28, + "learning_rate": 0.00025843066227404125, + "loss": 0.0194, "step": 54930 }, { - "epoch": 0.59, - "learning_rate": 0.00021091003437763507, - "loss": 0.013, + "epoch": 0.28, + "learning_rate": 0.00025842309458102723, + "loss": 0.0208, "step": 54940 }, { - "epoch": 0.59, - "learning_rate": 0.00021089381851203213, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.00025841552688801327, + "loss": 0.0183, "step": 54950 }, { - "epoch": 0.59, - "learning_rate": 0.00021087760264642925, - "loss": 0.0192, + "epoch": 0.28, + "learning_rate": 0.00025840795919499925, + "loss": 0.0209, "step": 54960 }, { - "epoch": 0.59, - "learning_rate": 0.00021086138678082635, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.00025840039150198523, + "loss": 0.0214, "step": 54970 }, { - "epoch": 0.59, - "learning_rate": 0.00021084517091522344, - "loss": 0.017, + "epoch": 0.28, + "learning_rate": 0.0002583928238089712, + "loss": 0.0222, "step": 54980 }, { - "epoch": 0.59, - "learning_rate": 0.0002108289550496205, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.0002583852561159572, + "loss": 0.0208, "step": 54990 }, { - "epoch": 0.59, - "learning_rate": 0.00021081273918401762, - "loss": 0.0145, + "epoch": 0.28, + "learning_rate": 0.0002583776884229432, + "loss": 0.0218, "step": 55000 }, { - "epoch": 0.59, - "eval_cer": 0.9215616786273294, - "eval_loss": 0.011711681261658669, - "eval_runtime": 121.4424, - "eval_samples_per_second": 16.469, - "eval_steps_per_second": 4.117, + "epoch": 0.28, + "eval_cer": 0.914472196695413, + "eval_loss": 0.014595328830182552, + "eval_runtime": 116.9041, + "eval_samples_per_second": 17.108, + "eval_steps_per_second": 4.277, "step": 55000 }, { - "epoch": 0.59, - "learning_rate": 0.00021079652331841472, - "loss": 0.0172, + "epoch": 0.28, + "learning_rate": 0.0002583701207299292, + "loss": 0.019, "step": 55010 }, { - "epoch": 0.59, - "learning_rate": 0.00021078030745281184, - "loss": 0.0183, + "epoch": 0.28, + "learning_rate": 0.0002583625530369152, + "loss": 0.0263, "step": 55020 }, { - "epoch": 0.59, - "learning_rate": 0.0002107640915872089, - "loss": 0.0169, + "epoch": 0.28, + "learning_rate": 0.00025835498534390117, + "loss": 0.0244, "step": 55030 }, { - "epoch": 0.6, - "learning_rate": 0.000210747875721606, - "loss": 0.0184, + "epoch": 0.28, + "learning_rate": 0.00025834741765088715, + "loss": 0.0189, "step": 55040 }, { - "epoch": 0.6, - "learning_rate": 0.0002107316598560031, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.00025833984995787313, + "loss": 0.0207, "step": 55050 }, { - "epoch": 0.6, - "learning_rate": 0.0002107154439904002, - "loss": 0.0207, + "epoch": 0.28, + "learning_rate": 0.0002583322822648591, + "loss": 0.0205, "step": 55060 }, { - "epoch": 0.6, - "learning_rate": 0.00021069922812479727, - "loss": 0.0196, + "epoch": 0.28, + "learning_rate": 0.00025832471457184515, + "loss": 0.0225, "step": 55070 }, { - "epoch": 0.6, - "learning_rate": 0.00021068301225919437, - "loss": 0.0197, + "epoch": 0.28, + "learning_rate": 0.00025831714687883113, + "loss": 0.0212, "step": 55080 }, { - "epoch": 0.6, - "learning_rate": 0.0002106667963935915, - "loss": 0.0178, + "epoch": 0.28, + "learning_rate": 0.0002583095791858171, + "loss": 0.0208, "step": 55090 }, { - "epoch": 0.6, - "learning_rate": 0.00021065058052798858, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.0002583020114928031, + "loss": 0.0224, "step": 55100 }, { - "epoch": 0.6, - "learning_rate": 0.00021063436466238565, - "loss": 0.0175, + "epoch": 0.28, + "learning_rate": 0.0002582944437997891, + "loss": 0.0239, "step": 55110 }, { - "epoch": 0.6, - "learning_rate": 0.00021061814879678274, - "loss": 0.018, + "epoch": 0.28, + "learning_rate": 0.00025828687610677506, + "loss": 0.0173, "step": 55120 }, { - "epoch": 0.6, - "learning_rate": 0.00021060193293117986, - "loss": 0.0159, + "epoch": 0.28, + "learning_rate": 0.00025827930841376104, + "loss": 0.0308, "step": 55130 }, { - "epoch": 0.6, - "learning_rate": 0.00021058571706557695, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.0002582717407207471, + "loss": 0.0244, "step": 55140 }, { - "epoch": 0.6, - "learning_rate": 0.00021056950119997402, - "loss": 0.015, + "epoch": 0.28, + "learning_rate": 0.00025826417302773306, + "loss": 0.0239, "step": 55150 }, { - "epoch": 0.6, - "learning_rate": 0.00021055328533437114, - "loss": 0.019, + "epoch": 0.28, + "learning_rate": 0.00025825660533471904, + "loss": 0.025, "step": 55160 }, { - "epoch": 0.6, - "learning_rate": 0.00021053706946876823, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.000258249037641705, + "loss": 0.0309, "step": 55170 }, { - "epoch": 0.6, - "learning_rate": 0.00021052085360316532, - "loss": 0.0205, + "epoch": 0.28, + "learning_rate": 0.000258241469948691, + "loss": 0.024, "step": 55180 }, { - "epoch": 0.6, - "learning_rate": 0.0002105046377375624, - "loss": 0.0164, + "epoch": 0.28, + "learning_rate": 0.000258233902255677, + "loss": 0.0204, "step": 55190 }, { - "epoch": 0.6, - "learning_rate": 0.0002104884218719595, - "loss": 0.0151, + "epoch": 0.28, + "learning_rate": 0.000258226334562663, + "loss": 0.0193, "step": 55200 }, { - "epoch": 0.6, - "learning_rate": 0.0002104722060063566, - "loss": 0.0191, + "epoch": 0.28, + "learning_rate": 0.000258218766869649, + "loss": 0.0225, "step": 55210 }, { - "epoch": 0.6, - "learning_rate": 0.0002104559901407537, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.000258211199176635, + "loss": 0.02, "step": 55220 }, { - "epoch": 0.6, - "learning_rate": 0.00021043977427515079, - "loss": 0.0248, + "epoch": 0.28, + "learning_rate": 0.00025820363148362096, + "loss": 0.0266, "step": 55230 }, { - "epoch": 0.6, - "learning_rate": 0.00021042355840954788, - "loss": 0.019, + "epoch": 0.28, + "learning_rate": 0.00025819606379060694, + "loss": 0.0234, "step": 55240 }, { - "epoch": 0.6, - "learning_rate": 0.00021040734254394497, - "loss": 0.0193, + "epoch": 0.28, + "learning_rate": 0.0002581884960975929, + "loss": 0.0198, "step": 55250 }, { - "epoch": 0.6, - "learning_rate": 0.0002103911266783421, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.00025818092840457896, + "loss": 0.0241, "step": 55260 }, { - "epoch": 0.6, - "learning_rate": 0.00021037491081273916, - "loss": 0.0193, + "epoch": 0.28, + "learning_rate": 0.00025817336071156494, + "loss": 0.0204, "step": 55270 }, { - "epoch": 0.6, - "learning_rate": 0.00021035869494713625, - "loss": 0.017, + "epoch": 0.28, + "learning_rate": 0.0002581657930185509, + "loss": 0.0225, "step": 55280 }, { - "epoch": 0.6, - "learning_rate": 0.00021034247908153334, - "loss": 0.0196, + "epoch": 0.28, + "learning_rate": 0.0002581582253255369, + "loss": 0.0206, "step": 55290 }, { - "epoch": 0.6, - "learning_rate": 0.00021032626321593046, - "loss": 0.0167, + "epoch": 0.28, + "learning_rate": 0.0002581506576325229, + "loss": 0.0208, "step": 55300 }, { - "epoch": 0.6, - "learning_rate": 0.00021031004735032753, - "loss": 0.0176, + "epoch": 0.28, + "learning_rate": 0.00025814308993950887, + "loss": 0.0211, "step": 55310 }, { - "epoch": 0.6, - "learning_rate": 0.00021029383148472462, - "loss": 0.0206, + "epoch": 0.28, + "learning_rate": 0.00025813552224649485, + "loss": 0.0247, "step": 55320 }, { - "epoch": 0.6, - "learning_rate": 0.00021027761561912174, - "loss": 0.0334, + "epoch": 0.28, + "learning_rate": 0.0002581279545534809, + "loss": 0.0197, "step": 55330 }, { - "epoch": 0.6, - "learning_rate": 0.00021026139975351883, - "loss": 0.0188, + "epoch": 0.28, + "learning_rate": 0.00025812038686046687, + "loss": 0.0199, "step": 55340 }, { - "epoch": 0.6, - "learning_rate": 0.0002102451838879159, - "loss": 0.0157, + "epoch": 0.28, + "learning_rate": 0.00025811281916745285, + "loss": 0.0182, "step": 55350 }, { - "epoch": 0.6, - "learning_rate": 0.00021022896802231302, - "loss": 0.0189, + "epoch": 0.28, + "learning_rate": 0.00025810525147443883, + "loss": 0.0203, "step": 55360 }, { - "epoch": 0.6, - "learning_rate": 0.0002102127521567101, - "loss": 0.0183, + "epoch": 0.28, + "learning_rate": 0.0002580976837814248, + "loss": 0.018, "step": 55370 }, { - "epoch": 0.6, - "learning_rate": 0.0002101965362911072, - "loss": 0.0206, + "epoch": 0.28, + "learning_rate": 0.0002580901160884108, + "loss": 0.0194, "step": 55380 }, { - "epoch": 0.6, - "learning_rate": 0.00021018032042550432, - "loss": 0.02, + "epoch": 0.28, + "learning_rate": 0.00025808254839539683, + "loss": 0.0196, "step": 55390 }, { - "epoch": 0.6, - "learning_rate": 0.0002101641045599014, - "loss": 0.0156, + "epoch": 0.28, + "learning_rate": 0.0002580749807023828, + "loss": 0.0212, "step": 55400 }, { - "epoch": 0.6, - "learning_rate": 0.00021014788869429848, - "loss": 0.0167, + "epoch": 0.28, + "learning_rate": 0.0002580674130093688, + "loss": 0.025, "step": 55410 }, { - "epoch": 0.6, - "learning_rate": 0.00021013167282869557, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.0002580598453163548, + "loss": 0.0202, "step": 55420 }, { - "epoch": 0.6, - "learning_rate": 0.0002101154569630927, - "loss": 0.0151, + "epoch": 0.28, + "learning_rate": 0.00025805227762334075, + "loss": 0.0212, "step": 55430 }, { - "epoch": 0.6, - "learning_rate": 0.00021009924109748976, - "loss": 0.0168, + "epoch": 0.28, + "learning_rate": 0.00025804470993032674, + "loss": 0.0207, "step": 55440 }, { - "epoch": 0.6, - "learning_rate": 0.00021008302523188685, - "loss": 0.0158, + "epoch": 0.28, + "learning_rate": 0.0002580371422373127, + "loss": 0.0199, "step": 55450 }, { - "epoch": 0.6, - "learning_rate": 0.00021006680936628397, - "loss": 0.0168, + "epoch": 0.28, + "learning_rate": 0.00025802957454429875, + "loss": 0.0186, "step": 55460 }, { - "epoch": 0.6, - "learning_rate": 0.00021005059350068107, - "loss": 0.0177, + "epoch": 0.28, + "learning_rate": 0.00025802200685128473, + "loss": 0.0188, "step": 55470 }, { - "epoch": 0.6, - "learning_rate": 0.00021003437763507813, - "loss": 0.0176, + "epoch": 0.28, + "learning_rate": 0.0002580144391582707, + "loss": 0.0219, "step": 55480 }, { - "epoch": 0.6, - "learning_rate": 0.00021001816176947522, - "loss": 0.0175, + "epoch": 0.28, + "learning_rate": 0.0002580068714652567, + "loss": 0.0261, "step": 55490 }, { - "epoch": 0.6, - "learning_rate": 0.00021000194590387234, - "loss": 0.0157, + "epoch": 0.28, + "learning_rate": 0.0002579993037722427, + "loss": 0.0177, "step": 55500 }, { - "epoch": 0.6, - "learning_rate": 0.00020998573003826944, - "loss": 0.0178, + "epoch": 0.28, + "learning_rate": 0.00025799173607922866, + "loss": 0.0188, "step": 55510 }, { - "epoch": 0.6, - "learning_rate": 0.0002099695141726665, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.0002579841683862147, + "loss": 0.0184, "step": 55520 }, { - "epoch": 0.6, - "learning_rate": 0.00020995329830706362, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.0002579766006932007, + "loss": 0.021, "step": 55530 }, { - "epoch": 0.6, - "learning_rate": 0.00020993708244146071, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.00025796903300018666, + "loss": 0.0221, "step": 55540 }, { - "epoch": 0.6, - "learning_rate": 0.0002099208665758578, - "loss": 0.018, + "epoch": 0.28, + "learning_rate": 0.00025796146530717264, + "loss": 0.0187, "step": 55550 }, { - "epoch": 0.6, - "learning_rate": 0.00020990465071025487, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.0002579538976141586, + "loss": 0.0187, "step": 55560 }, { - "epoch": 0.6, - "learning_rate": 0.000209888434844652, - "loss": 0.0208, + "epoch": 0.28, + "learning_rate": 0.0002579463299211446, + "loss": 0.0199, "step": 55570 }, { - "epoch": 0.6, - "learning_rate": 0.00020987221897904909, - "loss": 0.0177, + "epoch": 0.28, + "learning_rate": 0.00025793876222813064, + "loss": 0.0181, "step": 55580 }, { - "epoch": 0.6, - "learning_rate": 0.00020985600311344618, - "loss": 0.0191, + "epoch": 0.28, + "learning_rate": 0.0002579311945351166, + "loss": 0.0181, "step": 55590 }, { - "epoch": 0.6, - "learning_rate": 0.00020983978724784327, - "loss": 0.0172, + "epoch": 0.28, + "learning_rate": 0.0002579236268421026, + "loss": 0.0198, "step": 55600 }, { - "epoch": 0.6, - "learning_rate": 0.00020982357138224036, - "loss": 0.0168, + "epoch": 0.28, + "learning_rate": 0.0002579160591490886, + "loss": 0.0223, "step": 55610 }, { - "epoch": 0.6, - "learning_rate": 0.00020980735551663746, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.00025790849145607456, + "loss": 0.0208, "step": 55620 }, { - "epoch": 0.6, - "learning_rate": 0.00020979113965103458, - "loss": 0.0194, + "epoch": 0.28, + "learning_rate": 0.00025790092376306055, + "loss": 0.0192, "step": 55630 }, { - "epoch": 0.6, - "learning_rate": 0.00020977492378543164, - "loss": 0.0158, + "epoch": 0.28, + "learning_rate": 0.00025789335607004653, + "loss": 0.0182, "step": 55640 }, { - "epoch": 0.6, - "learning_rate": 0.00020975870791982873, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.00025788578837703256, + "loss": 0.0224, "step": 55650 }, { - "epoch": 0.6, - "learning_rate": 0.00020974249205422585, - "loss": 0.019, + "epoch": 0.28, + "learning_rate": 0.00025787822068401854, + "loss": 0.0204, "step": 55660 }, { - "epoch": 0.6, - "learning_rate": 0.00020972627618862295, - "loss": 0.0187, + "epoch": 0.28, + "learning_rate": 0.0002578706529910045, + "loss": 0.0186, "step": 55670 }, { - "epoch": 0.6, - "learning_rate": 0.00020971006032302, - "loss": 0.0182, + "epoch": 0.28, + "learning_rate": 0.0002578630852979905, + "loss": 0.023, "step": 55680 }, { - "epoch": 0.6, - "learning_rate": 0.0002096938444574171, - "loss": 0.0209, + "epoch": 0.28, + "learning_rate": 0.0002578555176049765, + "loss": 0.0216, "step": 55690 }, { - "epoch": 0.6, - "learning_rate": 0.00020967762859181423, - "loss": 0.02, + "epoch": 0.28, + "learning_rate": 0.00025784794991196247, + "loss": 0.0186, "step": 55700 }, { - "epoch": 0.6, - "learning_rate": 0.00020966141272621132, - "loss": 0.0182, + "epoch": 0.28, + "learning_rate": 0.0002578403822189485, + "loss": 0.0194, "step": 55710 }, { - "epoch": 0.6, - "learning_rate": 0.00020964519686060838, - "loss": 0.0164, + "epoch": 0.28, + "learning_rate": 0.0002578328145259345, + "loss": 0.0233, "step": 55720 }, { - "epoch": 0.6, - "learning_rate": 0.0002096289809950055, - "loss": 0.0171, + "epoch": 0.28, + "learning_rate": 0.00025782524683292047, + "loss": 0.0215, "step": 55730 }, { - "epoch": 0.6, - "learning_rate": 0.0002096127651294026, - "loss": 0.0181, + "epoch": 0.28, + "learning_rate": 0.00025781767913990645, + "loss": 0.0178, "step": 55740 }, { - "epoch": 0.6, - "learning_rate": 0.0002095965492637997, - "loss": 0.0159, + "epoch": 0.28, + "learning_rate": 0.00025781011144689243, + "loss": 0.0205, "step": 55750 }, { - "epoch": 0.6, - "learning_rate": 0.00020958033339819675, - "loss": 0.0156, + "epoch": 0.28, + "learning_rate": 0.0002578025437538784, + "loss": 0.0231, "step": 55760 }, { - "epoch": 0.6, - "learning_rate": 0.00020956411753259387, - "loss": 0.0193, + "epoch": 0.28, + "learning_rate": 0.00025779497606086445, + "loss": 0.0192, "step": 55770 }, { - "epoch": 0.6, - "learning_rate": 0.00020954790166699097, - "loss": 0.0182, + "epoch": 0.28, + "learning_rate": 0.00025778740836785043, + "loss": 0.0209, "step": 55780 }, { - "epoch": 0.6, - "learning_rate": 0.00020953168580138806, - "loss": 0.0183, + "epoch": 0.28, + "learning_rate": 0.0002577798406748364, + "loss": 0.0225, "step": 55790 }, { - "epoch": 0.6, - "learning_rate": 0.00020951546993578515, - "loss": 0.018, + "epoch": 0.28, + "learning_rate": 0.0002577722729818224, + "loss": 0.0188, "step": 55800 }, { - "epoch": 0.6, - "learning_rate": 0.00020949925407018225, - "loss": 0.0191, + "epoch": 0.28, + "learning_rate": 0.0002577647052888084, + "loss": 0.0206, "step": 55810 }, { - "epoch": 0.6, - "learning_rate": 0.00020948303820457934, - "loss": 0.0168, + "epoch": 0.28, + "learning_rate": 0.00025775713759579436, + "loss": 0.0156, "step": 55820 }, { - "epoch": 0.6, - "learning_rate": 0.00020946682233897646, - "loss": 0.0143, + "epoch": 0.28, + "learning_rate": 0.00025774956990278034, + "loss": 0.0205, "step": 55830 }, { - "epoch": 0.6, - "learning_rate": 0.00020945060647337352, - "loss": 0.0145, + "epoch": 0.28, + "learning_rate": 0.0002577420022097664, + "loss": 0.0191, "step": 55840 }, { - "epoch": 0.6, - "learning_rate": 0.00020943439060777062, - "loss": 0.0165, + "epoch": 0.28, + "learning_rate": 0.00025773443451675235, + "loss": 0.0242, "step": 55850 }, { - "epoch": 0.6, - "learning_rate": 0.0002094181747421677, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.00025772686682373834, + "loss": 0.0188, "step": 55860 }, { - "epoch": 0.6, - "learning_rate": 0.00020940195887656483, + "epoch": 0.28, + "learning_rate": 0.0002577192991307243, "loss": 0.0188, "step": 55870 }, { - "epoch": 0.6, - "learning_rate": 0.0002093857430109619, - "loss": 0.0178, + "epoch": 0.28, + "learning_rate": 0.0002577117314377103, + "loss": 0.0239, "step": 55880 }, { - "epoch": 0.6, - "learning_rate": 0.000209369527145359, - "loss": 0.0193, + "epoch": 0.28, + "learning_rate": 0.0002577041637446963, + "loss": 0.0209, "step": 55890 }, { - "epoch": 0.6, - "learning_rate": 0.0002093533112797561, - "loss": 0.0196, + "epoch": 0.28, + "learning_rate": 0.0002576965960516823, + "loss": 0.0239, "step": 55900 }, { - "epoch": 0.6, - "learning_rate": 0.0002093370954141532, - "loss": 0.0154, + "epoch": 0.28, + "learning_rate": 0.0002576890283586683, + "loss": 0.0183, "step": 55910 }, { - "epoch": 0.6, - "learning_rate": 0.00020932087954855027, - "loss": 0.017, + "epoch": 0.28, + "learning_rate": 0.0002576814606656543, + "loss": 0.0171, "step": 55920 }, { - "epoch": 0.6, - "learning_rate": 0.00020930466368294736, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.00025767389297264026, + "loss": 0.0187, "step": 55930 }, { - "epoch": 0.6, - "learning_rate": 0.00020928844781734448, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.00025766632527962624, + "loss": 0.0229, "step": 55940 }, { - "epoch": 0.6, - "learning_rate": 0.00020927223195174157, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.0002576587575866122, + "loss": 0.0203, "step": 55950 }, { - "epoch": 0.6, - "learning_rate": 0.00020925601608613864, - "loss": 0.0212, + "epoch": 0.28, + "learning_rate": 0.0002576511898935982, + "loss": 0.0193, "step": 55960 }, { - "epoch": 0.61, - "learning_rate": 0.00020923980022053576, - "loss": 0.0189, + "epoch": 0.28, + "learning_rate": 0.0002576436222005842, + "loss": 0.0203, "step": 55970 }, { - "epoch": 0.61, - "learning_rate": 0.00020922358435493285, - "loss": 0.0167, + "epoch": 0.28, + "learning_rate": 0.00025763605450757017, + "loss": 0.0202, "step": 55980 }, { - "epoch": 0.61, - "learning_rate": 0.00020920736848932994, - "loss": 0.0172, + "epoch": 0.28, + "learning_rate": 0.00025762848681455615, + "loss": 0.0217, "step": 55990 }, { - "epoch": 0.61, - "learning_rate": 0.000209191152623727, - "loss": 0.0148, + "epoch": 0.28, + "learning_rate": 0.0002576209191215422, + "loss": 0.0231, "step": 56000 }, { - "epoch": 0.61, - "eval_cer": 0.9215573356125475, - "eval_loss": 0.01228960882872343, - "eval_runtime": 121.224, - "eval_samples_per_second": 16.498, - "eval_steps_per_second": 4.125, + "epoch": 0.28, + "eval_cer": 0.9144886934295449, + "eval_loss": 0.014846866950392723, + "eval_runtime": 116.7024, + "eval_samples_per_second": 17.138, + "eval_steps_per_second": 4.284, "step": 56000 }, { - "epoch": 0.61, - "learning_rate": 0.00020917493675812413, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.00025761335142852817, + "loss": 0.0217, "step": 56010 }, { - "epoch": 0.61, - "learning_rate": 0.00020915872089252122, - "loss": 0.0183, + "epoch": 0.28, + "learning_rate": 0.00025760578373551415, + "loss": 0.0188, "step": 56020 }, { - "epoch": 0.61, - "learning_rate": 0.00020914250502691834, - "loss": 0.0171, + "epoch": 0.28, + "learning_rate": 0.00025759821604250013, + "loss": 0.0211, "step": 56030 }, { - "epoch": 0.61, - "learning_rate": 0.0002091262891613154, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.0002575906483494861, + "loss": 0.0206, "step": 56040 }, { - "epoch": 0.61, - "learning_rate": 0.0002091100732957125, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.0002575830806564721, + "loss": 0.0159, "step": 56050 }, { - "epoch": 0.61, - "learning_rate": 0.0002090938574301096, - "loss": 0.0181, + "epoch": 0.28, + "learning_rate": 0.0002575755129634581, + "loss": 0.0219, "step": 56060 }, { - "epoch": 0.61, - "learning_rate": 0.0002090776415645067, - "loss": 0.0169, + "epoch": 0.28, + "learning_rate": 0.0002575679452704441, + "loss": 0.0194, "step": 56070 }, { - "epoch": 0.61, - "learning_rate": 0.00020906142569890378, - "loss": 0.0175, + "epoch": 0.28, + "learning_rate": 0.0002575603775774301, + "loss": 0.0193, "step": 56080 }, { - "epoch": 0.61, - "learning_rate": 0.00020904520983330087, - "loss": 0.0202, + "epoch": 0.28, + "learning_rate": 0.00025755280988441607, + "loss": 0.0166, "step": 56090 }, { - "epoch": 0.61, - "learning_rate": 0.000209028993967698, - "loss": 0.0169, + "epoch": 0.28, + "learning_rate": 0.00025754524219140205, + "loss": 0.0205, "step": 56100 }, { - "epoch": 0.61, - "learning_rate": 0.00020901277810209508, - "loss": 0.0188, + "epoch": 0.28, + "learning_rate": 0.00025753767449838803, + "loss": 0.0187, "step": 56110 }, { - "epoch": 0.61, - "learning_rate": 0.00020899656223649217, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.000257530106805374, + "loss": 0.022, "step": 56120 }, { - "epoch": 0.61, - "learning_rate": 0.00020898034637088924, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.00025752253911236005, + "loss": 0.0186, "step": 56130 }, { - "epoch": 0.61, - "learning_rate": 0.00020896413050528636, - "loss": 0.0165, + "epoch": 0.28, + "learning_rate": 0.00025751497141934603, + "loss": 0.0186, "step": 56140 }, { - "epoch": 0.61, - "learning_rate": 0.00020894791463968345, - "loss": 0.0131, + "epoch": 0.28, + "learning_rate": 0.000257507403726332, + "loss": 0.0208, "step": 56150 }, { - "epoch": 0.61, - "learning_rate": 0.00020893169877408055, - "loss": 0.0206, + "epoch": 0.28, + "learning_rate": 0.000257499836033318, + "loss": 0.0181, "step": 56160 }, { - "epoch": 0.61, - "learning_rate": 0.00020891548290847764, - "loss": 0.0126, + "epoch": 0.28, + "learning_rate": 0.000257492268340304, + "loss": 0.021, "step": 56170 }, { - "epoch": 0.61, - "learning_rate": 0.00020889926704287473, - "loss": 0.016, + "epoch": 0.28, + "learning_rate": 0.00025748470064728996, + "loss": 0.0231, "step": 56180 }, { - "epoch": 0.61, - "learning_rate": 0.00020888305117727182, - "loss": 0.016, + "epoch": 0.28, + "learning_rate": 0.00025747713295427594, + "loss": 0.0215, "step": 56190 }, { - "epoch": 0.61, - "learning_rate": 0.00020886683531166894, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.000257469565261262, + "loss": 0.0171, "step": 56200 }, { - "epoch": 0.61, - "learning_rate": 0.000208850619446066, - "loss": 0.019, + "epoch": 0.28, + "learning_rate": 0.00025746199756824796, + "loss": 0.0192, "step": 56210 }, { - "epoch": 0.61, - "learning_rate": 0.0002088344035804631, - "loss": 0.0191, + "epoch": 0.28, + "learning_rate": 0.00025745442987523394, + "loss": 0.0196, "step": 56220 }, { - "epoch": 0.61, - "learning_rate": 0.0002088181877148602, - "loss": 0.0148, + "epoch": 0.28, + "learning_rate": 0.0002574468621822199, + "loss": 0.0239, "step": 56230 }, { - "epoch": 0.61, - "learning_rate": 0.00020880197184925731, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.0002574392944892059, + "loss": 0.0216, "step": 56240 }, { - "epoch": 0.61, - "learning_rate": 0.00020878575598365438, - "loss": 0.0178, + "epoch": 0.28, + "learning_rate": 0.0002574317267961919, + "loss": 0.0229, "step": 56250 }, { - "epoch": 0.61, - "learning_rate": 0.00020876954011805147, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.0002574241591031779, + "loss": 0.0239, "step": 56260 }, { - "epoch": 0.61, - "learning_rate": 0.0002087533242524486, - "loss": 0.0201, + "epoch": 0.28, + "learning_rate": 0.0002574165914101639, + "loss": 0.0189, "step": 56270 }, { - "epoch": 0.61, - "learning_rate": 0.00020873710838684569, - "loss": 0.0167, + "epoch": 0.28, + "learning_rate": 0.0002574090237171499, + "loss": 0.0235, "step": 56280 }, { - "epoch": 0.61, - "learning_rate": 0.00020872089252124275, - "loss": 0.0192, + "epoch": 0.28, + "learning_rate": 0.00025740145602413586, + "loss": 0.0223, "step": 56290 }, { - "epoch": 0.61, - "learning_rate": 0.00020870467665563984, - "loss": 0.0156, + "epoch": 0.28, + "learning_rate": 0.00025739388833112184, + "loss": 0.0204, "step": 56300 }, { - "epoch": 0.61, - "learning_rate": 0.00020868846079003696, - "loss": 0.0178, + "epoch": 0.28, + "learning_rate": 0.0002573863206381078, + "loss": 0.0243, "step": 56310 }, { - "epoch": 0.61, - "learning_rate": 0.00020867224492443406, - "loss": 0.018, + "epoch": 0.28, + "learning_rate": 0.00025737875294509386, + "loss": 0.0205, "step": 56320 }, { - "epoch": 0.61, - "learning_rate": 0.00020865602905883112, - "loss": 0.0135, + "epoch": 0.28, + "learning_rate": 0.00025737118525207984, + "loss": 0.0221, "step": 56330 }, { - "epoch": 0.61, - "learning_rate": 0.00020863981319322824, - "loss": 0.0181, + "epoch": 0.28, + "learning_rate": 0.0002573636175590658, + "loss": 0.0257, "step": 56340 }, { - "epoch": 0.61, - "learning_rate": 0.00020862359732762534, - "loss": 0.0189, + "epoch": 0.28, + "learning_rate": 0.0002573560498660518, + "loss": 0.0195, "step": 56350 }, { - "epoch": 0.61, - "learning_rate": 0.00020860738146202243, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.0002573484821730378, + "loss": 0.0186, "step": 56360 }, { - "epoch": 0.61, - "learning_rate": 0.00020859116559641952, - "loss": 0.0185, + "epoch": 0.28, + "learning_rate": 0.00025734091448002377, + "loss": 0.0191, "step": 56370 }, { - "epoch": 0.61, - "learning_rate": 0.0002085749497308166, - "loss": 0.0138, + "epoch": 0.28, + "learning_rate": 0.00025733334678700975, + "loss": 0.02, "step": 56380 }, { - "epoch": 0.61, - "learning_rate": 0.0002085587338652137, - "loss": 0.0165, + "epoch": 0.28, + "learning_rate": 0.0002573257790939958, + "loss": 0.0203, "step": 56390 }, { - "epoch": 0.61, - "learning_rate": 0.00020854251799961083, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.00025731821140098177, + "loss": 0.0212, "step": 56400 }, { - "epoch": 0.61, - "learning_rate": 0.0002085263021340079, - "loss": 0.0185, + "epoch": 0.28, + "learning_rate": 0.00025731064370796775, + "loss": 0.0216, "step": 56410 }, { - "epoch": 0.61, - "learning_rate": 0.00020851008626840498, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.00025730307601495373, + "loss": 0.0271, "step": 56420 }, { - "epoch": 0.61, - "learning_rate": 0.00020849387040280208, - "loss": 0.0155, + "epoch": 0.28, + "learning_rate": 0.0002572955083219397, + "loss": 0.0196, "step": 56430 }, { - "epoch": 0.61, - "learning_rate": 0.0002084776545371992, - "loss": 0.019, + "epoch": 0.28, + "learning_rate": 0.0002572879406289257, + "loss": 0.0235, "step": 56440 }, { - "epoch": 0.61, - "learning_rate": 0.00020846143867159626, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.00025728037293591173, + "loss": 0.0213, "step": 56450 }, { - "epoch": 0.61, - "learning_rate": 0.00020844522280599336, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.0002572728052428977, + "loss": 0.037, "step": 56460 }, { - "epoch": 0.61, - "learning_rate": 0.00020842900694039048, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.0002572652375498837, + "loss": 0.0182, "step": 56470 }, { - "epoch": 0.61, - "learning_rate": 0.00020841279107478757, - "loss": 0.0185, + "epoch": 0.28, + "learning_rate": 0.0002572576698568697, + "loss": 0.0186, "step": 56480 }, { - "epoch": 0.61, - "learning_rate": 0.00020839657520918463, - "loss": 0.016, + "epoch": 0.28, + "learning_rate": 0.00025725010216385565, + "loss": 0.0186, "step": 56490 }, { - "epoch": 0.61, - "learning_rate": 0.00020838035934358173, - "loss": 0.0161, + "epoch": 0.29, + "learning_rate": 0.00025724253447084164, + "loss": 0.0252, "step": 56500 }, { - "epoch": 0.61, - "learning_rate": 0.00020836414347797885, - "loss": 0.0233, + "epoch": 0.29, + "learning_rate": 0.0002572349667778276, + "loss": 0.0242, "step": 56510 }, { - "epoch": 0.61, - "learning_rate": 0.00020834792761237594, - "loss": 0.0176, + "epoch": 0.29, + "learning_rate": 0.00025722739908481365, + "loss": 0.0204, "step": 56520 }, { - "epoch": 0.61, - "learning_rate": 0.000208331711746773, - "loss": 0.0177, + "epoch": 0.29, + "learning_rate": 0.00025721983139179963, + "loss": 0.0236, "step": 56530 }, { - "epoch": 0.61, - "learning_rate": 0.00020831549588117012, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.0002572122636987856, + "loss": 0.0248, "step": 56540 }, { - "epoch": 0.61, - "learning_rate": 0.00020829928001556722, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.0002572046960057716, + "loss": 0.0227, "step": 56550 }, { - "epoch": 0.61, - "learning_rate": 0.0002082830641499643, - "loss": 0.0143, + "epoch": 0.29, + "learning_rate": 0.0002571971283127576, + "loss": 0.0206, "step": 56560 }, { - "epoch": 0.61, - "learning_rate": 0.00020826684828436138, - "loss": 0.0145, + "epoch": 0.29, + "learning_rate": 0.00025718956061974356, + "loss": 0.0212, "step": 56570 }, { - "epoch": 0.61, - "learning_rate": 0.0002082506324187585, - "loss": 0.0178, + "epoch": 0.29, + "learning_rate": 0.0002571819929267296, + "loss": 0.0183, "step": 56580 }, { - "epoch": 0.61, - "learning_rate": 0.0002082344165531556, - "loss": 0.0209, + "epoch": 0.29, + "learning_rate": 0.0002571744252337156, + "loss": 0.0237, "step": 56590 }, { - "epoch": 0.61, - "learning_rate": 0.00020821820068755268, - "loss": 0.016, + "epoch": 0.29, + "learning_rate": 0.00025716685754070156, + "loss": 0.0188, "step": 56600 }, { - "epoch": 0.61, - "learning_rate": 0.00020820198482194977, - "loss": 0.0178, + "epoch": 0.29, + "learning_rate": 0.00025715928984768754, + "loss": 0.0202, "step": 56610 }, { - "epoch": 0.61, - "learning_rate": 0.00020818576895634687, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.0002571517221546735, + "loss": 0.02, "step": 56620 }, { - "epoch": 0.61, - "learning_rate": 0.00020816955309074396, - "loss": 0.0179, + "epoch": 0.29, + "learning_rate": 0.0002571441544616595, + "loss": 0.0222, "step": 56630 }, { - "epoch": 0.61, - "learning_rate": 0.00020815333722514108, - "loss": 0.019, + "epoch": 0.29, + "learning_rate": 0.00025713658676864554, + "loss": 0.0181, "step": 56640 }, { - "epoch": 0.61, - "learning_rate": 0.00020813712135953814, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.0002571290190756315, + "loss": 0.0193, "step": 56650 }, { - "epoch": 0.61, - "learning_rate": 0.00020812090549393524, - "loss": 0.0187, + "epoch": 0.29, + "learning_rate": 0.0002571214513826175, + "loss": 0.0206, "step": 56660 }, { - "epoch": 0.61, - "learning_rate": 0.00020810468962833236, - "loss": 0.0156, + "epoch": 0.29, + "learning_rate": 0.0002571138836896035, + "loss": 0.0208, "step": 56670 }, { - "epoch": 0.61, - "learning_rate": 0.00020808847376272945, - "loss": 0.017, + "epoch": 0.29, + "learning_rate": 0.00025710631599658946, + "loss": 0.0205, "step": 56680 }, { - "epoch": 0.61, - "learning_rate": 0.00020807225789712652, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.00025709874830357545, + "loss": 0.0229, "step": 56690 }, { - "epoch": 0.61, - "learning_rate": 0.0002080560420315236, - "loss": 0.0163, + "epoch": 0.29, + "learning_rate": 0.00025709118061056143, + "loss": 0.0234, "step": 56700 }, { - "epoch": 0.61, - "learning_rate": 0.00020803982616592073, - "loss": 0.0158, + "epoch": 0.29, + "learning_rate": 0.00025708361291754746, + "loss": 0.027, "step": 56710 }, { - "epoch": 0.61, - "learning_rate": 0.00020802361030031782, - "loss": 0.0167, + "epoch": 0.29, + "learning_rate": 0.00025707604522453344, + "loss": 0.0241, "step": 56720 }, { - "epoch": 0.61, - "learning_rate": 0.0002080073944347149, - "loss": 0.0173, + "epoch": 0.29, + "learning_rate": 0.0002570684775315194, + "loss": 0.0194, "step": 56730 }, { - "epoch": 0.61, - "learning_rate": 0.000207991178569112, - "loss": 0.0188, + "epoch": 0.29, + "learning_rate": 0.0002570609098385054, + "loss": 0.0168, "step": 56740 }, { - "epoch": 0.61, - "learning_rate": 0.0002079749627035091, - "loss": 0.0181, + "epoch": 0.29, + "learning_rate": 0.0002570533421454914, + "loss": 0.0177, "step": 56750 }, { - "epoch": 0.61, - "learning_rate": 0.0002079587468379062, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.00025704577445247737, + "loss": 0.0176, "step": 56760 }, { - "epoch": 0.61, - "learning_rate": 0.00020794253097230326, - "loss": 0.0176, + "epoch": 0.29, + "learning_rate": 0.0002570382067594634, + "loss": 0.0233, "step": 56770 }, { - "epoch": 0.61, - "learning_rate": 0.00020792631510670038, - "loss": 0.012, + "epoch": 0.29, + "learning_rate": 0.0002570306390664494, + "loss": 0.0194, "step": 56780 }, { - "epoch": 0.61, - "learning_rate": 0.00020791009924109747, - "loss": 0.0172, + "epoch": 0.29, + "learning_rate": 0.00025702307137343537, + "loss": 0.0209, "step": 56790 }, { - "epoch": 0.61, - "learning_rate": 0.00020789388337549456, - "loss": 0.0146, + "epoch": 0.29, + "learning_rate": 0.00025701550368042135, + "loss": 0.0257, "step": 56800 }, { - "epoch": 0.61, - "learning_rate": 0.00020787766750989166, - "loss": 0.0138, + "epoch": 0.29, + "learning_rate": 0.00025700793598740733, + "loss": 0.0195, "step": 56810 }, { - "epoch": 0.61, - "learning_rate": 0.00020786145164428875, - "loss": 0.0176, + "epoch": 0.29, + "learning_rate": 0.0002570003682943933, + "loss": 0.0198, "step": 56820 }, { - "epoch": 0.61, - "learning_rate": 0.00020784523577868584, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.00025699280060137935, + "loss": 0.0229, "step": 56830 }, { - "epoch": 0.61, - "learning_rate": 0.00020782901991308296, - "loss": 0.0151, + "epoch": 0.29, + "learning_rate": 0.00025698523290836533, + "loss": 0.0193, "step": 56840 }, { - "epoch": 0.61, - "learning_rate": 0.00020781280404748005, - "loss": 0.0171, + "epoch": 0.29, + "learning_rate": 0.0002569776652153513, + "loss": 0.0187, "step": 56850 }, { - "epoch": 0.61, - "learning_rate": 0.00020779658818187712, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.0002569700975223373, + "loss": 0.0213, "step": 56860 }, { - "epoch": 0.61, - "learning_rate": 0.0002077803723162742, - "loss": 0.0163, + "epoch": 0.29, + "learning_rate": 0.0002569625298293233, + "loss": 0.0171, "step": 56870 }, { - "epoch": 0.61, - "learning_rate": 0.00020776415645067133, - "loss": 0.0212, + "epoch": 0.29, + "learning_rate": 0.00025695496213630926, + "loss": 0.0196, "step": 56880 }, { - "epoch": 0.62, - "learning_rate": 0.00020774794058506842, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.00025694739444329524, + "loss": 0.017, "step": 56890 }, { - "epoch": 0.62, - "learning_rate": 0.0002077317247194655, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.0002569398267502813, + "loss": 0.0427, "step": 56900 }, { - "epoch": 0.62, - "learning_rate": 0.0002077155088538626, - "loss": 0.0173, + "epoch": 0.29, + "learning_rate": 0.00025693225905726725, + "loss": 0.0221, "step": 56910 }, { - "epoch": 0.62, - "learning_rate": 0.0002076992929882597, - "loss": 0.0177, + "epoch": 0.29, + "learning_rate": 0.00025692469136425324, + "loss": 0.0206, "step": 56920 }, { - "epoch": 0.62, - "learning_rate": 0.0002076830771226568, - "loss": 0.0133, + "epoch": 0.29, + "learning_rate": 0.0002569171236712392, + "loss": 0.03, "step": 56930 }, { - "epoch": 0.62, - "learning_rate": 0.00020766686125705386, - "loss": 0.0188, + "epoch": 0.29, + "learning_rate": 0.0002569095559782252, + "loss": 0.02, "step": 56940 }, { - "epoch": 0.62, - "learning_rate": 0.00020765064539145098, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.0002569019882852112, + "loss": 0.0199, "step": 56950 }, { - "epoch": 0.62, - "learning_rate": 0.00020763442952584807, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.0002568944205921972, + "loss": 0.0206, "step": 56960 }, { - "epoch": 0.62, - "learning_rate": 0.0002076182136602452, - "loss": 0.0166, + "epoch": 0.29, + "learning_rate": 0.0002568868528991832, + "loss": 0.022, "step": 56970 }, { - "epoch": 0.62, - "learning_rate": 0.00020760199779464226, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.0002568792852061692, + "loss": 0.028, "step": 56980 }, { - "epoch": 0.62, - "learning_rate": 0.00020758578192903935, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.00025687171751315516, + "loss": 0.0209, "step": 56990 }, { - "epoch": 0.62, - "learning_rate": 0.00020756956606343644, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.00025686414982014114, + "loss": 0.0217, "step": 57000 }, { - "epoch": 0.62, - "eval_cer": 0.9215564670095912, - "eval_loss": 0.01153921615332365, - "eval_runtime": 121.3157, - "eval_samples_per_second": 16.486, - "eval_steps_per_second": 4.121, + "epoch": 0.29, + "eval_cer": 0.9144644335264098, + "eval_loss": 0.014634103514254093, + "eval_runtime": 116.5702, + "eval_samples_per_second": 17.157, + "eval_steps_per_second": 4.289, "step": 57000 }, { - "epoch": 0.62, - "learning_rate": 0.00020755335019783356, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.0002568565821271271, + "loss": 0.0183, "step": 57010 }, { - "epoch": 0.62, - "learning_rate": 0.00020753713433223063, - "loss": 0.0172, + "epoch": 0.29, + "learning_rate": 0.0002568490144341131, + "loss": 0.0169, "step": 57020 }, { - "epoch": 0.62, - "learning_rate": 0.00020752091846662772, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.00025684144674109914, + "loss": 0.0273, "step": 57030 }, { - "epoch": 0.62, - "learning_rate": 0.00020750470260102484, - "loss": 0.0174, + "epoch": 0.29, + "learning_rate": 0.0002568338790480851, + "loss": 0.0249, "step": 57040 }, { - "epoch": 0.62, - "learning_rate": 0.00020748848673542194, - "loss": 0.0205, + "epoch": 0.29, + "learning_rate": 0.0002568263113550711, + "loss": 0.0195, "step": 57050 }, { - "epoch": 0.62, - "learning_rate": 0.000207472270869819, - "loss": 0.017, + "epoch": 0.29, + "learning_rate": 0.0002568187436620571, + "loss": 0.0171, "step": 57060 }, { - "epoch": 0.62, - "learning_rate": 0.0002074560550042161, - "loss": 0.0206, + "epoch": 0.29, + "learning_rate": 0.00025681117596904307, + "loss": 0.0186, "step": 57070 }, { - "epoch": 0.62, - "learning_rate": 0.00020743983913861321, - "loss": 0.0182, + "epoch": 0.29, + "learning_rate": 0.00025680360827602905, + "loss": 0.0236, "step": 57080 }, { - "epoch": 0.62, - "learning_rate": 0.0002074236232730103, - "loss": 0.0161, + "epoch": 0.29, + "learning_rate": 0.0002567960405830151, + "loss": 0.019, "step": 57090 }, { - "epoch": 0.62, - "learning_rate": 0.00020740740740740737, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.00025678847289000106, + "loss": 0.0243, "step": 57100 }, { - "epoch": 0.62, - "learning_rate": 0.0002073911915418045, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.00025678090519698705, + "loss": 0.0207, "step": 57110 }, { - "epoch": 0.62, - "learning_rate": 0.00020737497567620158, - "loss": 0.0175, + "epoch": 0.29, + "learning_rate": 0.00025677333750397303, + "loss": 0.0199, "step": 57120 }, { - "epoch": 0.62, - "learning_rate": 0.00020735875981059868, - "loss": 0.0142, + "epoch": 0.29, + "learning_rate": 0.000256765769810959, + "loss": 0.0218, "step": 57130 }, { - "epoch": 0.62, - "learning_rate": 0.00020734254394499574, - "loss": 0.0206, + "epoch": 0.29, + "learning_rate": 0.000256758202117945, + "loss": 0.0233, "step": 57140 }, { - "epoch": 0.62, - "learning_rate": 0.00020732632807939286, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.000256750634424931, + "loss": 0.0202, "step": 57150 }, { - "epoch": 0.62, - "learning_rate": 0.00020731011221378996, - "loss": 0.0148, + "epoch": 0.29, + "learning_rate": 0.000256743066731917, + "loss": 0.0222, "step": 57160 }, { - "epoch": 0.62, - "learning_rate": 0.00020729389634818705, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.000256735499038903, + "loss": 0.0229, "step": 57170 }, { - "epoch": 0.62, - "learning_rate": 0.00020727768048258414, - "loss": 0.0211, + "epoch": 0.29, + "learning_rate": 0.00025672793134588897, + "loss": 0.0185, "step": 57180 }, { - "epoch": 0.62, - "learning_rate": 0.00020726146461698123, - "loss": 0.0171, + "epoch": 0.29, + "learning_rate": 0.00025672036365287495, + "loss": 0.0251, "step": 57190 }, { - "epoch": 0.62, - "learning_rate": 0.00020724524875137833, - "loss": 0.0217, + "epoch": 0.29, + "learning_rate": 0.00025671279595986093, + "loss": 0.0174, "step": 57200 }, { - "epoch": 0.62, - "learning_rate": 0.00020722903288577545, - "loss": 0.018, + "epoch": 0.29, + "learning_rate": 0.0002567052282668469, + "loss": 0.0226, "step": 57210 }, { - "epoch": 0.62, - "learning_rate": 0.0002072128170201725, - "loss": 0.0161, + "epoch": 0.29, + "learning_rate": 0.0002566976605738329, + "loss": 0.0242, "step": 57220 }, { - "epoch": 0.62, - "learning_rate": 0.0002071966011545696, - "loss": 0.0159, + "epoch": 0.29, + "learning_rate": 0.0002566900928808189, + "loss": 0.0263, "step": 57230 }, { - "epoch": 0.62, - "learning_rate": 0.0002071803852889667, - "loss": 0.0137, + "epoch": 0.29, + "learning_rate": 0.00025668252518780486, + "loss": 0.0278, "step": 57240 }, { - "epoch": 0.62, - "learning_rate": 0.00020716416942336382, - "loss": 0.0175, + "epoch": 0.29, + "learning_rate": 0.00025667495749479084, + "loss": 0.0207, "step": 57250 }, { - "epoch": 0.62, - "learning_rate": 0.00020714795355776088, - "loss": 0.0156, + "epoch": 0.29, + "learning_rate": 0.0002566673898017769, + "loss": 0.0209, "step": 57260 }, { - "epoch": 0.62, - "learning_rate": 0.00020713173769215798, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.00025665982210876286, + "loss": 0.0188, "step": 57270 }, { - "epoch": 0.62, - "learning_rate": 0.0002071155218265551, - "loss": 0.017, + "epoch": 0.29, + "learning_rate": 0.00025665225441574884, + "loss": 0.0194, "step": 57280 }, { - "epoch": 0.62, - "learning_rate": 0.0002070993059609522, - "loss": 0.019, + "epoch": 0.29, + "learning_rate": 0.0002566446867227348, + "loss": 0.021, "step": 57290 }, { - "epoch": 0.62, - "learning_rate": 0.00020708309009534925, - "loss": 0.0185, + "epoch": 0.29, + "learning_rate": 0.0002566371190297208, + "loss": 0.0245, "step": 57300 }, { - "epoch": 0.62, - "learning_rate": 0.00020706687422974635, - "loss": 0.0205, + "epoch": 0.29, + "learning_rate": 0.0002566295513367068, + "loss": 0.0265, "step": 57310 }, { - "epoch": 0.62, - "learning_rate": 0.00020705065836414347, - "loss": 0.0177, + "epoch": 0.29, + "learning_rate": 0.0002566219836436928, + "loss": 0.0186, "step": 57320 }, { - "epoch": 0.62, - "learning_rate": 0.00020703444249854056, - "loss": 0.0226, + "epoch": 0.29, + "learning_rate": 0.0002566144159506788, + "loss": 0.0239, "step": 57330 }, { - "epoch": 0.62, - "learning_rate": 0.00020701822663293763, - "loss": 0.0184, + "epoch": 0.29, + "learning_rate": 0.0002566068482576648, + "loss": 0.0198, "step": 57340 }, { - "epoch": 0.62, - "learning_rate": 0.00020700201076733474, - "loss": 0.0142, + "epoch": 0.29, + "learning_rate": 0.00025659928056465076, + "loss": 0.0241, "step": 57350 }, { - "epoch": 0.62, - "learning_rate": 0.00020698579490173184, - "loss": 0.019, + "epoch": 0.29, + "learning_rate": 0.00025659171287163674, + "loss": 0.0189, "step": 57360 }, { - "epoch": 0.62, - "learning_rate": 0.00020696957903612893, - "loss": 0.018, + "epoch": 0.29, + "learning_rate": 0.0002565841451786227, + "loss": 0.0187, "step": 57370 }, { - "epoch": 0.62, - "learning_rate": 0.00020695336317052602, - "loss": 0.0189, + "epoch": 0.29, + "learning_rate": 0.00025657657748560876, + "loss": 0.0195, "step": 57380 }, { - "epoch": 0.62, - "learning_rate": 0.00020693714730492312, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.00025656900979259474, + "loss": 0.0241, "step": 57390 }, { - "epoch": 0.62, - "learning_rate": 0.0002069209314393202, - "loss": 0.0171, + "epoch": 0.29, + "learning_rate": 0.0002565614420995807, + "loss": 0.0166, "step": 57400 }, { - "epoch": 0.62, - "learning_rate": 0.00020690471557371733, - "loss": 0.0157, + "epoch": 0.29, + "learning_rate": 0.0002565538744065667, + "loss": 0.0163, "step": 57410 }, { - "epoch": 0.62, - "learning_rate": 0.0002068884997081144, - "loss": 0.0152, + "epoch": 0.29, + "learning_rate": 0.0002565463067135527, + "loss": 0.0186, "step": 57420 }, { - "epoch": 0.62, - "learning_rate": 0.0002068722838425115, - "loss": 0.0136, + "epoch": 0.29, + "learning_rate": 0.00025653873902053867, + "loss": 0.0186, "step": 57430 }, { - "epoch": 0.62, - "learning_rate": 0.00020685606797690858, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.00025653117132752465, + "loss": 0.0214, "step": 57440 }, { - "epoch": 0.62, - "learning_rate": 0.0002068398521113057, - "loss": 0.0197, + "epoch": 0.29, + "learning_rate": 0.0002565236036345107, + "loss": 0.0215, "step": 57450 }, { - "epoch": 0.62, - "learning_rate": 0.00020682363624570277, - "loss": 0.0151, + "epoch": 0.29, + "learning_rate": 0.00025651603594149667, + "loss": 0.0198, "step": 57460 }, { - "epoch": 0.62, - "learning_rate": 0.00020680742038009986, - "loss": 0.0182, + "epoch": 0.29, + "learning_rate": 0.00025650846824848265, + "loss": 0.0209, "step": 57470 }, { - "epoch": 0.62, - "learning_rate": 0.00020679120451449698, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.00025650090055546863, + "loss": 0.0219, "step": 57480 }, { - "epoch": 0.62, - "learning_rate": 0.00020677498864889407, - "loss": 0.0162, + "epoch": 0.29, + "learning_rate": 0.0002564933328624546, + "loss": 0.0249, "step": 57490 }, { - "epoch": 0.62, - "learning_rate": 0.00020675877278329114, - "loss": 0.0139, + "epoch": 0.29, + "learning_rate": 0.0002564857651694406, + "loss": 0.0168, "step": 57500 }, { - "epoch": 0.62, - "learning_rate": 0.00020674255691768823, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.00025647819747642663, + "loss": 0.0211, "step": 57510 }, { - "epoch": 0.62, - "learning_rate": 0.00020672634105208535, - "loss": 0.0163, + "epoch": 0.29, + "learning_rate": 0.0002564706297834126, + "loss": 0.0206, "step": 57520 }, { - "epoch": 0.62, - "learning_rate": 0.00020671012518648244, - "loss": 0.0173, + "epoch": 0.29, + "learning_rate": 0.0002564630620903986, + "loss": 0.0218, "step": 57530 }, { - "epoch": 0.62, - "learning_rate": 0.0002066939093208795, - "loss": 0.017, + "epoch": 0.29, + "learning_rate": 0.0002564554943973846, + "loss": 0.0201, "step": 57540 }, { - "epoch": 0.62, - "learning_rate": 0.00020667769345527663, - "loss": 0.0178, + "epoch": 0.29, + "learning_rate": 0.00025644792670437056, + "loss": 0.0209, "step": 57550 }, { - "epoch": 0.62, - "learning_rate": 0.00020666147758967372, - "loss": 0.0177, + "epoch": 0.29, + "learning_rate": 0.00025644035901135654, + "loss": 0.0171, "step": 57560 }, { - "epoch": 0.62, - "learning_rate": 0.0002066452617240708, - "loss": 0.014, + "epoch": 0.29, + "learning_rate": 0.00025643279131834257, + "loss": 0.0197, "step": 57570 }, { - "epoch": 0.62, - "learning_rate": 0.00020662904585846793, - "loss": 0.0195, + "epoch": 0.29, + "learning_rate": 0.00025642522362532855, + "loss": 0.0187, "step": 57580 }, { - "epoch": 0.62, - "learning_rate": 0.000206612829992865, - "loss": 0.0127, + "epoch": 0.29, + "learning_rate": 0.00025641765593231454, + "loss": 0.0191, "step": 57590 }, { - "epoch": 0.62, - "learning_rate": 0.0002065966141272621, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.0002564100882393005, + "loss": 0.0213, "step": 57600 }, { - "epoch": 0.62, - "learning_rate": 0.00020658039826165918, - "loss": 0.0159, + "epoch": 0.29, + "learning_rate": 0.0002564025205462865, + "loss": 0.0176, "step": 57610 }, { - "epoch": 0.62, - "learning_rate": 0.0002065641823960563, - "loss": 0.017, + "epoch": 0.29, + "learning_rate": 0.0002563949528532725, + "loss": 0.0206, "step": 57620 }, { - "epoch": 0.62, - "learning_rate": 0.00020654796653045337, - "loss": 0.0158, + "epoch": 0.29, + "learning_rate": 0.00025638738516025846, + "loss": 0.0181, "step": 57630 }, { - "epoch": 0.62, - "learning_rate": 0.00020653175066485046, - "loss": 0.0169, + "epoch": 0.29, + "learning_rate": 0.0002563798174672445, + "loss": 0.0229, "step": 57640 }, { - "epoch": 0.62, - "learning_rate": 0.00020651553479924758, - "loss": 0.0163, + "epoch": 0.29, + "learning_rate": 0.0002563722497742305, + "loss": 0.0235, "step": 57650 }, { - "epoch": 0.62, - "learning_rate": 0.00020649931893364467, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.00025636468208121646, + "loss": 0.0192, "step": 57660 }, { - "epoch": 0.62, - "learning_rate": 0.00020648310306804174, - "loss": 0.0188, + "epoch": 0.29, + "learning_rate": 0.00025635711438820244, + "loss": 0.017, "step": 57670 }, { - "epoch": 0.62, - "learning_rate": 0.00020646688720243886, - "loss": 0.0252, + "epoch": 0.29, + "learning_rate": 0.0002563495466951884, + "loss": 0.0178, "step": 57680 }, { - "epoch": 0.62, - "learning_rate": 0.00020645067133683595, - "loss": 0.0229, + "epoch": 0.29, + "learning_rate": 0.0002563419790021744, + "loss": 0.0167, "step": 57690 }, { - "epoch": 0.62, - "learning_rate": 0.00020643445547123305, - "loss": 0.0186, + "epoch": 0.29, + "learning_rate": 0.00025633441130916044, + "loss": 0.017, "step": 57700 }, { - "epoch": 0.62, - "learning_rate": 0.0002064182396056301, - "loss": 0.0227, + "epoch": 0.29, + "learning_rate": 0.0002563268436161464, + "loss": 0.0176, "step": 57710 }, { - "epoch": 0.62, - "learning_rate": 0.00020640202374002723, - "loss": 0.0176, + "epoch": 0.29, + "learning_rate": 0.0002563192759231324, + "loss": 0.0204, "step": 57720 }, { - "epoch": 0.62, - "learning_rate": 0.00020638580787442432, - "loss": 0.0168, + "epoch": 0.29, + "learning_rate": 0.0002563117082301184, + "loss": 0.024, "step": 57730 }, { - "epoch": 0.62, - "learning_rate": 0.00020636959200882142, - "loss": 0.0169, + "epoch": 0.29, + "learning_rate": 0.00025630414053710437, + "loss": 0.0171, "step": 57740 }, { - "epoch": 0.62, - "learning_rate": 0.0002063533761432185, - "loss": 0.0161, + "epoch": 0.29, + "learning_rate": 0.00025629657284409035, + "loss": 0.0136, "step": 57750 }, { - "epoch": 0.62, - "learning_rate": 0.0002063371602776156, - "loss": 0.0173, + "epoch": 0.29, + "learning_rate": 0.00025628900515107633, + "loss": 0.0175, "step": 57760 }, { - "epoch": 0.62, - "learning_rate": 0.0002063209444120127, - "loss": 0.0176, + "epoch": 0.29, + "learning_rate": 0.00025628143745806236, + "loss": 0.0213, "step": 57770 }, { - "epoch": 0.62, - "learning_rate": 0.00020630472854640981, - "loss": 0.0225, + "epoch": 0.29, + "learning_rate": 0.00025627386976504835, + "loss": 0.0175, "step": 57780 }, { - "epoch": 0.62, - "learning_rate": 0.00020628851268080688, - "loss": 0.0172, + "epoch": 0.29, + "learning_rate": 0.0002562663020720343, + "loss": 0.0196, "step": 57790 }, { - "epoch": 0.62, - "learning_rate": 0.00020627229681520397, - "loss": 0.0173, + "epoch": 0.29, + "learning_rate": 0.0002562587343790203, + "loss": 0.0179, "step": 57800 }, { - "epoch": 0.62, - "learning_rate": 0.00020625608094960107, - "loss": 0.0169, + "epoch": 0.29, + "learning_rate": 0.0002562511666860063, + "loss": 0.0197, "step": 57810 }, { - "epoch": 0.63, - "learning_rate": 0.00020623986508399819, - "loss": 0.0186, + "epoch": 0.29, + "learning_rate": 0.00025624359899299227, + "loss": 0.0187, "step": 57820 }, { - "epoch": 0.63, - "learning_rate": 0.00020622364921839525, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.0002562360312999783, + "loss": 0.0199, "step": 57830 }, { - "epoch": 0.63, - "learning_rate": 0.00020620743335279234, - "loss": 0.0174, + "epoch": 0.29, + "learning_rate": 0.0002562284636069643, + "loss": 0.0206, "step": 57840 }, { - "epoch": 0.63, - "learning_rate": 0.00020619121748718946, - "loss": 0.0187, + "epoch": 0.29, + "learning_rate": 0.00025622089591395027, + "loss": 0.0188, "step": 57850 }, { - "epoch": 0.63, - "learning_rate": 0.00020617500162158656, - "loss": 0.0176, + "epoch": 0.29, + "learning_rate": 0.00025621332822093625, + "loss": 0.017, "step": 57860 }, { - "epoch": 0.63, - "learning_rate": 0.00020615878575598362, - "loss": 0.0167, + "epoch": 0.29, + "learning_rate": 0.00025620576052792223, + "loss": 0.0177, "step": 57870 }, { - "epoch": 0.63, - "learning_rate": 0.00020614256989038071, - "loss": 0.0157, + "epoch": 0.29, + "learning_rate": 0.0002561981928349082, + "loss": 0.0188, "step": 57880 }, { - "epoch": 0.63, - "learning_rate": 0.00020612635402477783, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.00025619062514189425, + "loss": 0.0194, "step": 57890 }, { - "epoch": 0.63, - "learning_rate": 0.00020611013815917493, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.00025618305744888023, + "loss": 0.0226, "step": 57900 }, { - "epoch": 0.63, - "learning_rate": 0.000206093922293572, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.0002561754897558662, + "loss": 0.0199, "step": 57910 }, { - "epoch": 0.63, - "learning_rate": 0.0002060777064279691, - "loss": 0.0184, + "epoch": 0.29, + "learning_rate": 0.0002561679220628522, + "loss": 0.0172, "step": 57920 }, { - "epoch": 0.63, - "learning_rate": 0.0002060614905623662, - "loss": 0.0132, + "epoch": 0.29, + "learning_rate": 0.0002561603543698382, + "loss": 0.0197, "step": 57930 }, { - "epoch": 0.63, - "learning_rate": 0.0002060452746967633, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.00025615278667682416, + "loss": 0.0196, "step": 57940 }, { - "epoch": 0.63, - "learning_rate": 0.00020602905883116036, - "loss": 0.0151, + "epoch": 0.29, + "learning_rate": 0.00025614521898381014, + "loss": 0.0179, "step": 57950 }, { - "epoch": 0.63, - "learning_rate": 0.00020601284296555748, - "loss": 0.0182, + "epoch": 0.29, + "learning_rate": 0.0002561376512907962, + "loss": 0.0268, "step": 57960 }, { - "epoch": 0.63, - "learning_rate": 0.00020599662709995458, - "loss": 0.0175, + "epoch": 0.29, + "learning_rate": 0.00025613008359778216, + "loss": 0.0231, "step": 57970 }, { - "epoch": 0.63, - "learning_rate": 0.0002059804112343517, - "loss": 0.0189, + "epoch": 0.29, + "learning_rate": 0.00025612251590476814, + "loss": 0.0186, "step": 57980 }, { - "epoch": 0.63, - "learning_rate": 0.00020596419536874876, - "loss": 0.0142, + "epoch": 0.29, + "learning_rate": 0.0002561149482117541, + "loss": 0.0204, "step": 57990 }, { - "epoch": 0.63, - "learning_rate": 0.00020594797950314585, - "loss": 0.0182, + "epoch": 0.29, + "learning_rate": 0.0002561073805187401, + "loss": 0.019, "step": 58000 }, { - "epoch": 0.63, - "eval_cer": 0.9215660216421112, - "eval_loss": 0.011522618122398853, - "eval_runtime": 121.2413, - "eval_samples_per_second": 16.496, - "eval_steps_per_second": 4.124, + "epoch": 0.29, + "eval_cer": 0.914472196695413, + "eval_loss": 0.014296288602054119, + "eval_runtime": 116.695, + "eval_samples_per_second": 17.139, + "eval_steps_per_second": 4.285, "step": 58000 }, { - "epoch": 0.63, - "learning_rate": 0.00020593176363754295, - "loss": 0.0158, + "epoch": 0.29, + "learning_rate": 0.0002560998128257261, + "loss": 0.0212, "step": 58010 }, { - "epoch": 0.63, - "learning_rate": 0.00020591554777194007, - "loss": 0.0142, + "epoch": 0.29, + "learning_rate": 0.0002560922451327121, + "loss": 0.0204, "step": 58020 }, { - "epoch": 0.63, - "learning_rate": 0.00020589933190633713, - "loss": 0.0179, + "epoch": 0.29, + "learning_rate": 0.0002560846774396981, + "loss": 0.015, "step": 58030 }, { - "epoch": 0.63, - "learning_rate": 0.00020588311604073423, - "loss": 0.0212, + "epoch": 0.29, + "learning_rate": 0.0002560771097466841, + "loss": 0.0206, "step": 58040 }, { - "epoch": 0.63, - "learning_rate": 0.00020586690017513135, - "loss": 0.0193, + "epoch": 0.29, + "learning_rate": 0.00025606954205367006, + "loss": 0.0218, "step": 58050 }, { - "epoch": 0.63, - "learning_rate": 0.00020585068430952844, - "loss": 0.0181, + "epoch": 0.29, + "learning_rate": 0.00025606197436065604, + "loss": 0.0192, "step": 58060 }, { - "epoch": 0.63, - "learning_rate": 0.0002058344684439255, - "loss": 0.0178, + "epoch": 0.29, + "learning_rate": 0.000256054406667642, + "loss": 0.0203, "step": 58070 }, { - "epoch": 0.63, - "learning_rate": 0.0002058182525783226, - "loss": 0.0171, + "epoch": 0.29, + "learning_rate": 0.00025604683897462806, + "loss": 0.0193, "step": 58080 }, { - "epoch": 0.63, - "learning_rate": 0.00020580203671271972, - "loss": 0.0158, + "epoch": 0.29, + "learning_rate": 0.00025603927128161404, + "loss": 0.019, "step": 58090 }, { - "epoch": 0.63, - "learning_rate": 0.0002057858208471168, - "loss": 0.0198, + "epoch": 0.29, + "learning_rate": 0.0002560317035886, + "loss": 0.0174, "step": 58100 }, { - "epoch": 0.63, - "learning_rate": 0.00020576960498151387, - "loss": 0.0174, + "epoch": 0.29, + "learning_rate": 0.000256024135895586, + "loss": 0.0199, "step": 58110 }, { - "epoch": 0.63, - "learning_rate": 0.000205753389115911, - "loss": 0.0188, + "epoch": 0.29, + "learning_rate": 0.000256016568202572, + "loss": 0.02, "step": 58120 }, { - "epoch": 0.63, - "learning_rate": 0.0002057371732503081, - "loss": 0.0168, + "epoch": 0.29, + "learning_rate": 0.00025600900050955797, + "loss": 0.0179, "step": 58130 }, { - "epoch": 0.63, - "learning_rate": 0.00020572095738470518, - "loss": 0.0125, + "epoch": 0.29, + "learning_rate": 0.00025600143281654395, + "loss": 0.0192, "step": 58140 }, { - "epoch": 0.63, - "learning_rate": 0.00020570474151910225, - "loss": 0.0185, + "epoch": 0.29, + "learning_rate": 0.00025599386512353, + "loss": 0.0195, "step": 58150 }, { - "epoch": 0.63, - "learning_rate": 0.00020568852565349937, - "loss": 0.017, + "epoch": 0.29, + "learning_rate": 0.00025598629743051597, + "loss": 0.0211, "step": 58160 }, { - "epoch": 0.63, - "learning_rate": 0.00020567230978789646, - "loss": 0.0166, + "epoch": 0.29, + "learning_rate": 0.00025597872973750195, + "loss": 0.0255, "step": 58170 }, { - "epoch": 0.63, - "learning_rate": 0.00020565609392229355, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.00025597116204448793, + "loss": 0.0201, "step": 58180 }, { - "epoch": 0.63, - "learning_rate": 0.00020563987805669064, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.0002559635943514739, + "loss": 0.0198, "step": 58190 }, { - "epoch": 0.63, - "learning_rate": 0.00020562366219108774, - "loss": 0.0189, + "epoch": 0.29, + "learning_rate": 0.0002559560266584599, + "loss": 0.0187, "step": 58200 }, { - "epoch": 0.63, - "learning_rate": 0.00020560744632548483, - "loss": 0.0151, + "epoch": 0.29, + "learning_rate": 0.0002559484589654459, + "loss": 0.0221, "step": 58210 }, { - "epoch": 0.63, - "learning_rate": 0.00020559123045988195, - "loss": 0.0159, + "epoch": 0.29, + "learning_rate": 0.0002559408912724319, + "loss": 0.0192, "step": 58220 }, { - "epoch": 0.63, - "learning_rate": 0.00020557501459427901, - "loss": 0.0218, + "epoch": 0.29, + "learning_rate": 0.0002559333235794179, + "loss": 0.0217, "step": 58230 }, { - "epoch": 0.63, - "learning_rate": 0.0002055587987286761, - "loss": 0.0169, + "epoch": 0.29, + "learning_rate": 0.00025592575588640387, + "loss": 0.0174, "step": 58240 }, { - "epoch": 0.63, - "learning_rate": 0.0002055425828630732, - "loss": 0.0194, + "epoch": 0.29, + "learning_rate": 0.00025591818819338985, + "loss": 0.0188, "step": 58250 }, { - "epoch": 0.63, - "learning_rate": 0.00020552636699747032, - "loss": 0.0155, + "epoch": 0.29, + "learning_rate": 0.00025591062050037583, + "loss": 0.0195, "step": 58260 }, { - "epoch": 0.63, - "learning_rate": 0.0002055101511318674, - "loss": 0.0176, + "epoch": 0.29, + "learning_rate": 0.0002559030528073618, + "loss": 0.0199, "step": 58270 }, { - "epoch": 0.63, - "learning_rate": 0.00020549393526626448, - "loss": 0.02, + "epoch": 0.29, + "learning_rate": 0.00025589548511434785, + "loss": 0.0215, "step": 58280 }, { - "epoch": 0.63, - "learning_rate": 0.0002054777194006616, - "loss": 0.0157, + "epoch": 0.29, + "learning_rate": 0.00025588791742133383, + "loss": 0.0226, "step": 58290 }, { - "epoch": 0.63, - "learning_rate": 0.0002054615035350587, - "loss": 0.0169, + "epoch": 0.29, + "learning_rate": 0.0002558803497283198, + "loss": 0.0203, "step": 58300 }, { - "epoch": 0.63, - "learning_rate": 0.00020544528766945578, - "loss": 0.0162, + "epoch": 0.29, + "learning_rate": 0.0002558727820353058, + "loss": 0.0201, "step": 58310 }, { - "epoch": 0.63, - "learning_rate": 0.00020542907180385285, - "loss": 0.0204, + "epoch": 0.29, + "learning_rate": 0.0002558652143422918, + "loss": 0.0253, "step": 58320 }, { - "epoch": 0.63, - "learning_rate": 0.00020541285593824997, - "loss": 0.0171, + "epoch": 0.29, + "learning_rate": 0.00025585764664927776, + "loss": 0.018, "step": 58330 }, { - "epoch": 0.63, - "learning_rate": 0.00020539664007264706, - "loss": 0.0202, + "epoch": 0.29, + "learning_rate": 0.0002558500789562638, + "loss": 0.0206, "step": 58340 }, { - "epoch": 0.63, - "learning_rate": 0.00020538042420704418, - "loss": 0.0172, + "epoch": 0.29, + "learning_rate": 0.0002558425112632498, + "loss": 0.0159, "step": 58350 }, { - "epoch": 0.63, - "learning_rate": 0.00020536420834144125, - "loss": 0.0187, + "epoch": 0.29, + "learning_rate": 0.00025583494357023576, + "loss": 0.0183, "step": 58360 }, { - "epoch": 0.63, - "learning_rate": 0.00020534799247583834, - "loss": 0.0192, + "epoch": 0.29, + "learning_rate": 0.00025582737587722174, + "loss": 0.0208, "step": 58370 }, { - "epoch": 0.63, - "learning_rate": 0.00020533177661023543, - "loss": 0.0163, + "epoch": 0.29, + "learning_rate": 0.0002558198081842077, + "loss": 0.018, "step": 58380 }, { - "epoch": 0.63, - "learning_rate": 0.00020531556074463255, - "loss": 0.0167, + "epoch": 0.29, + "learning_rate": 0.0002558122404911937, + "loss": 0.0215, "step": 58390 }, { - "epoch": 0.63, - "learning_rate": 0.00020529934487902962, - "loss": 0.0162, + "epoch": 0.29, + "learning_rate": 0.00025580467279817974, + "loss": 0.0199, "step": 58400 }, { - "epoch": 0.63, - "learning_rate": 0.0002052831290134267, - "loss": 0.0178, + "epoch": 0.29, + "learning_rate": 0.0002557971051051657, + "loss": 0.0212, "step": 58410 }, { - "epoch": 0.63, - "learning_rate": 0.00020526691314782383, - "loss": 0.0158, + "epoch": 0.29, + "learning_rate": 0.0002557895374121517, + "loss": 0.0298, "step": 58420 }, { - "epoch": 0.63, - "learning_rate": 0.00020525069728222092, - "loss": 0.0168, + "epoch": 0.29, + "learning_rate": 0.0002557819697191377, + "loss": 0.0216, "step": 58430 }, { - "epoch": 0.63, - "learning_rate": 0.000205234481416618, - "loss": 0.017, + "epoch": 0.29, + "learning_rate": 0.00025577440202612366, + "loss": 0.0188, "step": 58440 }, { - "epoch": 0.63, - "learning_rate": 0.00020521826555101508, - "loss": 0.0173, + "epoch": 0.29, + "learning_rate": 0.00025576683433310964, + "loss": 0.0182, "step": 58450 }, { - "epoch": 0.63, - "learning_rate": 0.0002052020496854122, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.0002557592666400956, + "loss": 0.0166, "step": 58460 }, { - "epoch": 0.63, - "learning_rate": 0.0002051858338198093, - "loss": 0.0169, + "epoch": 0.29, + "learning_rate": 0.0002557516989470816, + "loss": 0.0229, "step": 58470 }, { - "epoch": 0.63, - "learning_rate": 0.00020516961795420636, - "loss": 0.0177, + "epoch": 0.3, + "learning_rate": 0.0002557441312540676, + "loss": 0.0194, "step": 58480 }, { - "epoch": 0.63, - "learning_rate": 0.00020515340208860348, - "loss": 0.0153, + "epoch": 0.3, + "learning_rate": 0.00025573656356105357, + "loss": 0.0227, "step": 58490 }, { - "epoch": 0.63, - "learning_rate": 0.00020513718622300057, - "loss": 0.0166, + "epoch": 0.3, + "learning_rate": 0.00025572899586803955, + "loss": 0.0189, "step": 58500 }, { - "epoch": 0.63, - "learning_rate": 0.00020512097035739767, - "loss": 0.0187, + "epoch": 0.3, + "learning_rate": 0.0002557214281750256, + "loss": 0.0191, "step": 58510 }, { - "epoch": 0.63, - "learning_rate": 0.00020510475449179473, - "loss": 0.0204, + "epoch": 0.3, + "learning_rate": 0.00025571386048201157, + "loss": 0.019, "step": 58520 }, { - "epoch": 0.63, - "learning_rate": 0.00020508853862619185, - "loss": 0.0143, + "epoch": 0.3, + "learning_rate": 0.00025570629278899755, + "loss": 0.019, "step": 58530 }, { - "epoch": 0.63, - "learning_rate": 0.00020507232276058894, - "loss": 0.0207, + "epoch": 0.3, + "learning_rate": 0.00025569872509598353, + "loss": 0.0174, "step": 58540 }, { - "epoch": 0.63, - "learning_rate": 0.00020505610689498604, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.0002556911574029695, + "loss": 0.0252, "step": 58550 }, { - "epoch": 0.63, - "learning_rate": 0.00020503989102938313, - "loss": 0.018, + "epoch": 0.3, + "learning_rate": 0.0002556835897099555, + "loss": 0.0192, "step": 58560 }, { - "epoch": 0.63, - "learning_rate": 0.00020502367516378022, - "loss": 0.0206, + "epoch": 0.3, + "learning_rate": 0.00025567602201694153, + "loss": 0.0203, "step": 58570 }, { - "epoch": 0.63, - "learning_rate": 0.00020500745929817732, - "loss": 0.0157, + "epoch": 0.3, + "learning_rate": 0.0002556684543239275, + "loss": 0.018, "step": 58580 }, { - "epoch": 0.63, - "learning_rate": 0.00020499124343257443, - "loss": 0.0186, + "epoch": 0.3, + "learning_rate": 0.0002556608866309135, + "loss": 0.0187, "step": 58590 }, { - "epoch": 0.63, - "learning_rate": 0.0002049750275669715, - "loss": 0.0125, + "epoch": 0.3, + "learning_rate": 0.0002556533189378995, + "loss": 0.02, "step": 58600 }, { - "epoch": 0.63, - "learning_rate": 0.0002049588117013686, - "loss": 0.0206, + "epoch": 0.3, + "learning_rate": 0.00025564575124488546, + "loss": 0.0192, "step": 58610 }, { - "epoch": 0.63, - "learning_rate": 0.00020494259583576569, - "loss": 0.0199, + "epoch": 0.3, + "learning_rate": 0.00025563818355187144, + "loss": 0.0189, "step": 58620 }, { - "epoch": 0.63, - "learning_rate": 0.0002049263799701628, - "loss": 0.0178, + "epoch": 0.3, + "learning_rate": 0.00025563061585885747, + "loss": 0.0226, "step": 58630 }, { - "epoch": 0.63, - "learning_rate": 0.00020491016410455987, - "loss": 0.0179, + "epoch": 0.3, + "learning_rate": 0.00025562304816584345, + "loss": 0.02, "step": 58640 }, { - "epoch": 0.63, - "learning_rate": 0.00020489394823895696, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.00025561548047282944, + "loss": 0.0194, "step": 58650 }, { - "epoch": 0.63, - "learning_rate": 0.00020487773237335408, - "loss": 0.0162, + "epoch": 0.3, + "learning_rate": 0.0002556079127798154, + "loss": 0.0212, "step": 58660 }, { - "epoch": 0.63, - "learning_rate": 0.00020486151650775118, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.0002556003450868014, + "loss": 0.0214, "step": 58670 }, { - "epoch": 0.63, - "learning_rate": 0.00020484530064214824, - "loss": 0.0197, + "epoch": 0.3, + "learning_rate": 0.0002555927773937874, + "loss": 0.0227, "step": 58680 }, { - "epoch": 0.63, - "learning_rate": 0.00020482908477654536, - "loss": 0.0146, + "epoch": 0.3, + "learning_rate": 0.00025558520970077336, + "loss": 0.0171, "step": 58690 }, { - "epoch": 0.63, - "learning_rate": 0.00020481286891094246, - "loss": 0.0142, + "epoch": 0.3, + "learning_rate": 0.0002555776420077594, + "loss": 0.0217, "step": 58700 }, { - "epoch": 0.63, - "learning_rate": 0.00020479665304533955, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.0002555700743147454, + "loss": 0.0233, "step": 58710 }, { - "epoch": 0.63, - "learning_rate": 0.0002047804371797366, - "loss": 0.0182, + "epoch": 0.3, + "learning_rate": 0.00025556250662173136, + "loss": 0.0233, "step": 58720 }, { - "epoch": 0.63, - "learning_rate": 0.00020476422131413373, - "loss": 0.0181, + "epoch": 0.3, + "learning_rate": 0.00025555493892871734, + "loss": 0.0195, "step": 58730 }, { - "epoch": 0.64, - "learning_rate": 0.00020474800544853083, - "loss": 0.0198, + "epoch": 0.3, + "learning_rate": 0.0002555473712357033, + "loss": 0.0206, "step": 58740 }, { - "epoch": 0.64, - "learning_rate": 0.00020473178958292792, - "loss": 0.0167, + "epoch": 0.3, + "learning_rate": 0.0002555398035426893, + "loss": 0.0236, "step": 58750 }, { - "epoch": 0.64, - "learning_rate": 0.000204715573717325, - "loss": 0.0169, + "epoch": 0.3, + "learning_rate": 0.00025553223584967534, + "loss": 0.0218, "step": 58760 }, { - "epoch": 0.64, - "learning_rate": 0.0002046993578517221, - "loss": 0.0183, + "epoch": 0.3, + "learning_rate": 0.0002555246681566613, + "loss": 0.0205, "step": 58770 }, { - "epoch": 0.64, - "learning_rate": 0.0002046831419861192, - "loss": 0.0158, + "epoch": 0.3, + "learning_rate": 0.0002555171004636473, + "loss": 0.0196, "step": 58780 }, { - "epoch": 0.64, - "learning_rate": 0.00020466692612051632, - "loss": 0.019, + "epoch": 0.3, + "learning_rate": 0.0002555095327706333, + "loss": 0.0209, "step": 58790 }, { - "epoch": 0.64, - "learning_rate": 0.00020465071025491338, - "loss": 0.017, + "epoch": 0.3, + "learning_rate": 0.00025550196507761927, + "loss": 0.0205, "step": 58800 }, { - "epoch": 0.64, - "learning_rate": 0.00020463449438931048, - "loss": 0.0175, + "epoch": 0.3, + "learning_rate": 0.00025549439738460525, + "loss": 0.0206, "step": 58810 }, { - "epoch": 0.64, - "learning_rate": 0.00020461827852370757, - "loss": 0.0204, + "epoch": 0.3, + "learning_rate": 0.00025548682969159123, + "loss": 0.021, "step": 58820 }, { - "epoch": 0.64, - "learning_rate": 0.0002046020626581047, - "loss": 0.0181, + "epoch": 0.3, + "learning_rate": 0.00025547926199857726, + "loss": 0.0188, "step": 58830 }, { - "epoch": 0.64, - "learning_rate": 0.00020458584679250175, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.00025547169430556325, + "loss": 0.0202, "step": 58840 }, { - "epoch": 0.64, - "learning_rate": 0.00020456963092689885, - "loss": 0.0165, + "epoch": 0.3, + "learning_rate": 0.0002554641266125492, + "loss": 0.0244, "step": 58850 }, { - "epoch": 0.64, - "learning_rate": 0.00020455341506129597, - "loss": 0.0171, + "epoch": 0.3, + "learning_rate": 0.0002554565589195352, + "loss": 0.053, "step": 58860 }, { - "epoch": 0.64, - "learning_rate": 0.00020453719919569306, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.0002554489912265212, + "loss": 0.0232, "step": 58870 }, { - "epoch": 0.64, - "learning_rate": 0.00020452098333009012, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.00025544142353350717, + "loss": 0.0183, "step": 58880 }, { - "epoch": 0.64, - "learning_rate": 0.00020450476746448722, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.0002554338558404932, + "loss": 0.0426, "step": 58890 }, { - "epoch": 0.64, - "learning_rate": 0.00020448855159888434, + "epoch": 0.3, + "learning_rate": 0.0002554262881474792, "loss": 0.0177, "step": 58900 }, { - "epoch": 0.64, - "learning_rate": 0.00020447233573328143, - "loss": 0.0127, + "epoch": 0.3, + "learning_rate": 0.00025541872045446517, + "loss": 0.0179, "step": 58910 }, { - "epoch": 0.64, - "learning_rate": 0.0002044561198676785, - "loss": 0.0159, + "epoch": 0.3, + "learning_rate": 0.00025541115276145115, + "loss": 0.0202, "step": 58920 }, { - "epoch": 0.64, - "learning_rate": 0.00020443990400207562, - "loss": 0.0184, + "epoch": 0.3, + "learning_rate": 0.00025540358506843713, + "loss": 0.0236, "step": 58930 }, { - "epoch": 0.64, - "learning_rate": 0.0002044236881364727, - "loss": 0.0163, + "epoch": 0.3, + "learning_rate": 0.0002553960173754231, + "loss": 0.0213, "step": 58940 }, { - "epoch": 0.64, - "learning_rate": 0.0002044074722708698, - "loss": 0.0153, + "epoch": 0.3, + "learning_rate": 0.00025538844968240915, + "loss": 0.0203, "step": 58950 }, { - "epoch": 0.64, - "learning_rate": 0.00020439125640526687, - "loss": 0.0152, + "epoch": 0.3, + "learning_rate": 0.00025538088198939513, + "loss": 0.022, "step": 58960 }, { - "epoch": 0.64, - "learning_rate": 0.00020437504053966399, - "loss": 0.0188, + "epoch": 0.3, + "learning_rate": 0.0002553733142963811, + "loss": 0.0185, "step": 58970 }, { - "epoch": 0.64, - "learning_rate": 0.00020435882467406108, - "loss": 0.0165, + "epoch": 0.3, + "learning_rate": 0.0002553657466033671, + "loss": 0.0215, "step": 58980 }, { - "epoch": 0.64, - "learning_rate": 0.0002043426088084582, - "loss": 0.018, + "epoch": 0.3, + "learning_rate": 0.0002553581789103531, + "loss": 0.0176, "step": 58990 }, { - "epoch": 0.64, - "learning_rate": 0.0002043263929428553, - "loss": 0.0178, + "epoch": 0.3, + "learning_rate": 0.00025535061121733906, + "loss": 0.0179, "step": 59000 }, { - "epoch": 0.64, - "eval_cer": 0.9215251973031615, - "eval_loss": 0.011170790530741215, - "eval_runtime": 121.4022, - "eval_samples_per_second": 16.474, - "eval_steps_per_second": 4.119, + "epoch": 0.3, + "eval_cer": 0.9144916046179211, + "eval_loss": 0.014513496309518814, + "eval_runtime": 116.7004, + "eval_samples_per_second": 17.138, + "eval_steps_per_second": 4.284, "step": 59000 }, { - "epoch": 0.64, - "learning_rate": 0.00020431017707725236, - "loss": 0.0191, + "epoch": 0.3, + "learning_rate": 0.00025534304352432504, + "loss": 0.024, "step": 59010 }, { - "epoch": 0.64, - "learning_rate": 0.00020429396121164945, - "loss": 0.0162, + "epoch": 0.3, + "learning_rate": 0.0002553354758313111, + "loss": 0.0185, "step": 59020 }, { - "epoch": 0.64, - "learning_rate": 0.00020427774534604657, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.00025532790813829706, + "loss": 0.0185, "step": 59030 }, { - "epoch": 0.64, - "learning_rate": 0.00020426152948044366, - "loss": 0.016, + "epoch": 0.3, + "learning_rate": 0.00025532034044528304, + "loss": 0.0213, "step": 59040 }, { - "epoch": 0.64, - "learning_rate": 0.00020424531361484073, - "loss": 0.0152, + "epoch": 0.3, + "learning_rate": 0.000255312772752269, + "loss": 0.0171, "step": 59050 }, { - "epoch": 0.64, - "learning_rate": 0.00020422909774923785, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.000255305205059255, + "loss": 0.0214, "step": 59060 }, { - "epoch": 0.64, - "learning_rate": 0.00020421288188363494, - "loss": 0.0162, + "epoch": 0.3, + "learning_rate": 0.000255297637366241, + "loss": 0.0191, "step": 59070 }, { - "epoch": 0.64, - "learning_rate": 0.00020419666601803203, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.000255290069673227, + "loss": 0.0181, "step": 59080 }, { - "epoch": 0.64, - "learning_rate": 0.0002041804501524291, - "loss": 0.0173, + "epoch": 0.3, + "learning_rate": 0.000255282501980213, + "loss": 0.019, "step": 59090 }, { - "epoch": 0.64, - "learning_rate": 0.00020416423428682622, - "loss": 0.0154, + "epoch": 0.3, + "learning_rate": 0.000255274934287199, + "loss": 0.0217, "step": 59100 }, { - "epoch": 0.64, - "learning_rate": 0.0002041480184212233, - "loss": 0.0186, + "epoch": 0.3, + "learning_rate": 0.00025526736659418496, + "loss": 0.0169, "step": 59110 }, { - "epoch": 0.64, - "learning_rate": 0.0002041318025556204, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.00025525979890117094, + "loss": 0.0203, "step": 59120 }, { - "epoch": 0.64, - "learning_rate": 0.0002041155866900175, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.0002552522312081569, + "loss": 0.0228, "step": 59130 }, { - "epoch": 0.64, - "learning_rate": 0.0002040993708244146, - "loss": 0.0185, + "epoch": 0.3, + "learning_rate": 0.00025524466351514296, + "loss": 0.0209, "step": 59140 }, { - "epoch": 0.64, - "learning_rate": 0.00020408315495881168, - "loss": 0.0159, + "epoch": 0.3, + "learning_rate": 0.00025523709582212894, + "loss": 0.025, "step": 59150 }, { - "epoch": 0.64, - "learning_rate": 0.0002040669390932088, - "loss": 0.0169, + "epoch": 0.3, + "learning_rate": 0.0002552295281291149, + "loss": 0.0197, "step": 59160 }, { - "epoch": 0.64, - "learning_rate": 0.00020405072322760587, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.0002552219604361009, + "loss": 0.0191, "step": 59170 }, { - "epoch": 0.64, - "learning_rate": 0.00020403450736200296, - "loss": 0.0162, + "epoch": 0.3, + "learning_rate": 0.0002552143927430869, + "loss": 0.0208, "step": 59180 }, { - "epoch": 0.64, - "learning_rate": 0.00020401829149640005, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.00025520682505007287, + "loss": 0.0202, "step": 59190 }, { - "epoch": 0.64, - "learning_rate": 0.00020400207563079717, - "loss": 0.019, + "epoch": 0.3, + "learning_rate": 0.00025519925735705885, + "loss": 0.0194, "step": 59200 }, { - "epoch": 0.64, - "learning_rate": 0.00020398585976519424, - "loss": 0.0177, + "epoch": 0.3, + "learning_rate": 0.0002551916896640449, + "loss": 0.0189, "step": 59210 }, { - "epoch": 0.64, - "learning_rate": 0.00020396964389959133, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.00025518412197103087, + "loss": 0.0223, "step": 59220 }, { - "epoch": 0.64, - "learning_rate": 0.00020395342803398845, - "loss": 0.0172, + "epoch": 0.3, + "learning_rate": 0.00025517655427801685, + "loss": 0.0222, "step": 59230 }, { - "epoch": 0.64, - "learning_rate": 0.00020393721216838554, - "loss": 0.0194, + "epoch": 0.3, + "learning_rate": 0.00025516898658500283, + "loss": 0.0189, "step": 59240 }, { - "epoch": 0.64, - "learning_rate": 0.0002039209963027826, - "loss": 0.0152, + "epoch": 0.3, + "learning_rate": 0.0002551614188919888, + "loss": 0.0214, "step": 59250 }, { - "epoch": 0.64, - "learning_rate": 0.0002039047804371797, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.0002551538511989748, + "loss": 0.0198, "step": 59260 }, { - "epoch": 0.64, - "learning_rate": 0.00020388856457157682, - "loss": 0.0146, + "epoch": 0.3, + "learning_rate": 0.0002551462835059608, + "loss": 0.0212, "step": 59270 }, { - "epoch": 0.64, - "learning_rate": 0.00020387234870597392, - "loss": 0.0141, + "epoch": 0.3, + "learning_rate": 0.0002551387158129468, + "loss": 0.0223, "step": 59280 }, { - "epoch": 0.64, - "learning_rate": 0.00020385613284037098, - "loss": 0.0174, + "epoch": 0.3, + "learning_rate": 0.0002551311481199328, + "loss": 0.0205, "step": 59290 }, { - "epoch": 0.64, - "learning_rate": 0.0002038399169747681, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.00025512358042691877, + "loss": 0.0179, "step": 59300 }, { - "epoch": 0.64, - "learning_rate": 0.0002038237011091652, + "epoch": 0.3, + "learning_rate": 0.00025511601273390475, "loss": 0.0182, "step": 59310 }, { - "epoch": 0.64, - "learning_rate": 0.0002038074852435623, - "loss": 0.0186, + "epoch": 0.3, + "learning_rate": 0.00025510844504089073, + "loss": 0.0184, "step": 59320 }, { - "epoch": 0.64, - "learning_rate": 0.00020379126937795935, - "loss": 0.0163, + "epoch": 0.3, + "learning_rate": 0.0002551008773478767, + "loss": 0.0181, "step": 59330 }, { - "epoch": 0.64, - "learning_rate": 0.00020377505351235647, - "loss": 0.0157, + "epoch": 0.3, + "learning_rate": 0.00025509330965486275, + "loss": 0.0206, "step": 59340 }, { - "epoch": 0.64, - "learning_rate": 0.00020375883764675356, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.00025508574196184873, + "loss": 0.0164, "step": 59350 }, { - "epoch": 0.64, - "learning_rate": 0.00020374262178115068, - "loss": 0.0131, + "epoch": 0.3, + "learning_rate": 0.0002550781742688347, + "loss": 0.0216, "step": 59360 }, { - "epoch": 0.64, - "learning_rate": 0.00020372640591554775, - "loss": 0.0169, + "epoch": 0.3, + "learning_rate": 0.0002550706065758207, + "loss": 0.0213, "step": 59370 }, { - "epoch": 0.64, - "learning_rate": 0.00020371019004994484, - "loss": 0.0181, + "epoch": 0.3, + "learning_rate": 0.0002550630388828067, + "loss": 0.0218, "step": 59380 }, { - "epoch": 0.64, - "learning_rate": 0.00020369397418434194, - "loss": 0.0313, + "epoch": 0.3, + "learning_rate": 0.00025505547118979266, + "loss": 0.0208, "step": 59390 }, { - "epoch": 0.64, - "learning_rate": 0.00020367775831873906, - "loss": 0.0281, + "epoch": 0.3, + "learning_rate": 0.0002550479034967787, + "loss": 0.0233, "step": 59400 }, { - "epoch": 0.64, - "learning_rate": 0.00020366154245313612, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.0002550403358037647, + "loss": 0.0239, "step": 59410 }, { - "epoch": 0.64, - "learning_rate": 0.00020364532658753321, - "loss": 0.0154, + "epoch": 0.3, + "learning_rate": 0.00025503276811075066, + "loss": 0.0208, "step": 59420 }, { - "epoch": 0.64, - "learning_rate": 0.00020362911072193033, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.00025502520041773664, + "loss": 0.0208, "step": 59430 }, { - "epoch": 0.64, - "learning_rate": 0.00020361289485632743, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.0002550176327247226, + "loss": 0.0222, "step": 59440 }, { - "epoch": 0.64, - "learning_rate": 0.0002035966789907245, - "loss": 0.0145, + "epoch": 0.3, + "learning_rate": 0.0002550100650317086, + "loss": 0.0214, "step": 59450 }, { - "epoch": 0.64, - "learning_rate": 0.00020358046312512158, - "loss": 0.0197, + "epoch": 0.3, + "learning_rate": 0.00025500249733869464, + "loss": 0.0329, "step": 59460 }, { - "epoch": 0.64, - "learning_rate": 0.0002035642472595187, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.0002549949296456806, + "loss": 0.0242, "step": 59470 }, { - "epoch": 0.64, - "learning_rate": 0.0002035480313939158, - "loss": 0.0159, + "epoch": 0.3, + "learning_rate": 0.0002549873619526666, + "loss": 0.0266, "step": 59480 }, { - "epoch": 0.64, - "learning_rate": 0.00020353181552831286, - "loss": 0.0182, + "epoch": 0.3, + "learning_rate": 0.0002549797942596526, + "loss": 0.0795, "step": 59490 }, { - "epoch": 0.64, - "learning_rate": 0.00020351559966270998, - "loss": 0.0197, + "epoch": 0.3, + "learning_rate": 0.00025497222656663856, + "loss": 0.0277, "step": 59500 }, { - "epoch": 0.64, - "learning_rate": 0.00020349938379710708, - "loss": 0.017, + "epoch": 0.3, + "learning_rate": 0.00025496465887362454, + "loss": 0.02, "step": 59510 }, { - "epoch": 0.64, - "learning_rate": 0.00020348316793150417, - "loss": 0.0165, + "epoch": 0.3, + "learning_rate": 0.0002549570911806105, + "loss": 0.0209, "step": 59520 }, { - "epoch": 0.64, - "learning_rate": 0.00020346695206590123, - "loss": 0.0179, + "epoch": 0.3, + "learning_rate": 0.00025494952348759656, + "loss": 0.0174, "step": 59530 }, { - "epoch": 0.64, - "learning_rate": 0.00020345073620029835, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.00025494195579458254, + "loss": 0.0194, "step": 59540 }, { - "epoch": 0.64, - "learning_rate": 0.00020343452033469545, - "loss": 0.017, + "epoch": 0.3, + "learning_rate": 0.0002549343881015685, + "loss": 0.0272, "step": 59550 }, { - "epoch": 0.64, - "learning_rate": 0.00020341830446909254, - "loss": 0.0172, + "epoch": 0.3, + "learning_rate": 0.0002549268204085545, + "loss": 0.0196, "step": 59560 }, { - "epoch": 0.64, - "learning_rate": 0.00020340208860348963, - "loss": 0.0152, + "epoch": 0.3, + "learning_rate": 0.0002549192527155405, + "loss": 0.022, "step": 59570 }, { - "epoch": 0.64, - "learning_rate": 0.00020338587273788672, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.00025491168502252647, + "loss": 0.0221, "step": 59580 }, { - "epoch": 0.64, - "learning_rate": 0.00020336965687228382, - "loss": 0.0176, + "epoch": 0.3, + "learning_rate": 0.0002549041173295125, + "loss": 0.0304, "step": 59590 }, { - "epoch": 0.64, - "learning_rate": 0.00020335344100668094, - "loss": 0.0169, + "epoch": 0.3, + "learning_rate": 0.0002548965496364985, + "loss": 0.0214, "step": 59600 }, { - "epoch": 0.64, - "learning_rate": 0.000203337225141078, - "loss": 0.0179, + "epoch": 0.3, + "learning_rate": 0.00025488898194348447, + "loss": 0.0246, "step": 59610 }, { - "epoch": 0.64, - "learning_rate": 0.0002033210092754751, - "loss": 0.012, + "epoch": 0.3, + "learning_rate": 0.00025488141425047045, + "loss": 0.0211, "step": 59620 }, { - "epoch": 0.64, - "learning_rate": 0.0002033047934098722, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.00025487384655745643, + "loss": 0.0215, "step": 59630 }, { - "epoch": 0.64, - "learning_rate": 0.0002032885775442693, - "loss": 0.0165, + "epoch": 0.3, + "learning_rate": 0.0002548662788644424, + "loss": 0.0218, "step": 59640 }, { - "epoch": 0.64, - "learning_rate": 0.00020327236167866637, - "loss": 0.0212, + "epoch": 0.3, + "learning_rate": 0.00025485871117142845, + "loss": 0.0214, "step": 59650 }, { - "epoch": 0.64, - "learning_rate": 0.00020325614581306347, - "loss": 0.0132, + "epoch": 0.3, + "learning_rate": 0.00025485114347841443, + "loss": 0.0248, "step": 59660 }, { - "epoch": 0.65, - "learning_rate": 0.0002032399299474606, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.0002548435757854004, + "loss": 0.022, "step": 59670 }, { - "epoch": 0.65, - "learning_rate": 0.00020322371408185768, - "loss": 0.0179, + "epoch": 0.3, + "learning_rate": 0.0002548360080923864, + "loss": 0.0206, "step": 59680 }, { - "epoch": 0.65, - "learning_rate": 0.00020320749821625475, - "loss": 0.0143, + "epoch": 0.3, + "learning_rate": 0.00025482844039937237, + "loss": 0.0213, "step": 59690 }, { - "epoch": 0.65, - "learning_rate": 0.00020319128235065186, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.00025482087270635835, + "loss": 0.0178, "step": 59700 }, { - "epoch": 0.65, - "learning_rate": 0.00020317506648504896, - "loss": 0.0162, + "epoch": 0.3, + "learning_rate": 0.00025481330501334434, + "loss": 0.0318, "step": 59710 }, { - "epoch": 0.65, - "learning_rate": 0.00020315885061944605, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.0002548057373203303, + "loss": 0.0239, "step": 59720 }, { - "epoch": 0.65, - "learning_rate": 0.00020314263475384317, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.0002547981696273163, + "loss": 0.0198, "step": 59730 }, { - "epoch": 0.65, - "learning_rate": 0.00020312641888824024, - "loss": 0.0138, + "epoch": 0.3, + "learning_rate": 0.0002547906019343023, + "loss": 0.0214, "step": 59740 }, { - "epoch": 0.65, - "learning_rate": 0.00020311020302263733, - "loss": 0.0162, + "epoch": 0.3, + "learning_rate": 0.00025478303424128826, + "loss": 0.0176, "step": 59750 }, { - "epoch": 0.65, - "learning_rate": 0.00020309398715703442, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.0002547754665482743, + "loss": 0.021, "step": 59760 }, { - "epoch": 0.65, - "learning_rate": 0.00020307777129143154, - "loss": 0.0163, + "epoch": 0.3, + "learning_rate": 0.0002547678988552603, + "loss": 0.0196, "step": 59770 }, { - "epoch": 0.65, - "learning_rate": 0.0002030615554258286, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.00025476033116224626, + "loss": 0.0192, "step": 59780 }, { - "epoch": 0.65, - "learning_rate": 0.0002030453395602257, - "loss": 0.0174, + "epoch": 0.3, + "learning_rate": 0.00025475276346923224, + "loss": 0.025, "step": 59790 }, { - "epoch": 0.65, - "learning_rate": 0.00020302912369462282, - "loss": 0.0153, + "epoch": 0.3, + "learning_rate": 0.0002547451957762182, + "loss": 0.019, "step": 59800 }, { - "epoch": 0.65, - "learning_rate": 0.0002030129078290199, - "loss": 0.0181, + "epoch": 0.3, + "learning_rate": 0.0002547376280832042, + "loss": 0.0182, "step": 59810 }, { - "epoch": 0.65, - "learning_rate": 0.00020299669196341698, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.00025473006039019024, + "loss": 0.0199, "step": 59820 }, { - "epoch": 0.65, - "learning_rate": 0.00020298047609781407, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.0002547224926971762, + "loss": 0.02, "step": 59830 }, { - "epoch": 0.65, - "learning_rate": 0.0002029642602322112, - "loss": 0.0142, + "epoch": 0.3, + "learning_rate": 0.0002547149250041622, + "loss": 0.0212, "step": 59840 }, { - "epoch": 0.65, - "learning_rate": 0.00020294804436660828, - "loss": 0.0172, + "epoch": 0.3, + "learning_rate": 0.0002547073573111482, + "loss": 0.016, "step": 59850 }, { - "epoch": 0.65, - "learning_rate": 0.00020293182850100535, - "loss": 0.0166, + "epoch": 0.3, + "learning_rate": 0.00025469978961813417, + "loss": 0.0213, "step": 59860 }, { - "epoch": 0.65, - "learning_rate": 0.00020291561263540247, - "loss": 0.0185, + "epoch": 0.3, + "learning_rate": 0.00025469222192512015, + "loss": 0.0211, "step": 59870 }, { - "epoch": 0.65, - "learning_rate": 0.00020289939676979956, - "loss": 0.0172, + "epoch": 0.3, + "learning_rate": 0.0002546846542321062, + "loss": 0.0208, "step": 59880 }, { - "epoch": 0.65, - "learning_rate": 0.00020288318090419665, - "loss": 0.0191, + "epoch": 0.3, + "learning_rate": 0.00025467708653909216, + "loss": 0.0223, "step": 59890 }, { - "epoch": 0.65, - "learning_rate": 0.00020286696503859372, - "loss": 0.0179, + "epoch": 0.3, + "learning_rate": 0.00025466951884607815, + "loss": 0.0217, "step": 59900 }, { - "epoch": 0.65, - "learning_rate": 0.00020285074917299084, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.0002546619511530641, + "loss": 0.0192, "step": 59910 }, { - "epoch": 0.65, - "learning_rate": 0.00020283453330738793, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.0002546543834600501, + "loss": 0.0191, "step": 59920 }, { - "epoch": 0.65, - "learning_rate": 0.00020281831744178505, - "loss": 0.0153, + "epoch": 0.3, + "learning_rate": 0.0002546468157670361, + "loss": 0.0181, "step": 59930 }, { - "epoch": 0.65, - "learning_rate": 0.00020280210157618212, - "loss": 0.016, + "epoch": 0.3, + "learning_rate": 0.00025463924807402207, + "loss": 0.0208, "step": 59940 }, { - "epoch": 0.65, - "learning_rate": 0.0002027858857105792, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.0002546316803810081, + "loss": 0.0267, "step": 59950 }, { - "epoch": 0.65, - "learning_rate": 0.0002027696698449763, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.0002546241126879941, + "loss": 0.0264, "step": 59960 }, { - "epoch": 0.65, - "learning_rate": 0.00020275345397937342, - "loss": 0.0176, + "epoch": 0.3, + "learning_rate": 0.00025461654499498007, + "loss": 0.0235, "step": 59970 }, { - "epoch": 0.65, - "learning_rate": 0.0002027372381137705, - "loss": 0.0186, + "epoch": 0.3, + "learning_rate": 0.00025460897730196605, + "loss": 0.0181, "step": 59980 }, { - "epoch": 0.65, - "learning_rate": 0.00020272102224816758, - "loss": 0.0129, + "epoch": 0.3, + "learning_rate": 0.00025460140960895203, + "loss": 0.0188, "step": 59990 }, { - "epoch": 0.65, - "learning_rate": 0.0002027048063825647, - "loss": 0.0187, + "epoch": 0.3, + "learning_rate": 0.000254593841915938, + "loss": 0.0241, "step": 60000 }, { - "epoch": 0.65, - "eval_cer": 0.9215121682588159, - "eval_loss": 0.01132188830524683, - "eval_runtime": 121.508, - "eval_samples_per_second": 16.46, - "eval_steps_per_second": 4.115, + "epoch": 0.3, + "eval_cer": 0.9145197461055578, + "eval_loss": 0.01466525811702013, + "eval_runtime": 116.7343, + "eval_samples_per_second": 17.133, + "eval_steps_per_second": 4.283, "step": 60000 }, { - "epoch": 0.65, - "learning_rate": 0.0002026885905169618, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.00025458627422292405, + "loss": 0.0222, "step": 60010 }, { - "epoch": 0.65, - "learning_rate": 0.00020267237465135886, - "loss": 0.0151, + "epoch": 0.3, + "learning_rate": 0.00025457870652991003, + "loss": 0.022, "step": 60020 }, { - "epoch": 0.65, - "learning_rate": 0.00020265615878575595, - "loss": 0.0162, + "epoch": 0.3, + "learning_rate": 0.000254571138836896, + "loss": 0.025, "step": 60030 }, { - "epoch": 0.65, - "learning_rate": 0.00020263994292015307, - "loss": 0.02, + "epoch": 0.3, + "learning_rate": 0.000254563571143882, + "loss": 0.0254, "step": 60040 }, { - "epoch": 0.65, - "learning_rate": 0.00020262372705455017, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.000254556003450868, + "loss": 0.0161, "step": 60050 }, { - "epoch": 0.65, - "learning_rate": 0.00020260751118894723, - "loss": 0.0179, + "epoch": 0.3, + "learning_rate": 0.00025454843575785396, + "loss": 0.0222, "step": 60060 }, { - "epoch": 0.65, - "learning_rate": 0.00020259129532334435, - "loss": 0.0158, + "epoch": 0.3, + "learning_rate": 0.00025454086806483994, + "loss": 0.0249, "step": 60070 }, { - "epoch": 0.65, - "learning_rate": 0.00020257507945774144, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.000254533300371826, + "loss": 0.0201, "step": 60080 }, { - "epoch": 0.65, - "learning_rate": 0.00020255886359213854, - "loss": 0.0151, + "epoch": 0.3, + "learning_rate": 0.00025452573267881196, + "loss": 0.0251, "step": 60090 }, { - "epoch": 0.65, - "learning_rate": 0.0002025426477265356, - "loss": 0.0163, + "epoch": 0.3, + "learning_rate": 0.00025451816498579794, + "loss": 0.0184, "step": 60100 }, { - "epoch": 0.65, - "learning_rate": 0.00020252643186093272, - "loss": 0.0131, + "epoch": 0.3, + "learning_rate": 0.0002545105972927839, + "loss": 0.0202, "step": 60110 }, { - "epoch": 0.65, - "learning_rate": 0.00020251021599532981, - "loss": 0.0151, + "epoch": 0.3, + "learning_rate": 0.0002545030295997699, + "loss": 0.0188, "step": 60120 }, { - "epoch": 0.65, - "learning_rate": 0.0002024940001297269, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.0002544954619067559, + "loss": 0.0217, "step": 60130 }, { - "epoch": 0.65, - "learning_rate": 0.000202477784264124, - "loss": 0.0159, + "epoch": 0.3, + "learning_rate": 0.0002544878942137419, + "loss": 0.0195, "step": 60140 }, { - "epoch": 0.65, - "learning_rate": 0.0002024615683985211, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.0002544803265207279, + "loss": 0.0158, "step": 60150 }, { - "epoch": 0.65, - "learning_rate": 0.00020244535253291819, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.0002544727588277139, + "loss": 0.0186, "step": 60160 }, { - "epoch": 0.65, - "learning_rate": 0.0002024291366673153, - "loss": 0.0183, + "epoch": 0.3, + "learning_rate": 0.00025446519113469986, + "loss": 0.0186, "step": 60170 }, { - "epoch": 0.65, - "learning_rate": 0.00020241292080171237, - "loss": 0.0179, + "epoch": 0.3, + "learning_rate": 0.00025445762344168584, + "loss": 0.0174, "step": 60180 }, { - "epoch": 0.65, - "learning_rate": 0.00020239670493610946, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.0002544500557486718, + "loss": 0.0219, "step": 60190 }, { - "epoch": 0.65, - "learning_rate": 0.00020238048907050656, - "loss": 0.0172, + "epoch": 0.3, + "learning_rate": 0.00025444248805565786, + "loss": 0.0207, "step": 60200 }, { - "epoch": 0.65, - "learning_rate": 0.00020236427320490368, - "loss": 0.0171, + "epoch": 0.3, + "learning_rate": 0.00025443492036264384, + "loss": 0.0172, "step": 60210 }, { - "epoch": 0.65, - "learning_rate": 0.00020234805733930074, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.0002544273526696298, + "loss": 0.0183, "step": 60220 }, { - "epoch": 0.65, - "learning_rate": 0.00020233184147369783, - "loss": 0.0165, + "epoch": 0.3, + "learning_rate": 0.0002544197849766158, + "loss": 0.0178, "step": 60230 }, { - "epoch": 0.65, - "learning_rate": 0.00020231562560809495, - "loss": 0.0152, + "epoch": 0.3, + "learning_rate": 0.0002544122172836018, + "loss": 0.0183, "step": 60240 }, { - "epoch": 0.65, - "learning_rate": 0.00020229940974249205, - "loss": 0.016, + "epoch": 0.3, + "learning_rate": 0.00025440464959058777, + "loss": 0.0244, "step": 60250 }, { - "epoch": 0.65, - "learning_rate": 0.0002022831938768891, - "loss": 0.017, + "epoch": 0.3, + "learning_rate": 0.00025439708189757375, + "loss": 0.0236, "step": 60260 }, { - "epoch": 0.65, - "learning_rate": 0.0002022669780112862, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.0002543895142045598, + "loss": 0.0188, "step": 60270 }, { - "epoch": 0.65, - "learning_rate": 0.00020225076214568333, - "loss": 0.0151, + "epoch": 0.3, + "learning_rate": 0.00025438194651154577, + "loss": 0.0188, "step": 60280 }, { - "epoch": 0.65, - "learning_rate": 0.00020223454628008042, - "loss": 0.0163, + "epoch": 0.3, + "learning_rate": 0.00025437437881853175, + "loss": 0.0232, "step": 60290 }, { - "epoch": 0.65, - "learning_rate": 0.00020221833041447748, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.00025436681112551773, + "loss": 0.0174, "step": 60300 }, { - "epoch": 0.65, - "learning_rate": 0.0002022021145488746, - "loss": 0.0169, + "epoch": 0.3, + "learning_rate": 0.0002543592434325037, + "loss": 0.0225, "step": 60310 }, { - "epoch": 0.65, - "learning_rate": 0.0002021858986832717, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.0002543516757394897, + "loss": 0.02, "step": 60320 }, { - "epoch": 0.65, - "learning_rate": 0.0002021696828176688, - "loss": 0.0135, + "epoch": 0.3, + "learning_rate": 0.0002543441080464757, + "loss": 0.0178, "step": 60330 }, { - "epoch": 0.65, - "learning_rate": 0.00020215346695206585, - "loss": 0.0165, + "epoch": 0.3, + "learning_rate": 0.0002543365403534617, + "loss": 0.0174, "step": 60340 }, { - "epoch": 0.65, - "learning_rate": 0.00020213725108646297, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.0002543289726604477, + "loss": 0.0205, "step": 60350 }, { - "epoch": 0.65, - "learning_rate": 0.00020212103522086007, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.00025432140496743367, + "loss": 0.0188, "step": 60360 }, { - "epoch": 0.65, - "learning_rate": 0.0002021048193552572, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.00025431383727441965, + "loss": 0.0151, "step": 60370 }, { - "epoch": 0.65, - "learning_rate": 0.00020208860348965425, - "loss": 0.019, + "epoch": 0.3, + "learning_rate": 0.00025430626958140563, + "loss": 0.0177, "step": 60380 }, { - "epoch": 0.65, - "learning_rate": 0.00020207238762405135, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.0002542987018883916, + "loss": 0.0193, "step": 60390 }, { - "epoch": 0.65, - "learning_rate": 0.00020205617175844844, - "loss": 0.0144, + "epoch": 0.3, + "learning_rate": 0.00025429113419537765, + "loss": 0.0221, "step": 60400 }, { - "epoch": 0.65, - "learning_rate": 0.00020203995589284556, - "loss": 0.0153, + "epoch": 0.3, + "learning_rate": 0.00025428356650236363, + "loss": 0.0209, "step": 60410 }, { - "epoch": 0.65, - "learning_rate": 0.00020202374002724262, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.0002542759988093496, + "loss": 0.0216, "step": 60420 }, { - "epoch": 0.65, - "learning_rate": 0.00020200752416163972, - "loss": 0.0181, + "epoch": 0.3, + "learning_rate": 0.0002542684311163356, + "loss": 0.0209, "step": 60430 }, { - "epoch": 0.65, - "learning_rate": 0.00020199130829603684, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.0002542608634233216, + "loss": 0.0154, "step": 60440 }, { - "epoch": 0.65, - "learning_rate": 0.00020197509243043393, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.00025425329573030756, + "loss": 0.0193, "step": 60450 }, { - "epoch": 0.65, - "learning_rate": 0.00020195887656483102, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.0002542457280372936, + "loss": 0.0172, "step": 60460 }, { - "epoch": 0.65, - "learning_rate": 0.0002019426606992281, - "loss": 0.0153, + "epoch": 0.31, + "learning_rate": 0.0002542381603442796, + "loss": 0.0191, "step": 60470 }, { - "epoch": 0.65, - "learning_rate": 0.0002019264448336252, - "loss": 0.0148, + "epoch": 0.31, + "learning_rate": 0.00025423059265126556, + "loss": 0.0174, "step": 60480 }, { - "epoch": 0.65, - "learning_rate": 0.0002019102289680223, - "loss": 0.0125, + "epoch": 0.31, + "learning_rate": 0.00025422302495825154, + "loss": 0.0192, "step": 60490 }, { - "epoch": 0.65, - "learning_rate": 0.0002018940131024194, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.0002542154572652375, + "loss": 0.0193, "step": 60500 }, { - "epoch": 0.65, - "learning_rate": 0.00020187779723681649, - "loss": 0.0138, + "epoch": 0.31, + "learning_rate": 0.0002542078895722235, + "loss": 0.0244, "step": 60510 }, { - "epoch": 0.65, - "learning_rate": 0.00020186158137121358, - "loss": 0.0159, + "epoch": 0.31, + "learning_rate": 0.00025420032187920954, + "loss": 0.0176, "step": 60520 }, { - "epoch": 0.65, - "learning_rate": 0.00020184536550561067, - "loss": 0.0164, + "epoch": 0.31, + "learning_rate": 0.0002541927541861955, + "loss": 0.0243, "step": 60530 }, { - "epoch": 0.65, - "learning_rate": 0.0002018291496400078, - "loss": 0.0168, + "epoch": 0.31, + "learning_rate": 0.0002541851864931815, + "loss": 0.0201, "step": 60540 }, { - "epoch": 0.65, - "learning_rate": 0.00020181293377440486, - "loss": 0.0202, + "epoch": 0.31, + "learning_rate": 0.0002541776188001675, + "loss": 0.0217, "step": 60550 }, { - "epoch": 0.65, - "learning_rate": 0.00020179671790880195, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.00025417005110715346, + "loss": 0.0192, "step": 60560 }, { - "epoch": 0.65, - "learning_rate": 0.00020178050204319904, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.00025416248341413944, + "loss": 0.0218, "step": 60570 }, { - "epoch": 0.65, - "learning_rate": 0.00020176428617759616, - "loss": 0.0163, + "epoch": 0.31, + "learning_rate": 0.0002541549157211254, + "loss": 0.0238, "step": 60580 }, { - "epoch": 0.66, - "learning_rate": 0.00020174807031199323, - "loss": 0.0164, + "epoch": 0.31, + "learning_rate": 0.00025414734802811146, + "loss": 0.0173, "step": 60590 }, { - "epoch": 0.66, - "learning_rate": 0.00020173185444639032, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.00025413978033509744, + "loss": 0.0186, "step": 60600 }, { - "epoch": 0.66, - "learning_rate": 0.00020171563858078744, - "loss": 0.0167, + "epoch": 0.31, + "learning_rate": 0.0002541322126420834, + "loss": 0.0208, "step": 60610 }, { - "epoch": 0.66, - "learning_rate": 0.00020169942271518453, - "loss": 0.0155, + "epoch": 0.31, + "learning_rate": 0.0002541246449490694, + "loss": 0.0211, "step": 60620 }, { - "epoch": 0.66, - "learning_rate": 0.0002016832068495816, - "loss": 0.0175, + "epoch": 0.31, + "learning_rate": 0.0002541170772560554, + "loss": 0.0186, "step": 60630 }, { - "epoch": 0.66, - "learning_rate": 0.0002016669909839787, - "loss": 0.0185, + "epoch": 0.31, + "learning_rate": 0.00025410950956304137, + "loss": 0.0186, "step": 60640 }, { - "epoch": 0.66, - "learning_rate": 0.0002016507751183758, - "loss": 0.0147, + "epoch": 0.31, + "learning_rate": 0.0002541019418700274, + "loss": 0.0193, "step": 60650 }, { - "epoch": 0.66, - "learning_rate": 0.0002016345592527729, - "loss": 0.021, + "epoch": 0.31, + "learning_rate": 0.0002540943741770134, + "loss": 0.0182, "step": 60660 }, { - "epoch": 0.66, - "learning_rate": 0.00020161834338716997, - "loss": 0.0219, + "epoch": 0.31, + "learning_rate": 0.00025408680648399937, + "loss": 0.0217, "step": 60670 }, { - "epoch": 0.66, - "learning_rate": 0.0002016021275215671, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.00025407923879098535, + "loss": 0.0216, "step": 60680 }, { - "epoch": 0.66, - "learning_rate": 0.00020158591165596418, - "loss": 0.0161, + "epoch": 0.31, + "learning_rate": 0.00025407167109797133, + "loss": 0.0203, "step": 60690 }, { - "epoch": 0.66, - "learning_rate": 0.00020156969579036127, - "loss": 0.0173, + "epoch": 0.31, + "learning_rate": 0.0002540641034049573, + "loss": 0.0189, "step": 60700 }, { - "epoch": 0.66, - "learning_rate": 0.00020155347992475837, - "loss": 0.0171, + "epoch": 0.31, + "learning_rate": 0.00025405653571194335, + "loss": 0.0223, "step": 60710 }, { - "epoch": 0.66, - "learning_rate": 0.00020153726405915546, - "loss": 0.0175, + "epoch": 0.31, + "learning_rate": 0.00025404896801892933, + "loss": 0.0173, "step": 60720 }, { - "epoch": 0.66, - "learning_rate": 0.00020152104819355255, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.0002540414003259153, + "loss": 0.0181, "step": 60730 }, { - "epoch": 0.66, - "learning_rate": 0.00020150483232794967, - "loss": 0.0174, + "epoch": 0.31, + "learning_rate": 0.0002540338326329013, + "loss": 0.0196, "step": 60740 }, { - "epoch": 0.66, - "learning_rate": 0.00020148861646234674, - "loss": 0.0163, + "epoch": 0.31, + "learning_rate": 0.0002540262649398873, + "loss": 0.0158, "step": 60750 }, { - "epoch": 0.66, - "learning_rate": 0.00020147240059674383, - "loss": 0.0154, + "epoch": 0.31, + "learning_rate": 0.00025401869724687325, + "loss": 0.0215, "step": 60760 }, { - "epoch": 0.66, - "learning_rate": 0.00020145618473114092, - "loss": 0.0198, + "epoch": 0.31, + "learning_rate": 0.00025401112955385924, + "loss": 0.018, "step": 60770 }, { - "epoch": 0.66, - "learning_rate": 0.00020143996886553804, - "loss": 0.0174, + "epoch": 0.31, + "learning_rate": 0.00025400356186084527, + "loss": 0.0185, "step": 60780 }, { - "epoch": 0.66, - "learning_rate": 0.0002014237529999351, - "loss": 0.0156, + "epoch": 0.31, + "learning_rate": 0.00025399599416783125, + "loss": 0.0197, "step": 60790 }, { - "epoch": 0.66, - "learning_rate": 0.0002014075371343322, - "loss": 0.0165, + "epoch": 0.31, + "learning_rate": 0.00025398842647481723, + "loss": 0.0205, "step": 60800 }, { - "epoch": 0.66, - "learning_rate": 0.00020139132126872932, - "loss": 0.0144, + "epoch": 0.31, + "learning_rate": 0.0002539808587818032, + "loss": 0.0225, "step": 60810 }, { - "epoch": 0.66, - "learning_rate": 0.00020137510540312641, - "loss": 0.0177, + "epoch": 0.31, + "learning_rate": 0.0002539732910887892, + "loss": 0.0179, "step": 60820 }, { - "epoch": 0.66, - "learning_rate": 0.00020135888953752348, - "loss": 0.014, + "epoch": 0.31, + "learning_rate": 0.0002539657233957752, + "loss": 0.019, "step": 60830 }, { - "epoch": 0.66, - "learning_rate": 0.00020134267367192057, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.0002539581557027612, + "loss": 0.0205, "step": 60840 }, { - "epoch": 0.66, - "learning_rate": 0.0002013264578063177, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.0002539505880097472, + "loss": 0.0215, "step": 60850 }, { - "epoch": 0.66, - "learning_rate": 0.00020131024194071479, - "loss": 0.0173, + "epoch": 0.31, + "learning_rate": 0.0002539430203167332, + "loss": 0.0189, "step": 60860 }, { - "epoch": 0.66, - "learning_rate": 0.00020129402607511185, - "loss": 0.0155, + "epoch": 0.31, + "learning_rate": 0.00025393545262371916, + "loss": 0.0186, "step": 60870 }, { - "epoch": 0.66, - "learning_rate": 0.00020127781020950897, - "loss": 0.0189, + "epoch": 0.31, + "learning_rate": 0.00025392788493070514, + "loss": 0.0246, "step": 60880 }, { - "epoch": 0.66, - "learning_rate": 0.00020126159434390606, - "loss": 0.019, + "epoch": 0.31, + "learning_rate": 0.0002539203172376911, + "loss": 0.0224, "step": 60890 }, { - "epoch": 0.66, - "learning_rate": 0.00020124537847830316, - "loss": 0.0156, + "epoch": 0.31, + "learning_rate": 0.0002539127495446771, + "loss": 0.0181, "step": 60900 }, { - "epoch": 0.66, - "learning_rate": 0.00020122916261270022, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.00025390518185166314, + "loss": 0.0198, "step": 60910 }, { - "epoch": 0.66, - "learning_rate": 0.00020121294674709734, - "loss": 0.0185, + "epoch": 0.31, + "learning_rate": 0.0002538976141586491, + "loss": 0.0235, "step": 60920 }, { - "epoch": 0.66, - "learning_rate": 0.00020119673088149444, - "loss": 0.0186, + "epoch": 0.31, + "learning_rate": 0.0002538900464656351, + "loss": 0.0185, "step": 60930 }, { - "epoch": 0.66, - "learning_rate": 0.00020118051501589155, - "loss": 0.017, + "epoch": 0.31, + "learning_rate": 0.0002538824787726211, + "loss": 0.0187, "step": 60940 }, { - "epoch": 0.66, - "learning_rate": 0.00020116429915028862, - "loss": 0.0219, + "epoch": 0.31, + "learning_rate": 0.00025387491107960706, + "loss": 0.02, "step": 60950 }, { - "epoch": 0.66, - "learning_rate": 0.0002011480832846857, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.00025386734338659305, + "loss": 0.0174, "step": 60960 }, { - "epoch": 0.66, - "learning_rate": 0.0002011318674190828, - "loss": 0.0164, + "epoch": 0.31, + "learning_rate": 0.00025385977569357903, + "loss": 0.018, "step": 60970 }, { - "epoch": 0.66, - "learning_rate": 0.00020111565155347993, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.000253852208000565, + "loss": 0.0197, "step": 60980 }, { - "epoch": 0.66, - "learning_rate": 0.000201099435687877, - "loss": 0.0177, + "epoch": 0.31, + "learning_rate": 0.000253844640307551, + "loss": 0.0193, "step": 60990 }, { - "epoch": 0.66, - "learning_rate": 0.00020108321982227408, - "loss": 0.0174, + "epoch": 0.31, + "learning_rate": 0.00025383707261453697, + "loss": 0.02, "step": 61000 }, { - "epoch": 0.66, - "eval_cer": 0.9215981599514972, - "eval_loss": 0.011921165511012077, - "eval_runtime": 121.5349, - "eval_samples_per_second": 16.456, - "eval_steps_per_second": 4.114, + "epoch": 0.31, + "eval_cer": 0.9144615223380336, + "eval_loss": 0.01344729121774435, + "eval_runtime": 116.7714, + "eval_samples_per_second": 17.127, + "eval_steps_per_second": 4.282, "step": 61000 }, { - "epoch": 0.66, - "learning_rate": 0.0002010670039566712, - "loss": 0.0148, + "epoch": 0.31, + "learning_rate": 0.000253829504921523, + "loss": 0.0177, "step": 61010 }, { - "epoch": 0.66, - "learning_rate": 0.0002010507880910683, - "loss": 0.0161, + "epoch": 0.31, + "learning_rate": 0.000253821937228509, + "loss": 0.0203, "step": 61020 }, { - "epoch": 0.66, - "learning_rate": 0.00020103457222546536, - "loss": 0.0206, + "epoch": 0.31, + "learning_rate": 0.00025381436953549497, + "loss": 0.0181, "step": 61030 }, { - "epoch": 0.66, - "learning_rate": 0.00020101835635986246, - "loss": 0.0157, + "epoch": 0.31, + "learning_rate": 0.00025380680184248095, + "loss": 0.0181, "step": 61040 }, { - "epoch": 0.66, - "learning_rate": 0.00020100214049425958, - "loss": 0.0165, + "epoch": 0.31, + "learning_rate": 0.00025379923414946693, + "loss": 0.0211, "step": 61050 }, { - "epoch": 0.66, - "learning_rate": 0.00020098592462865667, - "loss": 0.014, + "epoch": 0.31, + "learning_rate": 0.0002537916664564529, + "loss": 0.0216, "step": 61060 }, { - "epoch": 0.66, - "learning_rate": 0.00020096970876305373, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.00025378409876343895, + "loss": 0.0188, "step": 61070 }, { - "epoch": 0.66, - "learning_rate": 0.00020095349289745085, - "loss": 0.0135, + "epoch": 0.31, + "learning_rate": 0.00025377653107042493, + "loss": 0.0202, "step": 61080 }, { - "epoch": 0.66, - "learning_rate": 0.00020093727703184795, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.0002537689633774109, + "loss": 0.0203, "step": 61090 }, { - "epoch": 0.66, - "learning_rate": 0.00020092106116624504, - "loss": 0.0236, + "epoch": 0.31, + "learning_rate": 0.0002537613956843969, + "loss": 0.0198, "step": 61100 }, { - "epoch": 0.66, - "learning_rate": 0.0002009048453006421, - "loss": 0.0185, + "epoch": 0.31, + "learning_rate": 0.0002537538279913829, + "loss": 0.0193, "step": 61110 }, { - "epoch": 0.66, - "learning_rate": 0.00020088862943503922, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.00025374626029836886, + "loss": 0.0154, "step": 61120 }, { - "epoch": 0.66, - "learning_rate": 0.00020087241356943632, - "loss": 0.0163, + "epoch": 0.31, + "learning_rate": 0.00025373869260535484, + "loss": 0.0201, "step": 61130 }, { - "epoch": 0.66, - "learning_rate": 0.0002008561977038334, - "loss": 0.0171, + "epoch": 0.31, + "learning_rate": 0.0002537311249123409, + "loss": 0.0212, "step": 61140 }, { - "epoch": 0.66, - "learning_rate": 0.00020083998183823053, - "loss": 0.0207, + "epoch": 0.31, + "learning_rate": 0.00025372355721932686, + "loss": 0.0196, "step": 61150 }, { - "epoch": 0.66, - "learning_rate": 0.0002008237659726276, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.00025371598952631284, + "loss": 0.0204, "step": 61160 }, { - "epoch": 0.66, - "learning_rate": 0.0002008075501070247, - "loss": 0.0156, + "epoch": 0.31, + "learning_rate": 0.0002537084218332988, + "loss": 0.0205, "step": 61170 }, { - "epoch": 0.66, - "learning_rate": 0.0002007913342414218, - "loss": 0.0174, + "epoch": 0.31, + "learning_rate": 0.0002537008541402848, + "loss": 0.0203, "step": 61180 }, { - "epoch": 0.66, - "learning_rate": 0.0002007751183758189, - "loss": 0.0159, + "epoch": 0.31, + "learning_rate": 0.0002536932864472708, + "loss": 0.0142, "step": 61190 }, { - "epoch": 0.66, - "learning_rate": 0.00020075890251021597, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.0002536857187542568, + "loss": 0.0162, "step": 61200 }, { - "epoch": 0.66, - "learning_rate": 0.00020074268664461306, - "loss": 0.0173, + "epoch": 0.31, + "learning_rate": 0.0002536781510612428, + "loss": 0.0192, "step": 61210 }, { - "epoch": 0.66, - "learning_rate": 0.00020072647077901018, - "loss": 0.0185, + "epoch": 0.31, + "learning_rate": 0.0002536705833682288, + "loss": 0.0198, "step": 61220 }, { - "epoch": 0.66, - "learning_rate": 0.00020071025491340727, - "loss": 0.017, + "epoch": 0.31, + "learning_rate": 0.00025366301567521476, + "loss": 0.0182, "step": 61230 }, { - "epoch": 0.66, - "learning_rate": 0.00020069403904780434, - "loss": 0.0169, + "epoch": 0.31, + "learning_rate": 0.00025365544798220074, + "loss": 0.0196, "step": 61240 }, { - "epoch": 0.66, - "learning_rate": 0.00020067782318220146, - "loss": 0.0177, + "epoch": 0.31, + "learning_rate": 0.0002536478802891867, + "loss": 0.0201, "step": 61250 }, { - "epoch": 0.66, - "learning_rate": 0.00020066160731659855, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.00025364031259617276, + "loss": 0.0217, "step": 61260 }, { - "epoch": 0.66, - "learning_rate": 0.00020064539145099564, - "loss": 0.0177, + "epoch": 0.31, + "learning_rate": 0.00025363274490315874, + "loss": 0.021, "step": 61270 }, { - "epoch": 0.66, - "learning_rate": 0.0002006291755853927, - "loss": 0.0165, + "epoch": 0.31, + "learning_rate": 0.0002536251772101447, + "loss": 0.019, "step": 61280 }, { - "epoch": 0.66, - "learning_rate": 0.00020061295971978983, - "loss": 0.0156, + "epoch": 0.31, + "learning_rate": 0.0002536176095171307, + "loss": 0.0201, "step": 61290 }, { - "epoch": 0.66, - "learning_rate": 0.00020059674385418692, - "loss": 0.0159, + "epoch": 0.31, + "learning_rate": 0.0002536100418241167, + "loss": 0.0178, "step": 61300 }, { - "epoch": 0.66, - "learning_rate": 0.00020058052798858404, - "loss": 0.0155, + "epoch": 0.31, + "learning_rate": 0.00025360247413110267, + "loss": 0.0185, "step": 61310 }, { - "epoch": 0.66, - "learning_rate": 0.0002005643121229811, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.00025359490643808865, + "loss": 0.0179, "step": 61320 }, { - "epoch": 0.66, - "learning_rate": 0.0002005480962573782, - "loss": 0.0168, + "epoch": 0.31, + "learning_rate": 0.0002535873387450747, + "loss": 0.0179, "step": 61330 }, { - "epoch": 0.66, - "learning_rate": 0.0002005318803917753, - "loss": 0.0172, + "epoch": 0.31, + "learning_rate": 0.00025357977105206067, + "loss": 0.0223, "step": 61340 }, { - "epoch": 0.66, - "learning_rate": 0.0002005156645261724, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.00025357220335904665, + "loss": 0.0179, "step": 61350 }, { - "epoch": 0.66, - "learning_rate": 0.00020049944866056948, - "loss": 0.0153, + "epoch": 0.31, + "learning_rate": 0.00025356463566603263, + "loss": 0.0219, "step": 61360 }, { - "epoch": 0.66, - "learning_rate": 0.00020048323279496657, - "loss": 0.0178, + "epoch": 0.31, + "learning_rate": 0.0002535570679730186, + "loss": 0.0226, "step": 61370 }, { - "epoch": 0.66, - "learning_rate": 0.0002004670169293637, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.0002535495002800046, + "loss": 0.0179, "step": 61380 }, { - "epoch": 0.66, - "learning_rate": 0.00020045080106376078, - "loss": 0.0186, + "epoch": 0.31, + "learning_rate": 0.00025354193258699063, + "loss": 0.0198, "step": 61390 }, { - "epoch": 0.66, - "learning_rate": 0.00020043458519815785, - "loss": 0.0211, + "epoch": 0.31, + "learning_rate": 0.0002535343648939766, + "loss": 0.019, "step": 61400 }, { - "epoch": 0.66, - "learning_rate": 0.00020041836933255494, - "loss": 0.0134, + "epoch": 0.31, + "learning_rate": 0.0002535267972009626, + "loss": 0.0229, "step": 61410 }, { - "epoch": 0.66, - "learning_rate": 0.00020040215346695206, - "loss": 0.0131, + "epoch": 0.31, + "learning_rate": 0.00025351922950794857, + "loss": 0.0246, "step": 61420 }, { - "epoch": 0.66, - "learning_rate": 0.00020038593760134915, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.00025351166181493455, + "loss": 0.0162, "step": 61430 }, { - "epoch": 0.66, - "learning_rate": 0.00020036972173574622, - "loss": 0.0177, + "epoch": 0.31, + "learning_rate": 0.00025350409412192053, + "loss": 0.0236, "step": 61440 }, { - "epoch": 0.66, - "learning_rate": 0.00020035350587014334, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.00025349652642890657, + "loss": 0.0207, "step": 61450 }, { - "epoch": 0.66, - "learning_rate": 0.00020033729000454043, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.00025348895873589255, + "loss": 0.0217, "step": 61460 }, { - "epoch": 0.66, - "learning_rate": 0.00020032107413893752, - "loss": 0.0144, + "epoch": 0.31, + "learning_rate": 0.00025348139104287853, + "loss": 0.0222, "step": 61470 }, { - "epoch": 0.66, - "learning_rate": 0.0002003048582733346, - "loss": 0.0172, + "epoch": 0.31, + "learning_rate": 0.0002534738233498645, + "loss": 0.0188, "step": 61480 }, { - "epoch": 0.66, - "learning_rate": 0.0002002886424077317, - "loss": 0.0162, + "epoch": 0.31, + "learning_rate": 0.0002534662556568505, + "loss": 0.0183, "step": 61490 }, { - "epoch": 0.66, - "learning_rate": 0.0002002724265421288, - "loss": 0.0138, + "epoch": 0.31, + "learning_rate": 0.0002534586879638365, + "loss": 0.0163, "step": 61500 }, { - "epoch": 0.66, - "learning_rate": 0.0002002562106765259, - "loss": 0.0173, + "epoch": 0.31, + "learning_rate": 0.00025345112027082246, + "loss": 0.0176, "step": 61510 }, { - "epoch": 0.67, - "learning_rate": 0.000200239994810923, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.0002534435525778085, + "loss": 0.0193, "step": 61520 }, { - "epoch": 0.67, - "learning_rate": 0.00020022377894532008, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.0002534359848847945, + "loss": 0.017, "step": 61530 }, { - "epoch": 0.67, - "learning_rate": 0.00020020756307971717, - "loss": 0.0162, + "epoch": 0.31, + "learning_rate": 0.00025342841719178046, + "loss": 0.0197, "step": 61540 }, { - "epoch": 0.67, - "learning_rate": 0.0002001913472141143, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.00025342084949876644, + "loss": 0.0206, "step": 61550 }, { - "epoch": 0.67, - "learning_rate": 0.00020017513134851136, - "loss": 0.0162, + "epoch": 0.31, + "learning_rate": 0.0002534132818057524, + "loss": 0.0192, "step": 61560 }, { - "epoch": 0.67, - "learning_rate": 0.00020015891548290845, - "loss": 0.0227, + "epoch": 0.31, + "learning_rate": 0.0002534057141127384, + "loss": 0.0209, "step": 61570 }, { - "epoch": 0.67, - "learning_rate": 0.00020014269961730554, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.00025339814641972444, + "loss": 0.0215, "step": 61580 }, { - "epoch": 0.67, - "learning_rate": 0.00020012648375170266, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.0002533905787267104, + "loss": 0.0207, "step": 61590 }, { - "epoch": 0.67, - "learning_rate": 0.00020011026788609973, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.0002533830110336964, + "loss": 0.0207, "step": 61600 }, { - "epoch": 0.67, - "learning_rate": 0.00020009405202049682, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.0002533754433406824, + "loss": 0.0199, "step": 61610 }, { - "epoch": 0.67, - "learning_rate": 0.00020007783615489394, - "loss": 0.0159, + "epoch": 0.31, + "learning_rate": 0.00025336787564766836, + "loss": 0.0169, "step": 61620 }, { - "epoch": 0.67, - "learning_rate": 0.00020006162028929104, - "loss": 0.0206, + "epoch": 0.31, + "learning_rate": 0.00025336030795465434, + "loss": 0.0215, "step": 61630 }, { - "epoch": 0.67, - "learning_rate": 0.0002000454044236881, - "loss": 0.0178, + "epoch": 0.31, + "learning_rate": 0.0002533527402616403, + "loss": 0.0189, "step": 61640 }, { - "epoch": 0.67, - "learning_rate": 0.0002000291885580852, - "loss": 0.0178, + "epoch": 0.31, + "learning_rate": 0.00025334517256862636, + "loss": 0.0171, "step": 61650 }, { - "epoch": 0.67, - "learning_rate": 0.00020001297269248231, - "loss": 0.0202, + "epoch": 0.31, + "learning_rate": 0.00025333760487561234, + "loss": 0.0195, "step": 61660 }, { - "epoch": 0.67, - "learning_rate": 0.0001999967568268794, - "loss": 0.0178, + "epoch": 0.31, + "learning_rate": 0.0002533300371825983, + "loss": 0.0215, "step": 61670 }, { - "epoch": 0.67, - "learning_rate": 0.00019998054096127647, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.0002533224694895843, + "loss": 0.0208, "step": 61680 }, { - "epoch": 0.67, - "learning_rate": 0.0001999643250956736, - "loss": 0.0155, + "epoch": 0.31, + "learning_rate": 0.0002533149017965703, + "loss": 0.0219, "step": 61690 }, { - "epoch": 0.67, - "learning_rate": 0.00019994810923007068, - "loss": 0.0187, + "epoch": 0.31, + "learning_rate": 0.00025330733410355627, + "loss": 0.021, "step": 61700 }, { - "epoch": 0.67, - "learning_rate": 0.00019993189336446778, - "loss": 0.0189, + "epoch": 0.31, + "learning_rate": 0.0002532997664105423, + "loss": 0.0225, "step": 61710 }, { - "epoch": 0.67, - "learning_rate": 0.00019991567749886487, - "loss": 0.018, + "epoch": 0.31, + "learning_rate": 0.0002532921987175283, + "loss": 0.024, "step": 61720 }, { - "epoch": 0.67, - "learning_rate": 0.00019989946163326196, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.00025328463102451427, + "loss": 0.018, "step": 61730 }, { - "epoch": 0.67, - "learning_rate": 0.00019988324576765906, - "loss": 0.0145, + "epoch": 0.31, + "learning_rate": 0.00025327706333150025, + "loss": 0.0191, "step": 61740 }, { - "epoch": 0.67, - "learning_rate": 0.00019986702990205618, - "loss": 0.0183, + "epoch": 0.31, + "learning_rate": 0.00025326949563848623, + "loss": 0.0177, "step": 61750 }, { - "epoch": 0.67, - "learning_rate": 0.00019985081403645324, - "loss": 0.0186, + "epoch": 0.31, + "learning_rate": 0.0002532619279454722, + "loss": 0.0208, "step": 61760 }, { - "epoch": 0.67, - "learning_rate": 0.00019983459817085033, - "loss": 0.0194, + "epoch": 0.31, + "learning_rate": 0.00025325436025245825, + "loss": 0.0175, "step": 61770 }, { - "epoch": 0.67, - "learning_rate": 0.00019981838230524743, - "loss": 0.0134, + "epoch": 0.31, + "learning_rate": 0.00025324679255944423, + "loss": 0.0175, "step": 61780 }, { - "epoch": 0.67, - "learning_rate": 0.00019980216643964455, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.0002532392248664302, + "loss": 0.0203, "step": 61790 }, { - "epoch": 0.67, - "learning_rate": 0.0001997859505740416, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.0002532316571734162, + "loss": 0.0211, "step": 61800 }, { - "epoch": 0.67, - "learning_rate": 0.0001997697347084387, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.0002532240894804022, + "loss": 0.0191, "step": 61810 }, { - "epoch": 0.67, - "learning_rate": 0.00019975351884283582, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.00025321652178738815, + "loss": 0.0181, "step": 61820 }, { - "epoch": 0.67, - "learning_rate": 0.00019973730297723292, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.00025320895409437414, + "loss": 0.0227, "step": 61830 }, { - "epoch": 0.67, - "learning_rate": 0.00019972108711162998, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.00025320138640136017, + "loss": 0.0221, "step": 61840 }, { - "epoch": 0.67, - "learning_rate": 0.00019970487124602708, - "loss": 0.0161, + "epoch": 0.31, + "learning_rate": 0.00025319381870834615, + "loss": 0.0198, "step": 61850 }, { - "epoch": 0.67, - "learning_rate": 0.0001996886553804242, - "loss": 0.0162, + "epoch": 0.31, + "learning_rate": 0.00025318625101533213, + "loss": 0.0188, "step": 61860 }, { - "epoch": 0.67, - "learning_rate": 0.0001996724395148213, - "loss": 0.0176, + "epoch": 0.31, + "learning_rate": 0.0002531786833223181, + "loss": 0.0216, "step": 61870 }, { - "epoch": 0.67, - "learning_rate": 0.00019965622364921838, - "loss": 0.0153, + "epoch": 0.31, + "learning_rate": 0.0002531711156293041, + "loss": 0.0242, "step": 61880 }, { - "epoch": 0.67, - "learning_rate": 0.00019964000778361547, - "loss": 0.0192, + "epoch": 0.31, + "learning_rate": 0.0002531635479362901, + "loss": 0.0194, "step": 61890 }, { - "epoch": 0.67, - "learning_rate": 0.00019962379191801257, - "loss": 0.0172, + "epoch": 0.31, + "learning_rate": 0.0002531559802432761, + "loss": 0.0158, "step": 61900 }, { - "epoch": 0.67, - "learning_rate": 0.00019960757605240966, - "loss": 0.0192, + "epoch": 0.31, + "learning_rate": 0.0002531484125502621, + "loss": 0.0187, "step": 61910 }, { - "epoch": 0.67, - "learning_rate": 0.00019959136018680678, - "loss": 0.019, + "epoch": 0.31, + "learning_rate": 0.0002531408448572481, + "loss": 0.0213, "step": 61920 }, { - "epoch": 0.67, - "learning_rate": 0.00019957514432120384, - "loss": 0.0159, + "epoch": 0.31, + "learning_rate": 0.00025313327716423406, + "loss": 0.0252, "step": 61930 }, { - "epoch": 0.67, - "learning_rate": 0.00019955892845560094, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.00025312570947122004, + "loss": 0.0224, "step": 61940 }, { - "epoch": 0.67, - "learning_rate": 0.00019954271258999803, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.000253118141778206, + "loss": 0.0216, "step": 61950 }, { - "epoch": 0.67, - "learning_rate": 0.00019952649672439515, - "loss": 0.0162, + "epoch": 0.31, + "learning_rate": 0.00025311057408519206, + "loss": 0.0215, "step": 61960 }, { - "epoch": 0.67, - "learning_rate": 0.00019951028085879222, - "loss": 0.0183, + "epoch": 0.31, + "learning_rate": 0.00025310300639217804, + "loss": 0.0189, "step": 61970 }, { - "epoch": 0.67, - "learning_rate": 0.0001994940649931893, - "loss": 0.0186, + "epoch": 0.31, + "learning_rate": 0.000253095438699164, + "loss": 0.0195, "step": 61980 }, { - "epoch": 0.67, - "learning_rate": 0.00019947784912758643, - "loss": 0.0201, + "epoch": 0.31, + "learning_rate": 0.00025308787100615, + "loss": 0.0169, "step": 61990 }, { - "epoch": 0.67, - "learning_rate": 0.00019946163326198352, - "loss": 0.0135, + "epoch": 0.31, + "learning_rate": 0.000253080303313136, + "loss": 0.024, "step": 62000 }, { - "epoch": 0.67, - "eval_cer": 0.9215330147297689, - "eval_loss": 0.011450623162090778, - "eval_runtime": 121.258, - "eval_samples_per_second": 16.494, - "eval_steps_per_second": 4.123, + "epoch": 0.31, + "eval_cer": 0.9144838414489178, + "eval_loss": 0.014024483039975166, + "eval_runtime": 116.7957, + "eval_samples_per_second": 17.124, + "eval_steps_per_second": 4.281, "step": 62000 }, { - "epoch": 0.67, - "learning_rate": 0.0001994454173963806, - "loss": 0.0175, + "epoch": 0.31, + "learning_rate": 0.00025307273562012196, + "loss": 0.0204, "step": 62010 }, { - "epoch": 0.67, - "learning_rate": 0.0001994292015307777, - "loss": 0.0172, + "epoch": 0.31, + "learning_rate": 0.00025306516792710795, + "loss": 0.0195, "step": 62020 }, { - "epoch": 0.67, - "learning_rate": 0.0001994129856651748, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.000253057600234094, + "loss": 0.0199, "step": 62030 }, { - "epoch": 0.67, - "learning_rate": 0.0001993967697995719, - "loss": 0.0421, + "epoch": 0.31, + "learning_rate": 0.00025305003254107996, + "loss": 0.0215, "step": 62040 }, { - "epoch": 0.67, - "learning_rate": 0.00019938055393396896, - "loss": 0.0281, + "epoch": 0.31, + "learning_rate": 0.00025304246484806594, + "loss": 0.0183, "step": 62050 }, { - "epoch": 0.67, - "learning_rate": 0.00019936433806836608, - "loss": 0.0206, + "epoch": 0.31, + "learning_rate": 0.0002530348971550519, + "loss": 0.0228, "step": 62060 }, { - "epoch": 0.67, - "learning_rate": 0.00019934812220276317, - "loss": 0.0181, + "epoch": 0.31, + "learning_rate": 0.0002530273294620379, + "loss": 0.022, "step": 62070 }, { - "epoch": 0.67, - "learning_rate": 0.00019933190633716026, - "loss": 0.0183, + "epoch": 0.31, + "learning_rate": 0.0002530197617690239, + "loss": 0.0208, "step": 62080 }, { - "epoch": 0.67, - "learning_rate": 0.00019931569047155736, - "loss": 0.0212, + "epoch": 0.31, + "learning_rate": 0.0002530121940760099, + "loss": 0.0275, "step": 62090 }, { - "epoch": 0.67, - "learning_rate": 0.00019929947460595445, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.0002530046263829959, + "loss": 0.0203, "step": 62100 }, { - "epoch": 0.67, - "learning_rate": 0.00019928325874035154, - "loss": 0.0175, + "epoch": 0.31, + "learning_rate": 0.0002529970586899819, + "loss": 0.0219, "step": 62110 }, { - "epoch": 0.67, - "learning_rate": 0.00019926704287474866, - "loss": 0.0181, + "epoch": 0.31, + "learning_rate": 0.00025298949099696787, + "loss": 0.0225, "step": 62120 }, { - "epoch": 0.67, - "learning_rate": 0.00019925082700914573, - "loss": 0.0175, + "epoch": 0.31, + "learning_rate": 0.00025298192330395385, + "loss": 0.0185, "step": 62130 }, { - "epoch": 0.67, - "learning_rate": 0.00019923461114354282, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.00025297435561093983, + "loss": 0.0206, "step": 62140 }, { - "epoch": 0.67, - "learning_rate": 0.0001992183952779399, - "loss": 0.0165, + "epoch": 0.31, + "learning_rate": 0.0002529667879179258, + "loss": 0.0213, "step": 62150 }, { - "epoch": 0.67, - "learning_rate": 0.00019920217941233703, - "loss": 0.018, + "epoch": 0.31, + "learning_rate": 0.00025295922022491185, + "loss": 0.0231, "step": 62160 }, { - "epoch": 0.67, - "learning_rate": 0.0001991859635467341, - "loss": 0.017, + "epoch": 0.31, + "learning_rate": 0.00025295165253189783, + "loss": 0.0182, "step": 62170 }, { - "epoch": 0.67, - "learning_rate": 0.0001991697476811312, - "loss": 0.0133, + "epoch": 0.31, + "learning_rate": 0.0002529440848388838, + "loss": 0.0204, "step": 62180 }, { - "epoch": 0.67, - "learning_rate": 0.0001991535318155283, - "loss": 0.0127, + "epoch": 0.31, + "learning_rate": 0.0002529365171458698, + "loss": 0.02, "step": 62190 }, { - "epoch": 0.67, - "learning_rate": 0.0001991373159499254, - "loss": 0.0135, + "epoch": 0.31, + "learning_rate": 0.0002529289494528558, + "loss": 0.0219, "step": 62200 }, { - "epoch": 0.67, - "learning_rate": 0.00019912110008432247, - "loss": 0.0159, + "epoch": 0.31, + "learning_rate": 0.00025292138175984176, + "loss": 0.0212, "step": 62210 }, { - "epoch": 0.67, - "learning_rate": 0.00019910488421871956, - "loss": 0.0175, + "epoch": 0.31, + "learning_rate": 0.00025291381406682774, + "loss": 0.0237, "step": 62220 }, { - "epoch": 0.67, - "learning_rate": 0.00019908866835311668, - "loss": 0.0136, + "epoch": 0.31, + "learning_rate": 0.0002529062463738137, + "loss": 0.019, "step": 62230 }, { - "epoch": 0.67, - "learning_rate": 0.00019907245248751377, - "loss": 0.0167, + "epoch": 0.31, + "learning_rate": 0.0002528986786807997, + "loss": 0.0195, "step": 62240 }, { - "epoch": 0.67, - "learning_rate": 0.00019905623662191084, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.0002528911109877857, + "loss": 0.0205, "step": 62250 }, { - "epoch": 0.67, - "learning_rate": 0.00019904002075630796, - "loss": 0.0129, + "epoch": 0.31, + "learning_rate": 0.0002528835432947717, + "loss": 0.0231, "step": 62260 }, { - "epoch": 0.67, - "learning_rate": 0.00019902380489070505, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.0002528759756017577, + "loss": 0.02, "step": 62270 }, { - "epoch": 0.67, - "learning_rate": 0.00019900758902510215, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.0002528684079087437, + "loss": 0.0196, "step": 62280 }, { - "epoch": 0.67, - "learning_rate": 0.0001989913731594992, - "loss": 0.0137, + "epoch": 0.31, + "learning_rate": 0.00025286084021572966, + "loss": 0.0176, "step": 62290 }, { - "epoch": 0.67, - "learning_rate": 0.00019897515729389633, - "loss": 0.0174, + "epoch": 0.31, + "learning_rate": 0.00025285327252271564, + "loss": 0.0196, "step": 62300 }, { - "epoch": 0.67, - "learning_rate": 0.00019895894142829342, - "loss": 0.0162, + "epoch": 0.31, + "learning_rate": 0.0002528457048297016, + "loss": 0.0173, "step": 62310 }, { - "epoch": 0.67, - "learning_rate": 0.00019894272556269054, - "loss": 0.0163, + "epoch": 0.31, + "learning_rate": 0.00025283813713668766, + "loss": 0.0189, "step": 62320 }, { - "epoch": 0.67, - "learning_rate": 0.0001989265096970876, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.00025283056944367364, + "loss": 0.0228, "step": 62330 }, { - "epoch": 0.67, - "learning_rate": 0.0001989102938314847, - "loss": 0.0134, + "epoch": 0.31, + "learning_rate": 0.0002528230017506596, + "loss": 0.0182, "step": 62340 }, { - "epoch": 0.67, - "learning_rate": 0.0001988940779658818, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.0002528154340576456, + "loss": 0.0232, "step": 62350 }, { - "epoch": 0.67, - "learning_rate": 0.00019887786210027891, - "loss": 0.0174, + "epoch": 0.31, + "learning_rate": 0.0002528078663646316, + "loss": 0.0159, "step": 62360 }, { - "epoch": 0.67, - "learning_rate": 0.00019886164623467598, - "loss": 0.0192, + "epoch": 0.31, + "learning_rate": 0.00025280029867161757, + "loss": 0.019, "step": 62370 }, { - "epoch": 0.67, - "learning_rate": 0.00019884543036907307, - "loss": 0.0191, + "epoch": 0.31, + "learning_rate": 0.00025279273097860355, + "loss": 0.0198, "step": 62380 }, { - "epoch": 0.67, - "learning_rate": 0.0001988292145034702, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.0002527851632855896, + "loss": 0.023, "step": 62390 }, { - "epoch": 0.67, - "learning_rate": 0.00019881299863786729, - "loss": 0.017, + "epoch": 0.31, + "learning_rate": 0.00025277759559257557, + "loss": 0.0207, "step": 62400 }, { - "epoch": 0.67, - "learning_rate": 0.00019879678277226435, - "loss": 0.0168, + "epoch": 0.31, + "learning_rate": 0.00025277002789956155, + "loss": 0.0182, "step": 62410 }, { - "epoch": 0.67, - "learning_rate": 0.00019878056690666144, - "loss": 0.0161, + "epoch": 0.31, + "learning_rate": 0.00025276246020654753, + "loss": 0.0205, "step": 62420 }, { - "epoch": 0.67, - "learning_rate": 0.00019876435104105856, - "loss": 0.0133, + "epoch": 0.31, + "learning_rate": 0.0002527548925135335, + "loss": 0.0204, "step": 62430 }, { - "epoch": 0.68, - "learning_rate": 0.00019874813517545566, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.0002527473248205195, + "loss": 0.0217, "step": 62440 }, { - "epoch": 0.68, - "learning_rate": 0.00019873191930985272, - "loss": 0.0174, + "epoch": 0.32, + "learning_rate": 0.00025273975712750553, + "loss": 0.0245, "step": 62450 }, { - "epoch": 0.68, - "learning_rate": 0.00019871570344424984, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.0002527321894344915, + "loss": 0.0216, "step": 62460 }, { - "epoch": 0.68, - "learning_rate": 0.00019869948757864693, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.0002527246217414775, + "loss": 0.0215, "step": 62470 }, { - "epoch": 0.68, - "learning_rate": 0.00019868327171304403, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.00025271705404846347, + "loss": 0.0223, "step": 62480 }, { - "epoch": 0.68, - "learning_rate": 0.0001986670558474411, - "loss": 0.016, + "epoch": 0.32, + "learning_rate": 0.00025270948635544945, + "loss": 0.0195, "step": 62490 }, { - "epoch": 0.68, - "learning_rate": 0.0001986508399818382, - "loss": 0.0166, + "epoch": 0.32, + "learning_rate": 0.00025270191866243543, + "loss": 0.0208, "step": 62500 }, { - "epoch": 0.68, - "learning_rate": 0.0001986346241162353, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.00025269435096942147, + "loss": 0.0197, "step": 62510 }, { - "epoch": 0.68, - "learning_rate": 0.0001986184082506324, - "loss": 0.0195, + "epoch": 0.32, + "learning_rate": 0.00025268678327640745, + "loss": 0.0188, "step": 62520 }, { - "epoch": 0.68, - "learning_rate": 0.0001986021923850295, - "loss": 0.0167, + "epoch": 0.32, + "learning_rate": 0.00025267921558339343, + "loss": 0.0197, "step": 62530 }, { - "epoch": 0.68, - "learning_rate": 0.00019858597651942658, - "loss": 0.0153, + "epoch": 0.32, + "learning_rate": 0.0002526716478903794, + "loss": 0.0204, "step": 62540 }, { - "epoch": 0.68, - "learning_rate": 0.00019856976065382368, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.0002526640801973654, + "loss": 0.0155, "step": 62550 }, { - "epoch": 0.68, - "learning_rate": 0.0001985535447882208, - "loss": 0.0202, + "epoch": 0.32, + "learning_rate": 0.0002526565125043514, + "loss": 0.0229, "step": 62560 }, { - "epoch": 0.68, - "learning_rate": 0.00019853732892261786, - "loss": 0.0142, + "epoch": 0.32, + "learning_rate": 0.00025264894481133736, + "loss": 0.0238, "step": 62570 }, { - "epoch": 0.68, - "learning_rate": 0.00019852111305701495, - "loss": 0.0151, + "epoch": 0.32, + "learning_rate": 0.0002526413771183234, + "loss": 0.0245, "step": 62580 }, { - "epoch": 0.68, - "learning_rate": 0.00019850489719141205, - "loss": 0.0178, + "epoch": 0.32, + "learning_rate": 0.0002526338094253094, + "loss": 0.0196, "step": 62590 }, { - "epoch": 0.68, - "learning_rate": 0.00019848868132580917, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.00025262624173229536, + "loss": 0.0206, "step": 62600 }, { - "epoch": 0.68, - "learning_rate": 0.00019847246546020626, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.00025261867403928134, + "loss": 0.0193, "step": 62610 }, { - "epoch": 0.68, - "learning_rate": 0.00019845624959460333, - "loss": 0.017, + "epoch": 0.32, + "learning_rate": 0.0002526111063462673, + "loss": 0.0186, "step": 62620 }, { - "epoch": 0.68, - "learning_rate": 0.00019844003372900045, - "loss": 0.0155, + "epoch": 0.32, + "learning_rate": 0.0002526035386532533, + "loss": 0.0173, "step": 62630 }, { - "epoch": 0.68, - "learning_rate": 0.00019842381786339754, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.00025259597096023934, + "loss": 0.0172, "step": 62640 }, { - "epoch": 0.68, - "learning_rate": 0.00019840760199779463, - "loss": 0.0175, + "epoch": 0.32, + "learning_rate": 0.0002525884032672253, + "loss": 0.0247, "step": 62650 }, { - "epoch": 0.68, - "learning_rate": 0.0001983913861321917, - "loss": 0.0135, + "epoch": 0.32, + "learning_rate": 0.0002525808355742113, + "loss": 0.0177, "step": 62660 }, { - "epoch": 0.68, - "learning_rate": 0.00019837517026658882, - "loss": 0.017, + "epoch": 0.32, + "learning_rate": 0.0002525732678811973, + "loss": 0.0206, "step": 62670 }, { - "epoch": 0.68, - "learning_rate": 0.0001983589544009859, - "loss": 0.0151, + "epoch": 0.32, + "learning_rate": 0.00025256570018818326, + "loss": 0.0188, "step": 62680 }, { - "epoch": 0.68, - "learning_rate": 0.00019834273853538303, - "loss": 0.0198, + "epoch": 0.32, + "learning_rate": 0.00025255813249516924, + "loss": 0.0219, "step": 62690 }, { - "epoch": 0.68, - "learning_rate": 0.0001983265226697801, - "loss": 0.0178, + "epoch": 0.32, + "learning_rate": 0.0002525505648021552, + "loss": 0.0219, "step": 62700 }, { - "epoch": 0.68, - "learning_rate": 0.0001983103068041772, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.00025254299710914126, + "loss": 0.0178, "step": 62710 }, { - "epoch": 0.68, - "learning_rate": 0.00019829409093857428, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.00025253542941612724, + "loss": 0.02, "step": 62720 }, { - "epoch": 0.68, - "learning_rate": 0.0001982778750729714, - "loss": 0.0154, + "epoch": 0.32, + "learning_rate": 0.0002525278617231132, + "loss": 0.0183, "step": 62730 }, { - "epoch": 0.68, - "learning_rate": 0.00019826165920736847, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.0002525202940300992, + "loss": 0.0189, "step": 62740 }, { - "epoch": 0.68, - "learning_rate": 0.00019824544334176556, - "loss": 0.0184, + "epoch": 0.32, + "learning_rate": 0.0002525127263370852, + "loss": 0.0273, "step": 62750 }, { - "epoch": 0.68, - "learning_rate": 0.00019822922747616268, - "loss": 0.0176, + "epoch": 0.32, + "learning_rate": 0.00025250515864407117, + "loss": 0.0189, "step": 62760 }, { - "epoch": 0.68, - "learning_rate": 0.00019821301161055977, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.0002524975909510572, + "loss": 0.0171, "step": 62770 }, { - "epoch": 0.68, - "learning_rate": 0.00019819679574495684, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.0002524900232580432, + "loss": 0.0194, "step": 62780 }, { - "epoch": 0.68, - "learning_rate": 0.00019818057987935393, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.00025248245556502917, + "loss": 0.0194, "step": 62790 }, { - "epoch": 0.68, - "learning_rate": 0.00019816436401375105, - "loss": 0.0162, + "epoch": 0.32, + "learning_rate": 0.00025247488787201515, + "loss": 0.0205, "step": 62800 }, { - "epoch": 0.68, - "learning_rate": 0.00019814814814814814, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.00025246732017900113, + "loss": 0.0176, "step": 62810 }, { - "epoch": 0.68, - "learning_rate": 0.0001981319322825452, - "loss": 0.0176, + "epoch": 0.32, + "learning_rate": 0.0002524597524859871, + "loss": 0.0207, "step": 62820 }, { - "epoch": 0.68, - "learning_rate": 0.00019811571641694233, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.00025245218479297315, + "loss": 0.0213, "step": 62830 }, { - "epoch": 0.68, - "learning_rate": 0.00019809950055133942, - "loss": 0.0176, + "epoch": 0.32, + "learning_rate": 0.00025244461709995913, + "loss": 0.0184, "step": 62840 }, { - "epoch": 0.68, - "learning_rate": 0.0001980832846857365, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.0002524370494069451, + "loss": 0.0177, "step": 62850 }, { - "epoch": 0.68, - "learning_rate": 0.00019806706882013358, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.0002524294817139311, + "loss": 0.0194, "step": 62860 }, { - "epoch": 0.68, - "learning_rate": 0.0001980508529545307, - "loss": 0.0165, + "epoch": 0.32, + "learning_rate": 0.0002524219140209171, + "loss": 0.0198, "step": 62870 }, { - "epoch": 0.68, - "learning_rate": 0.0001980346370889278, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.00025241434632790305, + "loss": 0.0249, "step": 62880 }, { - "epoch": 0.68, - "learning_rate": 0.00019801842122332488, - "loss": 0.0182, + "epoch": 0.32, + "learning_rate": 0.00025240677863488904, + "loss": 0.0195, "step": 62890 }, { - "epoch": 0.68, - "learning_rate": 0.00019800220535772198, - "loss": 0.0183, + "epoch": 0.32, + "learning_rate": 0.00025239921094187507, + "loss": 0.0195, "step": 62900 }, { - "epoch": 0.68, - "learning_rate": 0.00019798598949211907, - "loss": 0.0125, + "epoch": 0.32, + "learning_rate": 0.00025239164324886105, + "loss": 0.0169, "step": 62910 }, { - "epoch": 0.68, - "learning_rate": 0.00019796977362651616, - "loss": 0.0153, + "epoch": 0.32, + "learning_rate": 0.00025238407555584703, + "loss": 0.0203, "step": 62920 }, { - "epoch": 0.68, - "learning_rate": 0.00019795355776091328, - "loss": 0.0196, + "epoch": 0.32, + "learning_rate": 0.000252376507862833, + "loss": 0.0181, "step": 62930 }, { - "epoch": 0.68, - "learning_rate": 0.00019793734189531035, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.000252368940169819, + "loss": 0.0179, "step": 62940 }, { - "epoch": 0.68, - "learning_rate": 0.00019792112602970744, - "loss": 0.0168, + "epoch": 0.32, + "learning_rate": 0.000252361372476805, + "loss": 0.0204, "step": 62950 }, { - "epoch": 0.68, - "learning_rate": 0.00019790491016410453, - "loss": 0.0155, + "epoch": 0.32, + "learning_rate": 0.000252353804783791, + "loss": 0.0172, "step": 62960 }, { - "epoch": 0.68, - "learning_rate": 0.00019788869429850165, - "loss": 0.0191, + "epoch": 0.32, + "learning_rate": 0.000252346237090777, + "loss": 0.0169, "step": 62970 }, { - "epoch": 0.68, - "learning_rate": 0.00019787247843289872, - "loss": 0.0145, + "epoch": 0.32, + "learning_rate": 0.000252338669397763, + "loss": 0.0185, "step": 62980 }, { - "epoch": 0.68, - "learning_rate": 0.0001978562625672958, - "loss": 0.0154, + "epoch": 0.32, + "learning_rate": 0.00025233110170474896, + "loss": 0.0192, "step": 62990 }, { - "epoch": 0.68, - "learning_rate": 0.00019784004670169293, - "loss": 0.0167, + "epoch": 0.32, + "learning_rate": 0.00025232353401173494, + "loss": 0.0175, "step": 63000 }, { - "epoch": 0.68, - "eval_cer": 0.9215590728184603, - "eval_loss": 0.011219864711165428, - "eval_runtime": 121.1331, - "eval_samples_per_second": 16.511, - "eval_steps_per_second": 4.128, + "epoch": 0.32, + "eval_cer": 0.9144712262992877, + "eval_loss": 0.013699725270271301, + "eval_runtime": 116.7034, + "eval_samples_per_second": 17.137, + "eval_steps_per_second": 4.284, "step": 63000 }, { - "epoch": 0.68, - "learning_rate": 0.00019782383083609002, - "loss": 0.0196, + "epoch": 0.32, + "learning_rate": 0.0002523159663187209, + "loss": 0.0179, "step": 63010 }, { - "epoch": 0.68, - "learning_rate": 0.0001978076149704871, - "loss": 0.0175, + "epoch": 0.32, + "learning_rate": 0.00025230839862570696, + "loss": 0.0182, "step": 63020 }, { - "epoch": 0.68, - "learning_rate": 0.0001977913991048842, - "loss": 0.0162, + "epoch": 0.32, + "learning_rate": 0.00025230083093269294, + "loss": 0.0214, "step": 63030 }, { - "epoch": 0.68, - "learning_rate": 0.0001977751832392813, - "loss": 0.015, + "epoch": 0.32, + "learning_rate": 0.0002522932632396789, + "loss": 0.0225, "step": 63040 }, { - "epoch": 0.68, - "learning_rate": 0.0001977589673736784, - "loss": 0.0159, + "epoch": 0.32, + "learning_rate": 0.0002522856955466649, + "loss": 0.0154, "step": 63050 }, { - "epoch": 0.68, - "learning_rate": 0.00019774275150807546, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.0002522781278536509, + "loss": 0.0199, "step": 63060 }, { - "epoch": 0.68, - "learning_rate": 0.00019772653564247258, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.00025227056016063686, + "loss": 0.017, "step": 63070 }, { - "epoch": 0.68, - "learning_rate": 0.00019771031977686967, - "loss": 0.0167, + "epoch": 0.32, + "learning_rate": 0.00025226299246762285, + "loss": 0.0253, "step": 63080 }, { - "epoch": 0.68, - "learning_rate": 0.00019769410391126677, - "loss": 0.0153, + "epoch": 0.32, + "learning_rate": 0.0002522554247746089, + "loss": 0.0208, "step": 63090 }, { - "epoch": 0.68, - "learning_rate": 0.00019767788804566386, - "loss": 0.0155, + "epoch": 0.32, + "learning_rate": 0.00025224785708159486, + "loss": 0.0201, "step": 63100 }, { - "epoch": 0.68, - "learning_rate": 0.00019766167218006095, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.00025224028938858084, + "loss": 0.0207, "step": 63110 }, { - "epoch": 0.68, - "learning_rate": 0.00019764545631445804, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.0002522327216955668, + "loss": 0.0171, "step": 63120 }, { - "epoch": 0.68, - "learning_rate": 0.00019762924044885516, - "loss": 0.0236, + "epoch": 0.32, + "learning_rate": 0.0002522251540025528, + "loss": 0.0183, "step": 63130 }, { - "epoch": 0.68, - "learning_rate": 0.00019761302458325223, - "loss": 0.0183, + "epoch": 0.32, + "learning_rate": 0.0002522175863095388, + "loss": 0.0175, "step": 63140 }, { - "epoch": 0.68, - "learning_rate": 0.00019759680871764932, - "loss": 0.0179, + "epoch": 0.32, + "learning_rate": 0.0002522100186165248, + "loss": 0.0194, "step": 63150 }, { - "epoch": 0.68, - "learning_rate": 0.00019758059285204641, - "loss": 0.0167, + "epoch": 0.32, + "learning_rate": 0.0002522024509235108, + "loss": 0.0233, "step": 63160 }, { - "epoch": 0.68, - "learning_rate": 0.00019756437698644353, - "loss": 0.0168, + "epoch": 0.32, + "learning_rate": 0.0002521948832304968, + "loss": 0.0177, "step": 63170 }, { - "epoch": 0.68, - "learning_rate": 0.0001975481611208406, - "loss": 0.0176, + "epoch": 0.32, + "learning_rate": 0.00025218731553748277, + "loss": 0.018, "step": 63180 }, { - "epoch": 0.68, - "learning_rate": 0.0001975319452552377, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.00025217974784446875, + "loss": 0.0212, "step": 63190 }, { - "epoch": 0.68, - "learning_rate": 0.0001975157293896348, - "loss": 0.0134, + "epoch": 0.32, + "learning_rate": 0.00025217218015145473, + "loss": 0.0184, "step": 63200 }, { - "epoch": 0.68, - "learning_rate": 0.0001974995135240319, - "loss": 0.0174, + "epoch": 0.32, + "learning_rate": 0.0002521646124584407, + "loss": 0.0193, "step": 63210 }, { - "epoch": 0.68, - "learning_rate": 0.00019748329765842897, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.00025215704476542675, + "loss": 0.0268, "step": 63220 }, { - "epoch": 0.68, - "learning_rate": 0.00019746708179282606, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.00025214947707241273, + "loss": 0.0197, "step": 63230 }, { - "epoch": 0.68, - "learning_rate": 0.00019745086592722318, - "loss": 0.0211, + "epoch": 0.32, + "learning_rate": 0.0002521419093793987, + "loss": 0.019, "step": 63240 }, { - "epoch": 0.68, - "learning_rate": 0.00019743465006162028, - "loss": 0.0174, + "epoch": 0.32, + "learning_rate": 0.0002521343416863847, + "loss": 0.0178, "step": 63250 }, { - "epoch": 0.68, - "learning_rate": 0.00019741843419601734, - "loss": 0.0121, + "epoch": 0.32, + "learning_rate": 0.0002521267739933707, + "loss": 0.0218, "step": 63260 }, { - "epoch": 0.68, - "learning_rate": 0.00019740221833041446, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.00025211920630035666, + "loss": 0.0217, "step": 63270 }, { - "epoch": 0.68, - "learning_rate": 0.00019738600246481155, - "loss": 0.0151, + "epoch": 0.32, + "learning_rate": 0.0002521116386073427, + "loss": 0.0218, "step": 63280 }, { - "epoch": 0.68, - "learning_rate": 0.00019736978659920865, - "loss": 0.0172, + "epoch": 0.32, + "learning_rate": 0.0002521040709143287, + "loss": 0.02, "step": 63290 }, { - "epoch": 0.68, - "learning_rate": 0.00019735357073360577, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.00025209650322131465, + "loss": 0.0262, "step": 63300 }, { - "epoch": 0.68, - "learning_rate": 0.00019733735486800283, - "loss": 0.0171, + "epoch": 0.32, + "learning_rate": 0.00025208893552830064, + "loss": 0.0206, "step": 63310 }, { - "epoch": 0.68, - "learning_rate": 0.00019732113900239993, - "loss": 0.0141, + "epoch": 0.32, + "learning_rate": 0.0002520813678352866, + "loss": 0.019, "step": 63320 }, { - "epoch": 0.68, - "learning_rate": 0.00019730492313679705, - "loss": 0.0159, + "epoch": 0.32, + "learning_rate": 0.0002520738001422726, + "loss": 0.017, "step": 63330 }, { - "epoch": 0.68, - "learning_rate": 0.00019728870727119414, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.00025206623244925863, + "loss": 0.0216, "step": 63340 }, { - "epoch": 0.68, - "learning_rate": 0.0001972724914055912, - "loss": 0.0188, + "epoch": 0.32, + "learning_rate": 0.0002520586647562446, + "loss": 0.0183, "step": 63350 }, { - "epoch": 0.68, - "learning_rate": 0.0001972562755399883, - "loss": 0.0153, + "epoch": 0.32, + "learning_rate": 0.0002520510970632306, + "loss": 0.018, "step": 63360 }, { - "epoch": 0.69, - "learning_rate": 0.00019724005967438542, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.0002520435293702166, + "loss": 0.0185, "step": 63370 }, { - "epoch": 0.69, - "learning_rate": 0.0001972238438087825, - "loss": 0.0154, + "epoch": 0.32, + "learning_rate": 0.00025203596167720256, + "loss": 0.0206, "step": 63380 }, { - "epoch": 0.69, - "learning_rate": 0.00019720762794317958, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.00025202839398418854, + "loss": 0.0194, "step": 63390 }, { - "epoch": 0.69, - "learning_rate": 0.0001971914120775767, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.0002520208262911745, + "loss": 0.0273, "step": 63400 }, { - "epoch": 0.69, - "learning_rate": 0.0001971751962119738, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.00025201325859816056, + "loss": 0.0179, "step": 63410 }, { - "epoch": 0.69, - "learning_rate": 0.00019715898034637088, - "loss": 0.0146, + "epoch": 0.32, + "learning_rate": 0.00025200569090514654, + "loss": 0.0242, "step": 63420 }, { - "epoch": 0.69, - "learning_rate": 0.00019714276448076795, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.0002519981232121325, + "loss": 0.0193, "step": 63430 }, { - "epoch": 0.69, - "learning_rate": 0.00019712654861516507, - "loss": 0.013, + "epoch": 0.32, + "learning_rate": 0.0002519905555191185, + "loss": 0.0194, "step": 63440 }, { - "epoch": 0.69, - "learning_rate": 0.00019711033274956216, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.0002519829878261045, + "loss": 0.0235, "step": 63450 }, { - "epoch": 0.69, - "learning_rate": 0.00019709411688395925, - "loss": 0.0162, + "epoch": 0.32, + "learning_rate": 0.00025197542013309047, + "loss": 0.0206, "step": 63460 }, { - "epoch": 0.69, - "learning_rate": 0.00019707790101835634, - "loss": 0.0153, + "epoch": 0.32, + "learning_rate": 0.0002519678524400765, + "loss": 0.0165, "step": 63470 }, { - "epoch": 0.69, - "learning_rate": 0.00019706168515275344, - "loss": 0.0128, + "epoch": 0.32, + "learning_rate": 0.00025196028474706243, + "loss": 0.0186, "step": 63480 }, { - "epoch": 0.69, - "learning_rate": 0.00019704546928715053, - "loss": 0.0172, + "epoch": 0.32, + "learning_rate": 0.0002519527170540484, + "loss": 0.0216, "step": 63490 }, { - "epoch": 0.69, - "learning_rate": 0.00019702925342154765, - "loss": 0.0128, + "epoch": 0.32, + "learning_rate": 0.0002519451493610344, + "loss": 0.0175, "step": 63500 }, { - "epoch": 0.69, - "learning_rate": 0.00019701303755594472, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.00025193758166802043, + "loss": 0.0144, "step": 63510 }, { - "epoch": 0.69, - "learning_rate": 0.0001969968216903418, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.0002519300139750064, + "loss": 0.0219, "step": 63520 }, { - "epoch": 0.69, - "learning_rate": 0.0001969806058247389, - "loss": 0.0136, + "epoch": 0.32, + "learning_rate": 0.0002519224462819924, + "loss": 0.0196, "step": 63530 }, { - "epoch": 0.69, - "learning_rate": 0.00019696438995913602, - "loss": 0.0134, + "epoch": 0.32, + "learning_rate": 0.00025191487858897837, + "loss": 0.0194, "step": 63540 }, { - "epoch": 0.69, - "learning_rate": 0.00019694817409353309, - "loss": 0.0148, + "epoch": 0.32, + "learning_rate": 0.00025190731089596435, + "loss": 0.0176, "step": 63550 }, { - "epoch": 0.69, - "learning_rate": 0.00019693195822793018, - "loss": 0.0165, + "epoch": 0.32, + "learning_rate": 0.00025189974320295034, + "loss": 0.0203, "step": 63560 }, { - "epoch": 0.69, - "learning_rate": 0.0001969157423623273, - "loss": 0.0159, + "epoch": 0.32, + "learning_rate": 0.00025189217550993637, + "loss": 0.0162, "step": 63570 }, { - "epoch": 0.69, - "learning_rate": 0.0001968995264967244, - "loss": 0.0146, + "epoch": 0.32, + "learning_rate": 0.00025188460781692235, + "loss": 0.0185, "step": 63580 }, { - "epoch": 0.69, - "learning_rate": 0.00019688331063112146, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.00025187704012390833, + "loss": 0.0205, "step": 63590 }, { - "epoch": 0.69, - "learning_rate": 0.00019686709476551855, - "loss": 0.0189, + "epoch": 0.32, + "learning_rate": 0.0002518694724308943, + "loss": 0.023, "step": 63600 }, { - "epoch": 0.69, - "learning_rate": 0.00019685087889991567, - "loss": 0.0131, + "epoch": 0.32, + "learning_rate": 0.0002518619047378803, + "loss": 0.0245, "step": 63610 }, { - "epoch": 0.69, - "learning_rate": 0.00019683466303431276, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.0002518543370448663, + "loss": 0.0177, "step": 63620 }, { - "epoch": 0.69, - "learning_rate": 0.00019681844716870983, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.00025184676935185226, + "loss": 0.0182, "step": 63630 }, { - "epoch": 0.69, - "learning_rate": 0.00019680223130310695, - "loss": 0.0192, + "epoch": 0.32, + "learning_rate": 0.0002518392016588383, + "loss": 0.0235, "step": 63640 }, { - "epoch": 0.69, - "learning_rate": 0.00019678601543750404, - "loss": 0.0166, + "epoch": 0.32, + "learning_rate": 0.0002518316339658243, + "loss": 0.0185, "step": 63650 }, { - "epoch": 0.69, - "learning_rate": 0.00019676979957190113, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.00025182406627281026, + "loss": 0.02, "step": 63660 }, { - "epoch": 0.69, - "learning_rate": 0.0001967535837062982, - "loss": 0.0153, + "epoch": 0.32, + "learning_rate": 0.00025181649857979624, + "loss": 0.0162, "step": 63670 }, { - "epoch": 0.69, - "learning_rate": 0.00019673736784069532, - "loss": 0.0194, + "epoch": 0.32, + "learning_rate": 0.0002518089308867822, + "loss": 0.0181, "step": 63680 }, { - "epoch": 0.69, - "learning_rate": 0.0001967211519750924, - "loss": 0.0137, + "epoch": 0.32, + "learning_rate": 0.0002518013631937682, + "loss": 0.0192, "step": 63690 }, { - "epoch": 0.69, - "learning_rate": 0.00019670493610948953, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.00025179379550075424, + "loss": 0.0192, "step": 63700 }, { - "epoch": 0.69, - "learning_rate": 0.0001966887202438866, - "loss": 0.0186, + "epoch": 0.32, + "learning_rate": 0.0002517862278077402, + "loss": 0.0164, "step": 63710 }, { - "epoch": 0.69, - "learning_rate": 0.0001966725043782837, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.0002517786601147262, + "loss": 0.0164, "step": 63720 }, { - "epoch": 0.69, - "learning_rate": 0.00019665628851268078, - "loss": 0.0165, + "epoch": 0.32, + "learning_rate": 0.0002517710924217122, + "loss": 0.0245, "step": 63730 }, { - "epoch": 0.69, - "learning_rate": 0.0001966400726470779, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.00025176352472869816, + "loss": 0.0178, "step": 63740 }, { - "epoch": 0.69, - "learning_rate": 0.00019662385678147497, - "loss": 0.0128, + "epoch": 0.32, + "learning_rate": 0.00025175595703568415, + "loss": 0.0236, "step": 63750 }, { - "epoch": 0.69, - "learning_rate": 0.00019660764091587206, - "loss": 0.0166, + "epoch": 0.32, + "learning_rate": 0.0002517483893426702, + "loss": 0.026, "step": 63760 }, { - "epoch": 0.69, - "learning_rate": 0.00019659142505026918, - "loss": 0.0202, + "epoch": 0.32, + "learning_rate": 0.00025174082164965616, + "loss": 0.0185, "step": 63770 }, { - "epoch": 0.69, - "learning_rate": 0.00019657520918466627, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.00025173325395664214, + "loss": 0.021, "step": 63780 }, { - "epoch": 0.69, - "learning_rate": 0.00019655899331906334, - "loss": 0.0179, + "epoch": 0.32, + "learning_rate": 0.0002517256862636281, + "loss": 0.026, "step": 63790 }, { - "epoch": 0.69, - "learning_rate": 0.00019654277745346043, - "loss": 0.0165, + "epoch": 0.32, + "learning_rate": 0.0002517181185706141, + "loss": 0.0196, "step": 63800 }, { - "epoch": 0.69, - "learning_rate": 0.00019652656158785755, - "loss": 0.0169, + "epoch": 0.32, + "learning_rate": 0.0002517105508776001, + "loss": 0.0189, "step": 63810 }, { - "epoch": 0.69, - "learning_rate": 0.00019651034572225464, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.00025170298318458607, + "loss": 0.0193, "step": 63820 }, { - "epoch": 0.69, - "learning_rate": 0.0001964941298566517, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.0002516954154915721, + "loss": 0.0167, "step": 63830 }, { - "epoch": 0.69, - "learning_rate": 0.00019647791399104883, - "loss": 0.0172, + "epoch": 0.32, + "learning_rate": 0.0002516878477985581, + "loss": 0.0204, "step": 63840 }, { - "epoch": 0.69, - "learning_rate": 0.00019646169812544592, - "loss": 0.0197, + "epoch": 0.32, + "learning_rate": 0.00025168028010554407, + "loss": 0.0162, "step": 63850 }, { - "epoch": 0.69, - "learning_rate": 0.00019644548225984302, - "loss": 0.0162, + "epoch": 0.32, + "learning_rate": 0.00025167271241253005, + "loss": 0.0192, "step": 63860 }, { - "epoch": 0.69, - "learning_rate": 0.00019642926639424008, - "loss": 0.0172, + "epoch": 0.32, + "learning_rate": 0.00025166514471951603, + "loss": 0.0227, "step": 63870 }, { - "epoch": 0.69, - "learning_rate": 0.0001964130505286372, - "loss": 0.0145, + "epoch": 0.32, + "learning_rate": 0.000251657577026502, + "loss": 0.0194, "step": 63880 }, { - "epoch": 0.69, - "learning_rate": 0.0001963968346630343, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.00025165000933348805, + "loss": 0.0164, "step": 63890 }, { - "epoch": 0.69, - "learning_rate": 0.00019638061879743139, - "loss": 0.0165, + "epoch": 0.32, + "learning_rate": 0.00025164244164047403, + "loss": 0.0176, "step": 63900 }, { - "epoch": 0.69, - "learning_rate": 0.00019636440293182848, - "loss": 0.019, + "epoch": 0.32, + "learning_rate": 0.00025163487394746, + "loss": 0.0207, "step": 63910 }, { - "epoch": 0.69, - "learning_rate": 0.00019634818706622557, - "loss": 0.0141, + "epoch": 0.32, + "learning_rate": 0.000251627306254446, + "loss": 0.019, "step": 63920 }, { - "epoch": 0.69, - "learning_rate": 0.00019633197120062266, - "loss": 0.0151, + "epoch": 0.32, + "learning_rate": 0.000251619738561432, + "loss": 0.021, "step": 63930 }, { - "epoch": 0.69, - "learning_rate": 0.00019631575533501978, - "loss": 0.0172, + "epoch": 0.32, + "learning_rate": 0.00025161217086841796, + "loss": 0.0194, "step": 63940 }, { - "epoch": 0.69, - "learning_rate": 0.00019629953946941685, - "loss": 0.0167, + "epoch": 0.32, + "learning_rate": 0.00025160460317540394, + "loss": 0.0205, "step": 63950 }, { - "epoch": 0.69, - "learning_rate": 0.00019628332360381394, - "loss": 0.0155, + "epoch": 0.32, + "learning_rate": 0.00025159703548238997, + "loss": 0.02, "step": 63960 }, { - "epoch": 0.69, - "learning_rate": 0.00019626710773821104, - "loss": 0.013, + "epoch": 0.32, + "learning_rate": 0.00025158946778937595, + "loss": 0.026, "step": 63970 }, { - "epoch": 0.69, - "learning_rate": 0.00019625089187260816, - "loss": 0.015, + "epoch": 0.32, + "learning_rate": 0.00025158190009636194, + "loss": 0.0201, "step": 63980 }, { - "epoch": 0.69, - "learning_rate": 0.00019623467600700522, - "loss": 0.012, + "epoch": 0.32, + "learning_rate": 0.0002515743324033479, + "loss": 0.0206, "step": 63990 }, { - "epoch": 0.69, - "learning_rate": 0.00019621846014140231, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.0002515667647103339, + "loss": 0.0207, "step": 64000 }, { - "epoch": 0.69, - "eval_cer": 0.9215434379652454, - "eval_loss": 0.01114691887050867, - "eval_runtime": 121.2239, - "eval_samples_per_second": 16.498, - "eval_steps_per_second": 4.125, + "epoch": 0.32, + "eval_cer": 0.9144692855070369, + "eval_loss": 0.01427229680120945, + "eval_runtime": 116.7184, + "eval_samples_per_second": 17.135, + "eval_steps_per_second": 4.284, "step": 64000 }, { - "epoch": 0.69, - "learning_rate": 0.00019620224427579943, - "loss": 0.016, + "epoch": 0.32, + "learning_rate": 0.0002515591970173199, + "loss": 0.0165, "step": 64010 }, { - "epoch": 0.69, - "learning_rate": 0.00019618602841019653, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.0002515516293243059, + "loss": 0.0222, "step": 64020 }, { - "epoch": 0.69, - "learning_rate": 0.00019616981254459362, - "loss": 0.0171, + "epoch": 0.32, + "learning_rate": 0.0002515440616312919, + "loss": 0.0173, "step": 64030 }, { - "epoch": 0.69, - "learning_rate": 0.0001961535966789907, - "loss": 0.0209, + "epoch": 0.32, + "learning_rate": 0.0002515364939382779, + "loss": 0.0215, "step": 64040 }, { - "epoch": 0.69, - "learning_rate": 0.0001961373808133878, - "loss": 0.0122, + "epoch": 0.32, + "learning_rate": 0.00025152892624526386, + "loss": 0.0197, "step": 64050 }, { - "epoch": 0.69, - "learning_rate": 0.0001961211649477849, - "loss": 0.016, + "epoch": 0.32, + "learning_rate": 0.00025152135855224984, + "loss": 0.0208, "step": 64060 }, { - "epoch": 0.69, - "learning_rate": 0.00019610494908218202, - "loss": 0.0133, + "epoch": 0.32, + "learning_rate": 0.0002515137908592358, + "loss": 0.0194, "step": 64070 }, { - "epoch": 0.69, - "learning_rate": 0.00019608873321657908, - "loss": 0.0137, + "epoch": 0.32, + "learning_rate": 0.00025150622316622186, + "loss": 0.023, "step": 64080 }, { - "epoch": 0.69, - "learning_rate": 0.00019607251735097618, - "loss": 0.0141, + "epoch": 0.32, + "learning_rate": 0.00025149865547320784, + "loss": 0.0217, "step": 64090 }, { - "epoch": 0.69, - "learning_rate": 0.00019605630148537327, - "loss": 0.0166, + "epoch": 0.32, + "learning_rate": 0.0002514910877801938, + "loss": 0.0243, "step": 64100 }, { - "epoch": 0.69, - "learning_rate": 0.0001960400856197704, - "loss": 0.017, + "epoch": 0.32, + "learning_rate": 0.0002514835200871798, + "loss": 0.0202, "step": 64110 }, { - "epoch": 0.69, - "learning_rate": 0.00019602386975416745, - "loss": 0.0189, + "epoch": 0.32, + "learning_rate": 0.0002514759523941658, + "loss": 0.0224, "step": 64120 }, { - "epoch": 0.69, - "learning_rate": 0.00019600765388856455, - "loss": 0.0164, + "epoch": 0.32, + "learning_rate": 0.00025146838470115177, + "loss": 0.0198, "step": 64130 }, { - "epoch": 0.69, - "learning_rate": 0.00019599143802296167, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.00025146081700813775, + "loss": 0.0193, "step": 64140 }, { - "epoch": 0.69, - "learning_rate": 0.00019597522215735876, - "loss": 0.0165, + "epoch": 0.32, + "learning_rate": 0.0002514532493151238, + "loss": 0.0202, "step": 64150 }, { - "epoch": 0.69, - "learning_rate": 0.00019595900629175582, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.00025144568162210976, + "loss": 0.0202, "step": 64160 }, { - "epoch": 0.69, - "learning_rate": 0.00019594279042615292, - "loss": 0.0115, + "epoch": 0.32, + "learning_rate": 0.00025143811392909575, + "loss": 0.0187, "step": 64170 }, { - "epoch": 0.69, - "learning_rate": 0.00019592657456055004, - "loss": 0.0179, + "epoch": 0.32, + "learning_rate": 0.0002514305462360817, + "loss": 0.0184, "step": 64180 }, { - "epoch": 0.69, - "learning_rate": 0.00019591035869494713, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.0002514229785430677, + "loss": 0.02, "step": 64190 }, { - "epoch": 0.69, - "learning_rate": 0.0001958941428293442, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.0002514154108500537, + "loss": 0.025, "step": 64200 }, { - "epoch": 0.69, - "learning_rate": 0.00019587792696374132, - "loss": 0.0166, + "epoch": 0.32, + "learning_rate": 0.0002514078431570397, + "loss": 0.0195, "step": 64210 }, { - "epoch": 0.69, - "learning_rate": 0.0001958617110981384, - "loss": 0.017, + "epoch": 0.32, + "learning_rate": 0.0002514002754640257, + "loss": 0.0231, "step": 64220 }, { - "epoch": 0.69, - "learning_rate": 0.0001958454952325355, - "loss": 0.0146, + "epoch": 0.32, + "learning_rate": 0.0002513927077710117, + "loss": 0.0199, "step": 64230 }, { - "epoch": 0.69, - "learning_rate": 0.00019582927936693257, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.00025138514007799767, + "loss": 0.0214, "step": 64240 }, { - "epoch": 0.69, - "learning_rate": 0.0001958130635013297, - "loss": 0.0195, + "epoch": 0.32, + "learning_rate": 0.00025137757238498365, + "loss": 0.0217, "step": 64250 }, { - "epoch": 0.69, - "learning_rate": 0.00019579684763572678, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.00025137000469196963, + "loss": 0.0174, "step": 64260 }, { - "epoch": 0.69, - "learning_rate": 0.0001957806317701239, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.0002513624369989556, + "loss": 0.0192, "step": 64270 }, { - "epoch": 0.69, - "learning_rate": 0.00019576441590452096, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.00025135486930594165, + "loss": 0.0185, "step": 64280 }, { - "epoch": 0.7, - "learning_rate": 0.00019574820003891806, - "loss": 0.016, + "epoch": 0.32, + "learning_rate": 0.00025134730161292763, + "loss": 0.0229, "step": 64290 }, { - "epoch": 0.7, - "learning_rate": 0.00019573198417331515, - "loss": 0.0167, + "epoch": 0.32, + "learning_rate": 0.0002513397339199136, + "loss": 0.017, "step": 64300 }, { - "epoch": 0.7, - "learning_rate": 0.00019571576830771227, - "loss": 0.018, + "epoch": 0.32, + "learning_rate": 0.0002513321662268996, + "loss": 0.0185, "step": 64310 }, { - "epoch": 0.7, - "learning_rate": 0.00019569955244210934, - "loss": 0.0151, + "epoch": 0.32, + "learning_rate": 0.0002513245985338856, + "loss": 0.0183, "step": 64320 }, { - "epoch": 0.7, - "learning_rate": 0.00019568333657650643, - "loss": 0.0164, + "epoch": 0.32, + "learning_rate": 0.00025131703084087156, + "loss": 0.0173, "step": 64330 }, { - "epoch": 0.7, - "learning_rate": 0.00019566712071090355, - "loss": 0.0162, + "epoch": 0.32, + "learning_rate": 0.0002513094631478576, + "loss": 0.0164, "step": 64340 }, { - "epoch": 0.7, - "learning_rate": 0.00019565090484530064, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.0002513018954548436, + "loss": 0.0207, "step": 64350 }, { - "epoch": 0.7, - "learning_rate": 0.0001956346889796977, - "loss": 0.0171, + "epoch": 0.32, + "learning_rate": 0.00025129432776182956, + "loss": 0.0264, "step": 64360 }, { - "epoch": 0.7, - "learning_rate": 0.0001956184731140948, - "loss": 0.0144, + "epoch": 0.32, + "learning_rate": 0.00025128676006881554, + "loss": 0.0207, "step": 64370 }, { - "epoch": 0.7, - "learning_rate": 0.00019560225724849192, - "loss": 0.0153, + "epoch": 0.32, + "learning_rate": 0.0002512791923758015, + "loss": 0.0179, "step": 64380 }, { - "epoch": 0.7, - "learning_rate": 0.000195586041382889, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.0002512716246827875, + "loss": 0.0248, "step": 64390 }, { - "epoch": 0.7, - "learning_rate": 0.00019556982551728608, - "loss": 0.0177, + "epoch": 0.32, + "learning_rate": 0.00025126405698977354, + "loss": 0.0193, "step": 64400 }, { - "epoch": 0.7, - "learning_rate": 0.0001955536096516832, - "loss": 0.0153, + "epoch": 0.32, + "learning_rate": 0.0002512564892967595, + "loss": 0.0179, "step": 64410 }, { - "epoch": 0.7, - "learning_rate": 0.0001955373937860803, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.0002512489216037455, + "loss": 0.0197, "step": 64420 }, { - "epoch": 0.7, - "learning_rate": 0.00019552117792047738, - "loss": 0.0178, + "epoch": 0.33, + "learning_rate": 0.0002512413539107315, + "loss": 0.0235, "step": 64430 }, { - "epoch": 0.7, - "learning_rate": 0.00019550496205487445, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.00025123378621771746, + "loss": 0.0195, "step": 64440 }, { - "epoch": 0.7, - "learning_rate": 0.00019548874618927157, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.00025122621852470344, + "loss": 0.0293, "step": 64450 }, { - "epoch": 0.7, - "learning_rate": 0.00019547253032366866, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.0002512186508316894, + "loss": 0.0289, "step": 64460 }, { - "epoch": 0.7, - "learning_rate": 0.00019545631445806575, - "loss": 0.0178, + "epoch": 0.33, + "learning_rate": 0.00025121108313867546, + "loss": 0.0181, "step": 64470 }, { - "epoch": 0.7, - "learning_rate": 0.00019544009859246285, - "loss": 0.014, + "epoch": 0.33, + "learning_rate": 0.00025120351544566144, + "loss": 0.0183, "step": 64480 }, { - "epoch": 0.7, - "learning_rate": 0.00019542388272685994, - "loss": 0.0156, + "epoch": 0.33, + "learning_rate": 0.0002511959477526474, + "loss": 0.0162, "step": 64490 }, { - "epoch": 0.7, - "learning_rate": 0.00019540766686125703, - "loss": 0.0158, + "epoch": 0.33, + "learning_rate": 0.0002511883800596334, + "loss": 0.0201, "step": 64500 }, { - "epoch": 0.7, - "learning_rate": 0.00019539145099565415, - "loss": 0.0144, + "epoch": 0.33, + "learning_rate": 0.0002511808123666194, + "loss": 0.0186, "step": 64510 }, { - "epoch": 0.7, - "learning_rate": 0.00019537523513005122, - "loss": 0.0182, + "epoch": 0.33, + "learning_rate": 0.00025117324467360537, + "loss": 0.0194, "step": 64520 }, { - "epoch": 0.7, - "learning_rate": 0.0001953590192644483, - "loss": 0.0151, + "epoch": 0.33, + "learning_rate": 0.0002511656769805914, + "loss": 0.0168, "step": 64530 }, { - "epoch": 0.7, - "learning_rate": 0.0001953428033988454, - "loss": 0.0177, + "epoch": 0.33, + "learning_rate": 0.0002511581092875774, + "loss": 0.0238, "step": 64540 }, { - "epoch": 0.7, - "learning_rate": 0.00019532658753324252, - "loss": 0.0162, + "epoch": 0.33, + "learning_rate": 0.00025115054159456337, + "loss": 0.0161, "step": 64550 }, { - "epoch": 0.7, - "learning_rate": 0.0001953103716676396, - "loss": 0.0154, + "epoch": 0.33, + "learning_rate": 0.00025114297390154935, + "loss": 0.0203, "step": 64560 }, { - "epoch": 0.7, - "learning_rate": 0.00019529415580203668, - "loss": 0.0195, + "epoch": 0.33, + "learning_rate": 0.00025113540620853533, + "loss": 0.0205, "step": 64570 }, { - "epoch": 0.7, - "learning_rate": 0.0001952779399364338, - "loss": 0.0183, + "epoch": 0.33, + "learning_rate": 0.0002511278385155213, + "loss": 0.0244, "step": 64580 }, { - "epoch": 0.7, - "learning_rate": 0.0001952617240708309, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.00025112027082250735, + "loss": 0.0203, "step": 64590 }, { - "epoch": 0.7, - "learning_rate": 0.00019524550820522796, - "loss": 0.0135, + "epoch": 0.33, + "learning_rate": 0.0002511127031294933, + "loss": 0.0182, "step": 64600 }, { - "epoch": 0.7, - "learning_rate": 0.00019522929233962505, - "loss": 0.0145, + "epoch": 0.33, + "learning_rate": 0.0002511051354364793, + "loss": 0.0192, "step": 64610 }, { - "epoch": 0.7, - "learning_rate": 0.00019521307647402217, - "loss": 0.0136, + "epoch": 0.33, + "learning_rate": 0.0002510975677434653, + "loss": 0.0247, "step": 64620 }, { - "epoch": 0.7, - "learning_rate": 0.00019519686060841927, - "loss": 0.0145, + "epoch": 0.33, + "learning_rate": 0.00025109000005045127, + "loss": 0.019, "step": 64630 }, { - "epoch": 0.7, - "learning_rate": 0.00019518064474281633, - "loss": 0.0173, + "epoch": 0.33, + "learning_rate": 0.00025108243235743725, + "loss": 0.0199, "step": 64640 }, { - "epoch": 0.7, - "learning_rate": 0.00019516442887721345, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.00025107486466442323, + "loss": 0.0221, "step": 64650 }, { - "epoch": 0.7, - "learning_rate": 0.00019514821301161054, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.00025106729697140927, + "loss": 0.022, "step": 64660 }, { - "epoch": 0.7, - "learning_rate": 0.00019513199714600764, - "loss": 0.0193, + "epoch": 0.33, + "learning_rate": 0.00025105972927839525, + "loss": 0.0178, "step": 64670 }, { - "epoch": 0.7, - "learning_rate": 0.0001951157812804047, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.00025105216158538123, + "loss": 0.0156, "step": 64680 }, { - "epoch": 0.7, - "learning_rate": 0.00019509956541480182, - "loss": 0.0138, + "epoch": 0.33, + "learning_rate": 0.0002510445938923672, + "loss": 0.0192, "step": 64690 }, { - "epoch": 0.7, - "learning_rate": 0.00019508334954919891, - "loss": 0.0201, + "epoch": 0.33, + "learning_rate": 0.0002510370261993532, + "loss": 0.017, "step": 64700 }, { - "epoch": 0.7, - "learning_rate": 0.00019506713368359603, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.0002510294585063392, + "loss": 0.02, "step": 64710 }, { - "epoch": 0.7, - "learning_rate": 0.0001950509178179931, - "loss": 0.0166, + "epoch": 0.33, + "learning_rate": 0.0002510218908133252, + "loss": 0.0199, "step": 64720 }, { - "epoch": 0.7, - "learning_rate": 0.0001950347019523902, - "loss": 0.0165, + "epoch": 0.33, + "learning_rate": 0.00025101432312031114, + "loss": 0.0203, "step": 64730 }, { - "epoch": 0.7, - "learning_rate": 0.00019501848608678729, - "loss": 0.0143, + "epoch": 0.33, + "learning_rate": 0.0002510067554272971, + "loss": 0.0215, "step": 64740 }, { - "epoch": 0.7, - "learning_rate": 0.0001950022702211844, - "loss": 0.0193, + "epoch": 0.33, + "learning_rate": 0.0002509991877342831, + "loss": 0.0181, "step": 64750 }, { - "epoch": 0.7, - "learning_rate": 0.0001949860543555815, - "loss": 0.0122, + "epoch": 0.33, + "learning_rate": 0.00025099162004126914, + "loss": 0.0206, "step": 64760 }, { - "epoch": 0.7, - "learning_rate": 0.00019496983848997856, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.0002509840523482551, + "loss": 0.0202, "step": 64770 }, { - "epoch": 0.7, - "learning_rate": 0.00019495362262437568, - "loss": 0.0144, + "epoch": 0.33, + "learning_rate": 0.0002509764846552411, + "loss": 0.0167, "step": 64780 }, { - "epoch": 0.7, - "learning_rate": 0.00019493740675877278, - "loss": 0.019, + "epoch": 0.33, + "learning_rate": 0.0002509689169622271, + "loss": 0.0165, "step": 64790 }, { - "epoch": 0.7, - "learning_rate": 0.00019492119089316987, - "loss": 0.0156, + "epoch": 0.33, + "learning_rate": 0.00025096134926921306, + "loss": 0.022, "step": 64800 }, { - "epoch": 0.7, - "learning_rate": 0.00019490497502756693, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.00025095378157619905, + "loss": 0.018, "step": 64810 }, { - "epoch": 0.7, - "learning_rate": 0.00019488875916196405, - "loss": 0.0152, + "epoch": 0.33, + "learning_rate": 0.0002509462138831851, + "loss": 0.0163, "step": 64820 }, { - "epoch": 0.7, - "learning_rate": 0.00019487254329636115, - "loss": 0.0171, + "epoch": 0.33, + "learning_rate": 0.00025093864619017106, + "loss": 0.0179, "step": 64830 }, { - "epoch": 0.7, - "learning_rate": 0.00019485632743075824, - "loss": 0.0206, + "epoch": 0.33, + "learning_rate": 0.00025093107849715704, + "loss": 0.0198, "step": 64840 }, { - "epoch": 0.7, - "learning_rate": 0.00019484011156515533, - "loss": 0.0173, + "epoch": 0.33, + "learning_rate": 0.000250923510804143, + "loss": 0.015, "step": 64850 }, { - "epoch": 0.7, - "learning_rate": 0.00019482389569955243, - "loss": 0.0182, + "epoch": 0.33, + "learning_rate": 0.000250915943111129, + "loss": 0.0222, "step": 64860 }, { - "epoch": 0.7, - "learning_rate": 0.00019480767983394952, - "loss": 0.0126, + "epoch": 0.33, + "learning_rate": 0.000250908375418115, + "loss": 0.022, "step": 64870 }, { - "epoch": 0.7, - "learning_rate": 0.00019479146396834664, - "loss": 0.0155, + "epoch": 0.33, + "learning_rate": 0.00025090080772510097, + "loss": 0.0169, "step": 64880 }, { - "epoch": 0.7, - "learning_rate": 0.0001947752481027437, - "loss": 0.0238, + "epoch": 0.33, + "learning_rate": 0.000250893240032087, + "loss": 0.0217, "step": 64890 }, { - "epoch": 0.7, - "learning_rate": 0.0001947590322371408, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.000250885672339073, + "loss": 0.0205, "step": 64900 }, { - "epoch": 0.7, - "learning_rate": 0.0001947428163715379, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.00025087810464605897, + "loss": 0.0174, "step": 64910 }, { - "epoch": 0.7, - "learning_rate": 0.000194726600505935, - "loss": 0.0145, + "epoch": 0.33, + "learning_rate": 0.00025087053695304495, + "loss": 0.0171, "step": 64920 }, { - "epoch": 0.7, - "learning_rate": 0.00019471038464033207, - "loss": 0.012, + "epoch": 0.33, + "learning_rate": 0.00025086296926003093, + "loss": 0.0178, "step": 64930 }, { - "epoch": 0.7, - "learning_rate": 0.00019469416877472917, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.0002508554015670169, + "loss": 0.0178, "step": 64940 }, { - "epoch": 0.7, - "learning_rate": 0.0001946779529091263, - "loss": 0.0167, + "epoch": 0.33, + "learning_rate": 0.00025084783387400295, + "loss": 0.0192, "step": 64950 }, { - "epoch": 0.7, - "learning_rate": 0.00019466173704352338, - "loss": 0.0123, + "epoch": 0.33, + "learning_rate": 0.00025084026618098893, + "loss": 0.0181, "step": 64960 }, { - "epoch": 0.7, - "learning_rate": 0.00019464552117792045, - "loss": 0.0177, + "epoch": 0.33, + "learning_rate": 0.0002508326984879749, + "loss": 0.0183, "step": 64970 }, { - "epoch": 0.7, - "learning_rate": 0.00019462930531231754, - "loss": 0.0124, + "epoch": 0.33, + "learning_rate": 0.0002508251307949609, + "loss": 0.0263, "step": 64980 }, { - "epoch": 0.7, - "learning_rate": 0.00019461308944671466, - "loss": 0.0137, + "epoch": 0.33, + "learning_rate": 0.0002508175631019469, + "loss": 0.0171, "step": 64990 }, { - "epoch": 0.7, - "learning_rate": 0.00019459687358111175, - "loss": 0.0128, + "epoch": 0.33, + "learning_rate": 0.00025080999540893286, + "loss": 0.021, "step": 65000 }, { - "epoch": 0.7, - "eval_cer": 0.921535620538638, - "eval_loss": 0.011012510396540165, - "eval_runtime": 121.262, - "eval_samples_per_second": 16.493, - "eval_steps_per_second": 4.123, + "epoch": 0.33, + "eval_cer": 0.9144857822411687, + "eval_loss": 0.013442865572869778, + "eval_runtime": 116.7164, + "eval_samples_per_second": 17.136, + "eval_steps_per_second": 4.284, "step": 65000 }, { - "epoch": 0.7, - "learning_rate": 0.00019458065771550882, - "loss": 0.0179, + "epoch": 0.33, + "learning_rate": 0.00025080242771591884, + "loss": 0.022, "step": 65010 }, { - "epoch": 0.7, - "learning_rate": 0.00019456444184990594, - "loss": 0.0162, + "epoch": 0.33, + "learning_rate": 0.00025079486002290487, + "loss": 0.0164, "step": 65020 }, { - "epoch": 0.7, - "learning_rate": 0.00019454822598430303, - "loss": 0.0159, + "epoch": 0.33, + "learning_rate": 0.00025078729232989085, + "loss": 0.0209, "step": 65030 }, { - "epoch": 0.7, - "learning_rate": 0.00019453201011870012, - "loss": 0.0121, + "epoch": 0.33, + "learning_rate": 0.00025077972463687684, + "loss": 0.0224, "step": 65040 }, { - "epoch": 0.7, - "learning_rate": 0.00019451579425309721, - "loss": 0.0147, + "epoch": 0.33, + "learning_rate": 0.0002507721569438628, + "loss": 0.0178, "step": 65050 }, { - "epoch": 0.7, - "learning_rate": 0.0001944995783874943, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.0002507645892508488, + "loss": 0.0205, "step": 65060 }, { - "epoch": 0.7, - "learning_rate": 0.0001944833625218914, - "loss": 0.0135, + "epoch": 0.33, + "learning_rate": 0.0002507570215578348, + "loss": 0.0205, "step": 65070 }, { - "epoch": 0.7, - "learning_rate": 0.00019446714665628852, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.0002507494538648208, + "loss": 0.0166, "step": 65080 }, { - "epoch": 0.7, - "learning_rate": 0.00019445093079068559, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.0002507418861718068, + "loss": 0.0141, "step": 65090 }, { - "epoch": 0.7, - "learning_rate": 0.00019443471492508268, - "loss": 0.0205, + "epoch": 0.33, + "learning_rate": 0.0002507343184787928, + "loss": 0.0224, "step": 65100 }, { - "epoch": 0.7, - "learning_rate": 0.00019441849905947977, - "loss": 0.0176, + "epoch": 0.33, + "learning_rate": 0.00025072675078577876, + "loss": 0.0191, "step": 65110 }, { - "epoch": 0.7, - "learning_rate": 0.0001944022831938769, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.00025071918309276474, + "loss": 0.0214, "step": 65120 }, { - "epoch": 0.7, - "learning_rate": 0.00019438606732827396, - "loss": 0.0138, + "epoch": 0.33, + "learning_rate": 0.0002507116153997507, + "loss": 0.0147, "step": 65130 }, { - "epoch": 0.7, - "learning_rate": 0.00019436985146267105, - "loss": 0.0166, + "epoch": 0.33, + "learning_rate": 0.00025070404770673676, + "loss": 0.0176, "step": 65140 }, { - "epoch": 0.7, - "learning_rate": 0.00019435363559706817, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.00025069648001372274, + "loss": 0.0168, "step": 65150 }, { - "epoch": 0.7, - "learning_rate": 0.00019433741973146526, - "loss": 0.0168, + "epoch": 0.33, + "learning_rate": 0.0002506889123207087, + "loss": 0.0155, "step": 65160 }, { - "epoch": 0.7, - "learning_rate": 0.00019432120386586233, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.0002506813446276947, + "loss": 0.0203, "step": 65170 }, { - "epoch": 0.7, - "learning_rate": 0.00019430498800025942, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.0002506737769346807, + "loss": 0.0213, "step": 65180 }, { - "epoch": 0.7, - "learning_rate": 0.00019428877213465654, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.00025066620924166667, + "loss": 0.0169, "step": 65190 }, { - "epoch": 0.7, - "learning_rate": 0.00019427255626905363, - "loss": 0.0154, + "epoch": 0.33, + "learning_rate": 0.00025065864154865265, + "loss": 0.0197, "step": 65200 }, { - "epoch": 0.7, - "learning_rate": 0.0001942563404034507, - "loss": 0.0154, + "epoch": 0.33, + "learning_rate": 0.0002506510738556387, + "loss": 0.0235, "step": 65210 }, { - "epoch": 0.71, - "learning_rate": 0.00019424012453784782, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.00025064350616262466, + "loss": 0.016, "step": 65220 }, { - "epoch": 0.71, - "learning_rate": 0.0001942239086722449, - "loss": 0.0145, + "epoch": 0.33, + "learning_rate": 0.00025063593846961065, + "loss": 0.0189, "step": 65230 }, { - "epoch": 0.71, - "learning_rate": 0.000194207692806642, - "loss": 0.0179, + "epoch": 0.33, + "learning_rate": 0.0002506283707765966, + "loss": 0.0181, "step": 65240 }, { - "epoch": 0.71, - "learning_rate": 0.00019419147694103907, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.0002506208030835826, + "loss": 0.0201, "step": 65250 }, { - "epoch": 0.71, - "learning_rate": 0.0001941752610754362, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.0002506132353905686, + "loss": 0.0207, "step": 65260 }, { - "epoch": 0.71, - "learning_rate": 0.00019415904520983328, - "loss": 0.0201, + "epoch": 0.33, + "learning_rate": 0.0002506056676975546, + "loss": 0.018, "step": 65270 }, { - "epoch": 0.71, - "learning_rate": 0.0001941428293442304, - "loss": 0.0198, + "epoch": 0.33, + "learning_rate": 0.0002505981000045406, + "loss": 0.0186, "step": 65280 }, { - "epoch": 0.71, - "learning_rate": 0.00019412661347862747, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.0002505905323115266, + "loss": 0.0237, "step": 65290 }, { - "epoch": 0.71, - "learning_rate": 0.00019411039761302456, - "loss": 0.017, + "epoch": 0.33, + "learning_rate": 0.00025058296461851257, + "loss": 0.0265, "step": 65300 }, { - "epoch": 0.71, - "learning_rate": 0.00019409418174742165, - "loss": 0.0123, + "epoch": 0.33, + "learning_rate": 0.00025057539692549855, + "loss": 0.0166, "step": 65310 }, { - "epoch": 0.71, - "learning_rate": 0.00019407796588181877, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.00025056782923248453, + "loss": 0.0183, "step": 65320 }, { - "epoch": 0.71, - "learning_rate": 0.00019406175001621584, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.00025056026153947057, + "loss": 0.016, "step": 65330 }, { - "epoch": 0.71, - "learning_rate": 0.00019404553415061293, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.00025055269384645655, + "loss": 0.0151, "step": 65340 }, { - "epoch": 0.71, - "learning_rate": 0.00019402931828501005, - "loss": 0.013, + "epoch": 0.33, + "learning_rate": 0.00025054512615344253, + "loss": 0.0191, "step": 65350 }, { - "epoch": 0.71, - "learning_rate": 0.00019401310241940714, - "loss": 0.0123, + "epoch": 0.33, + "learning_rate": 0.0002505375584604285, + "loss": 0.0159, "step": 65360 }, { - "epoch": 0.71, - "learning_rate": 0.0001939968865538042, - "loss": 0.0132, + "epoch": 0.33, + "learning_rate": 0.0002505299907674145, + "loss": 0.019, "step": 65370 }, { - "epoch": 0.71, - "learning_rate": 0.0001939806706882013, - "loss": 0.0167, + "epoch": 0.33, + "learning_rate": 0.0002505224230744005, + "loss": 0.0195, "step": 65380 }, { - "epoch": 0.71, - "learning_rate": 0.00019396445482259842, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.00025051485538138646, + "loss": 0.0228, "step": 65390 }, { - "epoch": 0.71, - "learning_rate": 0.00019394823895699551, - "loss": 0.013, + "epoch": 0.33, + "learning_rate": 0.0002505072876883725, + "loss": 0.0193, "step": 65400 }, { - "epoch": 0.71, - "learning_rate": 0.00019393202309139258, - "loss": 0.0135, + "epoch": 0.33, + "learning_rate": 0.0002504997199953585, + "loss": 0.0173, "step": 65410 }, { - "epoch": 0.71, - "learning_rate": 0.0001939158072257897, - "loss": 0.0183, + "epoch": 0.33, + "learning_rate": 0.00025049215230234446, + "loss": 0.0188, "step": 65420 }, { - "epoch": 0.71, - "learning_rate": 0.0001938995913601868, - "loss": 0.0162, + "epoch": 0.33, + "learning_rate": 0.00025048458460933044, + "loss": 0.0192, "step": 65430 }, { - "epoch": 0.71, - "learning_rate": 0.00019388337549458389, - "loss": 0.0151, + "epoch": 0.33, + "learning_rate": 0.0002504770169163164, + "loss": 0.0198, "step": 65440 }, { - "epoch": 0.71, - "learning_rate": 0.00019386715962898095, - "loss": 0.014, + "epoch": 0.33, + "learning_rate": 0.0002504694492233024, + "loss": 0.0222, "step": 65450 }, { - "epoch": 0.71, - "learning_rate": 0.00019385094376337807, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.00025046188153028844, + "loss": 0.0185, "step": 65460 }, { - "epoch": 0.71, - "learning_rate": 0.00019383472789777516, - "loss": 0.017, + "epoch": 0.33, + "learning_rate": 0.0002504543138372744, + "loss": 0.0213, "step": 65470 }, { - "epoch": 0.71, - "learning_rate": 0.00019381851203217226, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.0002504467461442604, + "loss": 0.0182, "step": 65480 }, { - "epoch": 0.71, - "learning_rate": 0.00019380229616656938, - "loss": 0.0132, + "epoch": 0.33, + "learning_rate": 0.0002504391784512464, + "loss": 0.0168, "step": 65490 }, { - "epoch": 0.71, - "learning_rate": 0.00019378608030096644, - "loss": 0.0162, + "epoch": 0.33, + "learning_rate": 0.00025043161075823236, + "loss": 0.0178, "step": 65500 }, { - "epoch": 0.71, - "learning_rate": 0.00019376986443536353, - "loss": 0.0131, + "epoch": 0.33, + "learning_rate": 0.00025042404306521834, + "loss": 0.023, "step": 65510 }, { - "epoch": 0.71, - "learning_rate": 0.00019375364856976065, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.0002504164753722043, + "loss": 0.0213, "step": 65520 }, { - "epoch": 0.71, - "learning_rate": 0.00019373743270415775, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.00025040890767919036, + "loss": 0.0199, "step": 65530 }, { - "epoch": 0.71, - "learning_rate": 0.0001937212168385548, - "loss": 0.0144, + "epoch": 0.33, + "learning_rate": 0.00025040133998617634, + "loss": 0.0193, "step": 65540 }, { - "epoch": 0.71, - "learning_rate": 0.0001937050009729519, - "loss": 0.0143, + "epoch": 0.33, + "learning_rate": 0.0002503937722931623, + "loss": 0.018, "step": 65550 }, { - "epoch": 0.71, - "learning_rate": 0.00019368878510734903, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.0002503862046001483, + "loss": 0.0307, "step": 65560 }, { - "epoch": 0.71, - "learning_rate": 0.00019367256924174612, - "loss": 0.0173, + "epoch": 0.33, + "learning_rate": 0.0002503786369071343, + "loss": 0.0172, "step": 65570 }, { - "epoch": 0.71, - "learning_rate": 0.00019365635337614318, - "loss": 0.017, + "epoch": 0.33, + "learning_rate": 0.00025037106921412027, + "loss": 0.0179, "step": 65580 }, { - "epoch": 0.71, - "learning_rate": 0.0001936401375105403, - "loss": 0.0164, + "epoch": 0.33, + "learning_rate": 0.0002503635015211063, + "loss": 0.0171, "step": 65590 }, { - "epoch": 0.71, - "learning_rate": 0.0001936239216449374, - "loss": 0.0155, + "epoch": 0.33, + "learning_rate": 0.0002503559338280923, + "loss": 0.0225, "step": 65600 }, { - "epoch": 0.71, - "learning_rate": 0.0001936077057793345, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.00025034836613507827, + "loss": 0.0174, "step": 65610 }, { - "epoch": 0.71, - "learning_rate": 0.00019359148991373156, - "loss": 0.0151, + "epoch": 0.33, + "learning_rate": 0.00025034079844206425, + "loss": 0.0236, "step": 65620 }, { - "epoch": 0.71, - "learning_rate": 0.00019357527404812867, - "loss": 0.0156, + "epoch": 0.33, + "learning_rate": 0.00025033323074905023, + "loss": 0.0174, "step": 65630 }, { - "epoch": 0.71, - "learning_rate": 0.00019355905818252577, - "loss": 0.0155, + "epoch": 0.33, + "learning_rate": 0.0002503256630560362, + "loss": 0.0196, "step": 65640 }, { - "epoch": 0.71, - "learning_rate": 0.0001935428423169229, - "loss": 0.0166, + "epoch": 0.33, + "learning_rate": 0.00025031809536302225, + "loss": 0.0177, "step": 65650 }, { - "epoch": 0.71, - "learning_rate": 0.00019352662645131995, - "loss": 0.0189, + "epoch": 0.33, + "learning_rate": 0.0002503105276700082, + "loss": 0.0194, "step": 65660 }, { - "epoch": 0.71, - "learning_rate": 0.00019351041058571705, - "loss": 0.0135, + "epoch": 0.33, + "learning_rate": 0.0002503029599769942, + "loss": 0.0185, "step": 65670 }, { - "epoch": 0.71, - "learning_rate": 0.00019349419472011414, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.0002502953922839802, + "loss": 0.0229, "step": 65680 }, { - "epoch": 0.71, - "learning_rate": 0.00019347797885451126, - "loss": 0.0137, + "epoch": 0.33, + "learning_rate": 0.00025028782459096617, + "loss": 0.0224, "step": 65690 }, { - "epoch": 0.71, - "learning_rate": 0.00019346176298890832, - "loss": 0.016, + "epoch": 0.33, + "learning_rate": 0.00025028025689795215, + "loss": 0.023, "step": 65700 }, { - "epoch": 0.71, - "learning_rate": 0.00019344554712330542, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.00025027268920493813, + "loss": 0.0197, "step": 65710 }, { - "epoch": 0.71, - "learning_rate": 0.00019342933125770254, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.00025026512151192417, + "loss": 0.0159, "step": 65720 }, { - "epoch": 0.71, - "learning_rate": 0.00019341311539209963, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.00025025755381891015, + "loss": 0.0251, "step": 65730 }, { - "epoch": 0.71, - "learning_rate": 0.0001933968995264967, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.00025024998612589613, + "loss": 0.0197, "step": 65740 }, { - "epoch": 0.71, - "learning_rate": 0.0001933806836608938, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.0002502424184328821, + "loss": 0.0168, "step": 65750 }, { - "epoch": 0.71, - "learning_rate": 0.0001933644677952909, - "loss": 0.0136, + "epoch": 0.33, + "learning_rate": 0.0002502348507398681, + "loss": 0.019, "step": 65760 }, { - "epoch": 0.71, - "learning_rate": 0.000193348251929688, - "loss": 0.0144, + "epoch": 0.33, + "learning_rate": 0.0002502272830468541, + "loss": 0.0175, "step": 65770 }, { - "epoch": 0.71, - "learning_rate": 0.00019333203606408507, - "loss": 0.0165, + "epoch": 0.33, + "learning_rate": 0.0002502197153538401, + "loss": 0.02, "step": 65780 }, { - "epoch": 0.71, - "learning_rate": 0.00019331582019848219, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.0002502121476608261, + "loss": 0.0203, "step": 65790 }, { - "epoch": 0.71, - "learning_rate": 0.00019329960433287928, - "loss": 0.0148, + "epoch": 0.33, + "learning_rate": 0.0002502045799678121, + "loss": 0.023, "step": 65800 }, { - "epoch": 0.71, - "learning_rate": 0.00019328338846727637, - "loss": 0.0178, + "epoch": 0.33, + "learning_rate": 0.00025019701227479806, + "loss": 0.0184, "step": 65810 }, { - "epoch": 0.71, - "learning_rate": 0.00019326717260167344, - "loss": 0.0169, + "epoch": 0.33, + "learning_rate": 0.00025018944458178404, + "loss": 0.0244, "step": 65820 }, { - "epoch": 0.71, - "learning_rate": 0.00019325095673607056, - "loss": 0.0139, + "epoch": 0.33, + "learning_rate": 0.00025018187688877, + "loss": 0.0201, "step": 65830 }, { - "epoch": 0.71, - "learning_rate": 0.00019323474087046765, - "loss": 0.0121, + "epoch": 0.33, + "learning_rate": 0.00025017430919575606, + "loss": 0.0162, "step": 65840 }, { - "epoch": 0.71, - "learning_rate": 0.00019321852500486474, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.00025016674150274204, + "loss": 0.0206, "step": 65850 }, { - "epoch": 0.71, - "learning_rate": 0.00019320230913926184, - "loss": 0.0155, + "epoch": 0.33, + "learning_rate": 0.000250159173809728, + "loss": 0.015, "step": 65860 }, { - "epoch": 0.71, - "learning_rate": 0.00019318609327365893, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.000250151606116714, + "loss": 0.0178, "step": 65870 }, { - "epoch": 0.71, - "learning_rate": 0.00019316987740805602, - "loss": 0.0175, + "epoch": 0.33, + "learning_rate": 0.0002501440384237, + "loss": 0.0303, "step": 65880 }, { - "epoch": 0.71, - "learning_rate": 0.00019315366154245314, - "loss": 0.0132, + "epoch": 0.33, + "learning_rate": 0.00025013647073068596, + "loss": 0.0197, "step": 65890 }, { - "epoch": 0.71, - "learning_rate": 0.0001931374456768502, - "loss": 0.0175, + "epoch": 0.33, + "learning_rate": 0.00025012890303767194, + "loss": 0.0178, "step": 65900 }, { - "epoch": 0.71, - "learning_rate": 0.0001931212298112473, - "loss": 0.0144, + "epoch": 0.33, + "learning_rate": 0.000250121335344658, + "loss": 0.0179, "step": 65910 }, { - "epoch": 0.71, - "learning_rate": 0.0001931050139456444, - "loss": 0.0172, + "epoch": 0.33, + "learning_rate": 0.00025011376765164396, + "loss": 0.0201, "step": 65920 }, { - "epoch": 0.71, - "learning_rate": 0.0001930887980800415, - "loss": 0.0136, + "epoch": 0.33, + "learning_rate": 0.00025010619995862994, + "loss": 0.0211, "step": 65930 }, { - "epoch": 0.71, - "learning_rate": 0.00019307258221443858, - "loss": 0.0171, + "epoch": 0.33, + "learning_rate": 0.0002500986322656159, + "loss": 0.0188, "step": 65940 }, { - "epoch": 0.71, - "learning_rate": 0.00019305636634883567, - "loss": 0.0192, + "epoch": 0.33, + "learning_rate": 0.0002500910645726019, + "loss": 0.0166, "step": 65950 }, { - "epoch": 0.71, - "learning_rate": 0.0001930401504832328, - "loss": 0.0198, + "epoch": 0.33, + "learning_rate": 0.0002500834968795879, + "loss": 0.0192, "step": 65960 }, { - "epoch": 0.71, - "learning_rate": 0.00019302393461762988, - "loss": 0.017, + "epoch": 0.33, + "learning_rate": 0.0002500759291865739, + "loss": 0.0177, "step": 65970 }, { - "epoch": 0.71, - "learning_rate": 0.00019300771875202695, - "loss": 0.0164, + "epoch": 0.33, + "learning_rate": 0.0002500683614935599, + "loss": 0.0149, "step": 65980 }, { - "epoch": 0.71, - "learning_rate": 0.00019299150288642404, - "loss": 0.0195, + "epoch": 0.33, + "learning_rate": 0.00025006079380054583, + "loss": 0.0199, "step": 65990 }, { - "epoch": 0.71, - "learning_rate": 0.00019297528702082116, - "loss": 0.0178, + "epoch": 0.33, + "learning_rate": 0.0002500532261075318, + "loss": 0.0174, "step": 66000 }, { - "epoch": 0.71, - "eval_cer": 0.9215451751711582, - "eval_loss": 0.011317442171275616, - "eval_runtime": 121.212, - "eval_samples_per_second": 16.5, - "eval_steps_per_second": 4.125, + "epoch": 0.33, + "eval_cer": 0.9144324104542716, + "eval_loss": 0.01361939124763012, + "eval_runtime": 116.6985, + "eval_samples_per_second": 17.138, + "eval_steps_per_second": 4.285, "step": 66000 }, { - "epoch": 0.71, - "learning_rate": 0.00019295907115521825, + "epoch": 0.33, + "learning_rate": 0.00025004565841451785, "loss": 0.0174, "step": 66010 }, { - "epoch": 0.71, - "learning_rate": 0.00019294285528961532, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.00025003809072150383, + "loss": 0.0191, "step": 66020 }, { - "epoch": 0.71, - "learning_rate": 0.00019292663942401244, - "loss": 0.0122, + "epoch": 0.33, + "learning_rate": 0.0002500305230284898, + "loss": 0.0187, "step": 66030 }, { - "epoch": 0.71, - "learning_rate": 0.00019291042355840953, - "loss": 0.0125, + "epoch": 0.33, + "learning_rate": 0.0002500229553354758, + "loss": 0.0169, "step": 66040 }, { - "epoch": 0.71, - "learning_rate": 0.00019289420769280662, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.0002500153876424618, + "loss": 0.0237, "step": 66050 }, { - "epoch": 0.71, - "learning_rate": 0.00019287799182720372, - "loss": 0.0176, + "epoch": 0.33, + "learning_rate": 0.00025000781994944776, + "loss": 0.0186, "step": 66060 }, { - "epoch": 0.71, - "learning_rate": 0.0001928617759616008, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.00025000025225643374, + "loss": 0.0148, "step": 66070 }, { - "epoch": 0.71, - "learning_rate": 0.0001928455600959979, - "loss": 0.0156, + "epoch": 0.33, + "learning_rate": 0.00024999268456341977, + "loss": 0.0197, "step": 66080 }, { - "epoch": 0.71, - "learning_rate": 0.00019282934423039502, - "loss": 0.0173, + "epoch": 0.33, + "learning_rate": 0.00024998511687040575, + "loss": 0.0197, "step": 66090 }, { - "epoch": 0.71, - "learning_rate": 0.0001928131283647921, - "loss": 0.0168, + "epoch": 0.33, + "learning_rate": 0.00024997754917739174, + "loss": 0.0172, "step": 66100 }, { - "epoch": 0.71, - "learning_rate": 0.00019279691249918918, - "loss": 0.0169, + "epoch": 0.33, + "learning_rate": 0.0002499699814843777, + "loss": 0.0189, "step": 66110 }, { - "epoch": 0.71, - "learning_rate": 0.00019278069663358627, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.0002499624137913637, + "loss": 0.0187, "step": 66120 }, { - "epoch": 0.71, - "learning_rate": 0.0001927644807679834, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.0002499548460983497, + "loss": 0.0218, "step": 66130 }, { - "epoch": 0.72, - "learning_rate": 0.00019274826490238046, - "loss": 0.014, + "epoch": 0.33, + "learning_rate": 0.0002499472784053357, + "loss": 0.0229, "step": 66140 }, { - "epoch": 0.72, - "learning_rate": 0.00019273204903677755, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.0002499397107123217, + "loss": 0.0175, "step": 66150 }, { - "epoch": 0.72, - "learning_rate": 0.00019271583317117467, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.0002499321430193077, + "loss": 0.0179, "step": 66160 }, { - "epoch": 0.72, - "learning_rate": 0.00019269961730557176, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.00024992457532629366, + "loss": 0.0172, "step": 66170 }, { - "epoch": 0.72, - "learning_rate": 0.00019268340143996886, - "loss": 0.0123, + "epoch": 0.33, + "learning_rate": 0.00024991700763327964, + "loss": 0.0197, "step": 66180 }, { - "epoch": 0.72, - "learning_rate": 0.00019266718557436592, - "loss": 0.0139, + "epoch": 0.33, + "learning_rate": 0.0002499094399402656, + "loss": 0.0192, "step": 66190 }, { - "epoch": 0.72, - "learning_rate": 0.00019265096970876304, - "loss": 0.0164, + "epoch": 0.33, + "learning_rate": 0.00024990187224725166, + "loss": 0.0175, "step": 66200 }, { - "epoch": 0.72, - "learning_rate": 0.00019263475384316014, - "loss": 0.0164, + "epoch": 0.33, + "learning_rate": 0.00024989430455423764, + "loss": 0.0204, "step": 66210 }, { - "epoch": 0.72, - "learning_rate": 0.00019261853797755723, - "loss": 0.0176, + "epoch": 0.33, + "learning_rate": 0.0002498867368612236, + "loss": 0.0195, "step": 66220 }, { - "epoch": 0.72, - "learning_rate": 0.00019260232211195432, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.0002498791691682096, + "loss": 0.0178, "step": 66230 }, { - "epoch": 0.72, - "learning_rate": 0.00019258610624635141, - "loss": 0.0193, + "epoch": 0.33, + "learning_rate": 0.0002498716014751956, + "loss": 0.0247, "step": 66240 }, { - "epoch": 0.72, - "learning_rate": 0.0001925698903807485, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.00024986403378218157, + "loss": 0.0201, "step": 66250 }, { - "epoch": 0.72, - "learning_rate": 0.00019255367451514563, - "loss": 0.0219, + "epoch": 0.33, + "learning_rate": 0.00024985646608916755, + "loss": 0.0181, "step": 66260 }, { - "epoch": 0.72, - "learning_rate": 0.0001925374586495427, - "loss": 0.0172, + "epoch": 0.33, + "learning_rate": 0.0002498488983961536, + "loss": 0.0232, "step": 66270 }, { - "epoch": 0.72, - "learning_rate": 0.00019252124278393978, - "loss": 0.0137, + "epoch": 0.33, + "learning_rate": 0.00024984133070313956, + "loss": 0.0173, "step": 66280 }, { - "epoch": 0.72, - "learning_rate": 0.0001925050269183369, - "loss": 0.0139, + "epoch": 0.33, + "learning_rate": 0.00024983376301012555, + "loss": 0.0189, "step": 66290 }, { - "epoch": 0.72, - "learning_rate": 0.000192488811052734, - "loss": 0.0155, + "epoch": 0.33, + "learning_rate": 0.00024982619531711153, + "loss": 0.0189, "step": 66300 }, { - "epoch": 0.72, - "learning_rate": 0.00019247259518713106, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.0002498186276240975, + "loss": 0.0176, "step": 66310 }, { - "epoch": 0.72, - "learning_rate": 0.00019245637932152816, - "loss": 0.0155, + "epoch": 0.33, + "learning_rate": 0.0002498110599310835, + "loss": 0.0174, "step": 66320 }, { - "epoch": 0.72, - "learning_rate": 0.00019244016345592528, - "loss": 0.0193, + "epoch": 0.33, + "learning_rate": 0.0002498034922380695, + "loss": 0.0159, "step": 66330 }, { - "epoch": 0.72, - "learning_rate": 0.00019242394759032237, - "loss": 0.0221, + "epoch": 0.33, + "learning_rate": 0.0002497959245450555, + "loss": 0.0198, "step": 66340 }, { - "epoch": 0.72, - "learning_rate": 0.00019240773172471943, - "loss": 0.0181, + "epoch": 0.33, + "learning_rate": 0.0002497883568520415, + "loss": 0.0191, "step": 66350 }, { - "epoch": 0.72, - "learning_rate": 0.00019239151585911655, - "loss": 0.0136, + "epoch": 0.33, + "learning_rate": 0.00024978078915902747, + "loss": 0.0234, "step": 66360 }, { - "epoch": 0.72, - "learning_rate": 0.00019237529999351365, - "loss": 0.0198, + "epoch": 0.33, + "learning_rate": 0.00024977322146601345, + "loss": 0.0172, "step": 66370 }, { - "epoch": 0.72, - "learning_rate": 0.00019235908412791074, - "loss": 0.0168, + "epoch": 0.33, + "learning_rate": 0.00024976565377299943, + "loss": 0.0188, "step": 66380 }, { - "epoch": 0.72, - "learning_rate": 0.0001923428682623078, - "loss": 0.0135, + "epoch": 0.33, + "learning_rate": 0.00024975808607998547, + "loss": 0.0183, "step": 66390 }, { - "epoch": 0.72, - "learning_rate": 0.00019232665239670492, - "loss": 0.0318, + "epoch": 0.33, + "learning_rate": 0.00024975051838697145, + "loss": 0.0193, "step": 66400 }, { - "epoch": 0.72, - "learning_rate": 0.00019231043653110202, - "loss": 0.0237, + "epoch": 0.34, + "learning_rate": 0.00024974295069395743, + "loss": 0.02, "step": 66410 }, { - "epoch": 0.72, - "learning_rate": 0.0001922942206654991, - "loss": 0.0142, + "epoch": 0.34, + "learning_rate": 0.0002497353830009434, + "loss": 0.0176, "step": 66420 }, { - "epoch": 0.72, - "learning_rate": 0.0001922780047998962, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.0002497278153079294, + "loss": 0.0213, "step": 66430 }, { - "epoch": 0.72, - "learning_rate": 0.0001922617889342933, + "epoch": 0.34, + "learning_rate": 0.0002497202476149154, "loss": 0.0188, "step": 66440 }, { - "epoch": 0.72, - "learning_rate": 0.0001922455730686904, - "loss": 0.0172, + "epoch": 0.34, + "learning_rate": 0.00024971267992190136, + "loss": 0.018, "step": 66450 }, { - "epoch": 0.72, - "learning_rate": 0.0001922293572030875, - "loss": 0.0172, + "epoch": 0.34, + "learning_rate": 0.0002497051122288874, + "loss": 0.0194, "step": 66460 }, { - "epoch": 0.72, - "learning_rate": 0.00019221314133748457, - "loss": 0.0158, + "epoch": 0.34, + "learning_rate": 0.0002496975445358734, + "loss": 0.0144, "step": 66470 }, { - "epoch": 0.72, - "learning_rate": 0.00019219692547188167, - "loss": 0.0186, + "epoch": 0.34, + "learning_rate": 0.00024968997684285936, + "loss": 0.0178, "step": 66480 }, { - "epoch": 0.72, - "learning_rate": 0.00019218070960627876, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.00024968240914984534, + "loss": 0.018, "step": 66490 }, { - "epoch": 0.72, - "learning_rate": 0.00019216449374067588, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.0002496748414568313, + "loss": 0.0167, "step": 66500 }, { - "epoch": 0.72, - "learning_rate": 0.00019214827787507294, - "loss": 0.0128, + "epoch": 0.34, + "learning_rate": 0.0002496672737638173, + "loss": 0.0173, "step": 66510 }, { - "epoch": 0.72, - "learning_rate": 0.00019213206200947004, - "loss": 0.0138, + "epoch": 0.34, + "learning_rate": 0.00024965970607080334, + "loss": 0.0172, "step": 66520 }, { - "epoch": 0.72, - "learning_rate": 0.00019211584614386716, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.0002496521383777893, + "loss": 0.0181, "step": 66530 }, { - "epoch": 0.72, - "learning_rate": 0.00019209963027826425, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.0002496445706847753, + "loss": 0.0283, "step": 66540 }, { - "epoch": 0.72, - "learning_rate": 0.00019208341441266132, - "loss": 0.023, + "epoch": 0.34, + "learning_rate": 0.0002496370029917613, + "loss": 0.0203, "step": 66550 }, { - "epoch": 0.72, - "learning_rate": 0.0001920671985470584, - "loss": 0.0183, + "epoch": 0.34, + "learning_rate": 0.00024962943529874726, + "loss": 0.0215, "step": 66560 }, { - "epoch": 0.72, - "learning_rate": 0.00019205098268145553, - "loss": 0.019, + "epoch": 0.34, + "learning_rate": 0.00024962186760573324, + "loss": 0.0156, "step": 66570 }, { - "epoch": 0.72, - "learning_rate": 0.00019203476681585262, - "loss": 0.0167, + "epoch": 0.34, + "learning_rate": 0.0002496142999127192, + "loss": 0.0211, "step": 66580 }, { - "epoch": 0.72, - "learning_rate": 0.0001920185509502497, - "loss": 0.0199, + "epoch": 0.34, + "learning_rate": 0.00024960673221970526, + "loss": 0.0181, "step": 66590 }, { - "epoch": 0.72, - "learning_rate": 0.0001920023350846468, - "loss": 0.0147, + "epoch": 0.34, + "learning_rate": 0.00024959916452669124, + "loss": 0.0197, "step": 66600 }, { - "epoch": 0.72, - "learning_rate": 0.0001919861192190439, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.0002495915968336772, + "loss": 0.0229, "step": 66610 }, { - "epoch": 0.72, - "learning_rate": 0.000191969903353441, - "loss": 0.0148, + "epoch": 0.34, + "learning_rate": 0.0002495840291406632, + "loss": 0.0154, "step": 66620 }, { - "epoch": 0.72, - "learning_rate": 0.00019195368748783806, - "loss": 0.0171, + "epoch": 0.34, + "learning_rate": 0.0002495764614476492, + "loss": 0.0183, "step": 66630 }, { - "epoch": 0.72, - "learning_rate": 0.00019193747162223518, - "loss": 0.0171, + "epoch": 0.34, + "learning_rate": 0.00024956889375463517, + "loss": 0.0215, "step": 66640 }, { - "epoch": 0.72, - "learning_rate": 0.00019192125575663227, - "loss": 0.015, + "epoch": 0.34, + "learning_rate": 0.0002495613260616212, + "loss": 0.0231, "step": 66650 }, { - "epoch": 0.72, - "learning_rate": 0.0001919050398910294, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.0002495537583686072, + "loss": 0.0234, "step": 66660 }, { - "epoch": 0.72, - "learning_rate": 0.00019188882402542646, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.00024954619067559317, + "loss": 0.0229, "step": 66670 }, { - "epoch": 0.72, - "learning_rate": 0.00019187260815982355, - "loss": 0.0162, + "epoch": 0.34, + "learning_rate": 0.00024953862298257915, + "loss": 0.0206, "step": 66680 }, { - "epoch": 0.72, - "learning_rate": 0.00019185639229422064, - "loss": 0.0147, + "epoch": 0.34, + "learning_rate": 0.00024953105528956513, + "loss": 0.0227, "step": 66690 }, { - "epoch": 0.72, - "learning_rate": 0.00019184017642861776, - "loss": 0.0197, + "epoch": 0.34, + "learning_rate": 0.0002495234875965511, + "loss": 0.0218, "step": 66700 }, { - "epoch": 0.72, - "learning_rate": 0.00019182396056301483, - "loss": 0.0173, + "epoch": 0.34, + "learning_rate": 0.00024951591990353715, + "loss": 0.0181, "step": 66710 }, { - "epoch": 0.72, - "learning_rate": 0.00019180774469741192, - "loss": 0.0156, + "epoch": 0.34, + "learning_rate": 0.00024950835221052313, + "loss": 0.018, "step": 66720 }, { - "epoch": 0.72, - "learning_rate": 0.00019179152883180904, - "loss": 0.0124, + "epoch": 0.34, + "learning_rate": 0.0002495007845175091, + "loss": 0.0198, "step": 66730 }, { - "epoch": 0.72, - "learning_rate": 0.00019177531296620613, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.0002494932168244951, + "loss": 0.0192, "step": 66740 }, { - "epoch": 0.72, - "learning_rate": 0.0001917590971006032, - "loss": 0.0175, + "epoch": 0.34, + "learning_rate": 0.00024948564913148107, + "loss": 0.017, "step": 66750 }, { - "epoch": 0.72, - "learning_rate": 0.0001917428812350003, - "loss": 0.0148, + "epoch": 0.34, + "learning_rate": 0.00024947808143846705, + "loss": 0.0216, "step": 66760 }, { - "epoch": 0.72, - "learning_rate": 0.0001917266653693974, - "loss": 0.019, + "epoch": 0.34, + "learning_rate": 0.00024947051374545303, + "loss": 0.0171, "step": 66770 }, { - "epoch": 0.72, - "learning_rate": 0.0001917104495037945, - "loss": 0.016, + "epoch": 0.34, + "learning_rate": 0.00024946294605243907, + "loss": 0.0186, "step": 66780 }, { - "epoch": 0.72, - "learning_rate": 0.00019169423363819157, - "loss": 0.0154, + "epoch": 0.34, + "learning_rate": 0.00024945537835942505, + "loss": 0.0214, "step": 66790 }, { - "epoch": 0.72, - "learning_rate": 0.0001916780177725887, - "loss": 0.0109, + "epoch": 0.34, + "learning_rate": 0.00024944781066641103, + "loss": 0.0191, "step": 66800 }, { - "epoch": 0.72, - "learning_rate": 0.00019166180190698578, - "loss": 0.0148, + "epoch": 0.34, + "learning_rate": 0.000249440242973397, + "loss": 0.0166, "step": 66810 }, { - "epoch": 0.72, - "learning_rate": 0.00019164558604138287, - "loss": 0.013, + "epoch": 0.34, + "learning_rate": 0.000249432675280383, + "loss": 0.0183, "step": 66820 }, { - "epoch": 0.72, - "learning_rate": 0.00019162937017577994, - "loss": 0.0209, + "epoch": 0.34, + "learning_rate": 0.000249425107587369, + "loss": 0.0182, "step": 66830 }, { - "epoch": 0.72, - "learning_rate": 0.00019161315431017706, - "loss": 0.0141, + "epoch": 0.34, + "learning_rate": 0.000249417539894355, + "loss": 0.019, "step": 66840 }, { - "epoch": 0.72, - "learning_rate": 0.00019159693844457415, - "loss": 0.0156, + "epoch": 0.34, + "learning_rate": 0.000249409972201341, + "loss": 0.0244, "step": 66850 }, { - "epoch": 0.72, - "learning_rate": 0.00019158072257897125, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.000249402404508327, + "loss": 0.0206, "step": 66860 }, { - "epoch": 0.72, - "learning_rate": 0.00019156450671336834, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.00024939483681531296, + "loss": 0.0177, "step": 66870 }, { - "epoch": 0.72, - "learning_rate": 0.00019154829084776543, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.00024938726912229894, + "loss": 0.0174, "step": 66880 }, { - "epoch": 0.72, - "learning_rate": 0.00019153207498216252, - "loss": 0.0168, + "epoch": 0.34, + "learning_rate": 0.0002493797014292849, + "loss": 0.021, "step": 66890 }, { - "epoch": 0.72, - "learning_rate": 0.00019151585911655964, - "loss": 0.0197, + "epoch": 0.34, + "learning_rate": 0.00024937213373627096, + "loss": 0.0209, "step": 66900 }, { - "epoch": 0.72, - "learning_rate": 0.00019149964325095674, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.00024936456604325694, + "loss": 0.0182, "step": 66910 }, { - "epoch": 0.72, - "learning_rate": 0.0001914834273853538, - "loss": 0.0164, + "epoch": 0.34, + "learning_rate": 0.0002493569983502429, + "loss": 0.0161, "step": 66920 }, { - "epoch": 0.72, - "learning_rate": 0.0001914672115197509, - "loss": 0.012, + "epoch": 0.34, + "learning_rate": 0.0002493494306572289, + "loss": 0.0236, "step": 66930 }, { - "epoch": 0.72, - "learning_rate": 0.00019145099565414801, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.0002493418629642149, + "loss": 0.0182, "step": 66940 }, { - "epoch": 0.72, - "learning_rate": 0.0001914347797885451, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024933429527120086, + "loss": 0.0189, "step": 66950 }, { - "epoch": 0.72, - "learning_rate": 0.00019141856392294217, - "loss": 0.0151, + "epoch": 0.34, + "learning_rate": 0.00024932672757818684, + "loss": 0.0187, "step": 66960 }, { - "epoch": 0.72, - "learning_rate": 0.0001914023480573393, - "loss": 0.0133, + "epoch": 0.34, + "learning_rate": 0.0002493191598851729, + "loss": 0.0196, "step": 66970 }, { - "epoch": 0.72, - "learning_rate": 0.00019138613219173639, - "loss": 0.0181, + "epoch": 0.34, + "learning_rate": 0.00024931159219215886, + "loss": 0.0187, "step": 66980 }, { - "epoch": 0.72, - "learning_rate": 0.00019136991632613348, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.00024930402449914484, + "loss": 0.0195, "step": 66990 }, { - "epoch": 0.72, - "learning_rate": 0.00019135370046053054, - "loss": 0.0142, + "epoch": 0.34, + "learning_rate": 0.0002492964568061308, + "loss": 0.017, "step": 67000 }, { - "epoch": 0.72, - "eval_cer": 0.921521722891336, - "eval_loss": 0.010987049899995327, - "eval_runtime": 121.4092, - "eval_samples_per_second": 16.473, - "eval_steps_per_second": 4.118, + "epoch": 0.34, + "eval_cer": 0.9144518183767796, + "eval_loss": 0.013345795683562756, + "eval_runtime": 116.5962, + "eval_samples_per_second": 17.153, + "eval_steps_per_second": 4.288, "step": 67000 }, { - "epoch": 0.72, - "learning_rate": 0.00019133748459492766, - "loss": 0.0133, + "epoch": 0.34, + "learning_rate": 0.0002492888891131168, + "loss": 0.0192, "step": 67010 }, { - "epoch": 0.72, - "learning_rate": 0.00019132126872932476, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.0002492813214201028, + "loss": 0.0234, "step": 67020 }, { - "epoch": 0.72, - "learning_rate": 0.00019130505286372188, - "loss": 0.0148, + "epoch": 0.34, + "learning_rate": 0.0002492737537270888, + "loss": 0.0155, "step": 67030 }, { - "epoch": 0.72, - "learning_rate": 0.00019128883699811894, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.0002492661860340748, + "loss": 0.0181, "step": 67040 }, { - "epoch": 0.72, - "learning_rate": 0.00019127262113251603, - "loss": 0.0155, + "epoch": 0.34, + "learning_rate": 0.0002492586183410608, + "loss": 0.0186, "step": 67050 }, { - "epoch": 0.72, - "learning_rate": 0.00019125640526691313, - "loss": 0.0157, + "epoch": 0.34, + "learning_rate": 0.00024925105064804677, + "loss": 0.0213, "step": 67060 }, { - "epoch": 0.73, - "learning_rate": 0.00019124018940131025, - "loss": 0.0165, + "epoch": 0.34, + "learning_rate": 0.00024924348295503275, + "loss": 0.019, "step": 67070 }, { - "epoch": 0.73, - "learning_rate": 0.0001912239735357073, - "loss": 0.0138, + "epoch": 0.34, + "learning_rate": 0.00024923591526201873, + "loss": 0.0205, "step": 67080 }, { - "epoch": 0.73, - "learning_rate": 0.0001912077576701044, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.0002492283475690047, + "loss": 0.024, "step": 67090 }, { - "epoch": 0.73, - "learning_rate": 0.00019119154180450153, - "loss": 0.0184, + "epoch": 0.34, + "learning_rate": 0.00024922077987599075, + "loss": 0.0229, "step": 67100 }, { - "epoch": 0.73, - "learning_rate": 0.00019117532593889862, - "loss": 0.0162, + "epoch": 0.34, + "learning_rate": 0.00024921321218297673, + "loss": 0.0218, "step": 67110 }, { - "epoch": 0.73, - "learning_rate": 0.00019115911007329568, - "loss": 0.0189, + "epoch": 0.34, + "learning_rate": 0.0002492056444899627, + "loss": 0.0178, "step": 67120 }, { - "epoch": 0.73, - "learning_rate": 0.00019114289420769278, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.0002491980767969487, + "loss": 0.021, "step": 67130 }, { - "epoch": 0.73, - "learning_rate": 0.0001911266783420899, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.0002491905091039347, + "loss": 0.0172, "step": 67140 }, { - "epoch": 0.73, - "learning_rate": 0.000191110462476487, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.00024918294141092065, + "loss": 0.0164, "step": 67150 }, { - "epoch": 0.73, - "learning_rate": 0.00019109424661088405, - "loss": 0.0182, + "epoch": 0.34, + "learning_rate": 0.0002491753737179067, + "loss": 0.0202, "step": 67160 }, { - "epoch": 0.73, - "learning_rate": 0.00019107803074528117, - "loss": 0.017, + "epoch": 0.34, + "learning_rate": 0.00024916780602489267, + "loss": 0.0182, "step": 67170 }, { - "epoch": 0.73, - "learning_rate": 0.00019106181487967827, - "loss": 0.0146, + "epoch": 0.34, + "learning_rate": 0.00024916023833187865, + "loss": 0.0182, "step": 67180 }, { - "epoch": 0.73, - "learning_rate": 0.00019104559901407536, - "loss": 0.0154, + "epoch": 0.34, + "learning_rate": 0.00024915267063886463, + "loss": 0.0179, "step": 67190 }, { - "epoch": 0.73, - "learning_rate": 0.00019102938314847243, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.0002491451029458506, + "loss": 0.0194, "step": 67200 }, { - "epoch": 0.73, - "learning_rate": 0.00019101316728286955, - "loss": 0.013, + "epoch": 0.34, + "learning_rate": 0.0002491375352528366, + "loss": 0.0171, "step": 67210 }, { - "epoch": 0.73, - "learning_rate": 0.00019099695141726664, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.00024912996755982263, + "loss": 0.0198, "step": 67220 }, { - "epoch": 0.73, - "learning_rate": 0.00019098073555166373, - "loss": 0.0154, + "epoch": 0.34, + "learning_rate": 0.0002491223998668086, + "loss": 0.0203, "step": 67230 }, { - "epoch": 0.73, - "learning_rate": 0.00019096451968606082, - "loss": 0.015, + "epoch": 0.34, + "learning_rate": 0.0002491148321737946, + "loss": 0.0192, "step": 67240 }, { - "epoch": 0.73, - "learning_rate": 0.00019094830382045792, - "loss": 0.0158, + "epoch": 0.34, + "learning_rate": 0.0002491072644807805, + "loss": 0.0199, "step": 67250 }, { - "epoch": 0.73, - "learning_rate": 0.000190932087954855, - "loss": 0.0118, + "epoch": 0.34, + "learning_rate": 0.00024909969678776656, + "loss": 0.0191, "step": 67260 }, { - "epoch": 0.73, - "learning_rate": 0.00019091587208925213, - "loss": 0.0206, + "epoch": 0.34, + "learning_rate": 0.00024909212909475254, + "loss": 0.0163, "step": 67270 }, { - "epoch": 0.73, - "learning_rate": 0.0001908996562236492, - "loss": 0.0147, + "epoch": 0.34, + "learning_rate": 0.0002490845614017385, + "loss": 0.0163, "step": 67280 }, { - "epoch": 0.73, - "learning_rate": 0.0001908834403580463, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.0002490769937087245, + "loss": 0.017, "step": 67290 }, { - "epoch": 0.73, - "learning_rate": 0.0001908672244924434, - "loss": 0.0148, + "epoch": 0.34, + "learning_rate": 0.0002490694260157105, + "loss": 0.0186, "step": 67300 }, { - "epoch": 0.73, - "learning_rate": 0.0001908510086268405, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024906185832269647, + "loss": 0.02, "step": 67310 }, { - "epoch": 0.73, - "learning_rate": 0.00019083479276123757, - "loss": 0.0178, + "epoch": 0.34, + "learning_rate": 0.00024905429062968245, + "loss": 0.0191, "step": 67320 }, { - "epoch": 0.73, - "learning_rate": 0.00019081857689563466, - "loss": 0.0169, + "epoch": 0.34, + "learning_rate": 0.0002490467229366685, + "loss": 0.0148, "step": 67330 }, { - "epoch": 0.73, - "learning_rate": 0.00019080236103003178, - "loss": 0.0206, + "epoch": 0.34, + "learning_rate": 0.00024903915524365446, + "loss": 0.0195, "step": 67340 }, { - "epoch": 0.73, - "learning_rate": 0.00019078614516442887, - "loss": 0.0179, + "epoch": 0.34, + "learning_rate": 0.00024903158755064045, + "loss": 0.0175, "step": 67350 }, { - "epoch": 0.73, - "learning_rate": 0.00019076992929882594, - "loss": 0.0126, + "epoch": 0.34, + "learning_rate": 0.00024902401985762643, + "loss": 0.017, "step": 67360 }, { - "epoch": 0.73, - "learning_rate": 0.00019075371343322306, - "loss": 0.0157, + "epoch": 0.34, + "learning_rate": 0.0002490164521646124, + "loss": 0.022, "step": 67370 }, { - "epoch": 0.73, - "learning_rate": 0.00019073749756762015, - "loss": 0.0165, + "epoch": 0.34, + "learning_rate": 0.0002490088844715984, + "loss": 0.02, "step": 67380 }, { - "epoch": 0.73, - "learning_rate": 0.00019072128170201724, - "loss": 0.0197, + "epoch": 0.34, + "learning_rate": 0.0002490013167785844, + "loss": 0.0252, "step": 67390 }, { - "epoch": 0.73, - "learning_rate": 0.0001907050658364143, - "loss": 0.0141, + "epoch": 0.34, + "learning_rate": 0.0002489937490855704, + "loss": 0.0201, "step": 67400 }, { - "epoch": 0.73, - "learning_rate": 0.00019068884997081143, - "loss": 0.0165, + "epoch": 0.34, + "learning_rate": 0.0002489861813925564, + "loss": 0.0216, "step": 67410 }, { - "epoch": 0.73, - "learning_rate": 0.00019067263410520852, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.00024897861369954237, + "loss": 0.0163, "step": 67420 }, { - "epoch": 0.73, - "learning_rate": 0.0001906564182396056, - "loss": 0.0124, + "epoch": 0.34, + "learning_rate": 0.00024897104600652835, + "loss": 0.0193, "step": 67430 }, { - "epoch": 0.73, - "learning_rate": 0.0001906402023740027, - "loss": 0.0127, + "epoch": 0.34, + "learning_rate": 0.00024896347831351433, + "loss": 0.0193, "step": 67440 }, { - "epoch": 0.73, - "learning_rate": 0.0001906239865083998, - "loss": 0.0129, + "epoch": 0.34, + "learning_rate": 0.00024895591062050037, + "loss": 0.0163, "step": 67450 }, { - "epoch": 0.73, - "learning_rate": 0.0001906077706427969, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024894834292748635, + "loss": 0.0163, "step": 67460 }, { - "epoch": 0.73, - "learning_rate": 0.000190591554777194, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.00024894077523447233, + "loss": 0.0185, "step": 67470 }, { - "epoch": 0.73, - "learning_rate": 0.00019057533891159108, - "loss": 0.0156, + "epoch": 0.34, + "learning_rate": 0.0002489332075414583, + "loss": 0.0225, "step": 67480 }, { - "epoch": 0.73, - "learning_rate": 0.00019055912304598817, - "loss": 0.0178, + "epoch": 0.34, + "learning_rate": 0.0002489256398484443, + "loss": 0.0176, "step": 67490 }, { - "epoch": 0.73, - "learning_rate": 0.00019054290718038526, - "loss": 0.0179, + "epoch": 0.34, + "learning_rate": 0.0002489180721554303, + "loss": 0.0166, "step": 67500 }, { - "epoch": 0.73, - "learning_rate": 0.00019052669131478238, - "loss": 0.0195, + "epoch": 0.34, + "learning_rate": 0.00024891050446241626, + "loss": 0.0199, "step": 67510 }, { - "epoch": 0.73, - "learning_rate": 0.00019051047544917945, - "loss": 0.0179, + "epoch": 0.34, + "learning_rate": 0.0002489029367694023, + "loss": 0.0205, "step": 67520 }, { - "epoch": 0.73, - "learning_rate": 0.00019049425958357654, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.0002488953690763883, + "loss": 0.0201, "step": 67530 }, { - "epoch": 0.73, - "learning_rate": 0.00019047804371797366, - "loss": 0.0172, + "epoch": 0.34, + "learning_rate": 0.00024888780138337426, + "loss": 0.0173, "step": 67540 }, { - "epoch": 0.73, - "learning_rate": 0.00019046182785237075, - "loss": 0.0165, + "epoch": 0.34, + "learning_rate": 0.00024888023369036024, + "loss": 0.02, "step": 67550 }, { - "epoch": 0.73, - "learning_rate": 0.00019044561198676782, - "loss": 0.0138, + "epoch": 0.34, + "learning_rate": 0.0002488726659973462, + "loss": 0.0188, "step": 67560 }, { - "epoch": 0.73, - "learning_rate": 0.0001904293961211649, - "loss": 0.0169, + "epoch": 0.34, + "learning_rate": 0.0002488650983043322, + "loss": 0.0218, "step": 67570 }, { - "epoch": 0.73, - "learning_rate": 0.00019041318025556203, - "loss": 0.0195, + "epoch": 0.34, + "learning_rate": 0.00024885753061131824, + "loss": 0.015, "step": 67580 }, { - "epoch": 0.73, - "learning_rate": 0.00019039696438995912, - "loss": 0.0158, + "epoch": 0.34, + "learning_rate": 0.0002488499629183042, + "loss": 0.0174, "step": 67590 }, { - "epoch": 0.73, - "learning_rate": 0.0001903807485243562, - "loss": 0.0138, + "epoch": 0.34, + "learning_rate": 0.0002488423952252902, + "loss": 0.0237, "step": 67600 }, { - "epoch": 0.73, - "learning_rate": 0.0001903645326587533, - "loss": 0.0154, + "epoch": 0.34, + "learning_rate": 0.0002488348275322762, + "loss": 0.0171, "step": 67610 }, { - "epoch": 0.73, - "learning_rate": 0.0001903483167931504, - "loss": 0.013, + "epoch": 0.34, + "learning_rate": 0.00024882725983926216, + "loss": 0.0203, "step": 67620 }, { - "epoch": 0.73, - "learning_rate": 0.0001903321009275475, - "loss": 0.017, + "epoch": 0.34, + "learning_rate": 0.00024881969214624814, + "loss": 0.0142, "step": 67630 }, { - "epoch": 0.73, - "learning_rate": 0.00019031588506194461, - "loss": 0.016, + "epoch": 0.34, + "learning_rate": 0.0002488121244532342, + "loss": 0.0177, "step": 67640 }, { - "epoch": 0.73, - "learning_rate": 0.00019029966919634168, - "loss": 0.0171, + "epoch": 0.34, + "learning_rate": 0.00024880455676022016, + "loss": 0.0195, "step": 67650 }, { - "epoch": 0.73, - "learning_rate": 0.00019028345333073877, - "loss": 0.0184, + "epoch": 0.34, + "learning_rate": 0.00024879698906720614, + "loss": 0.021, "step": 67660 }, { - "epoch": 0.73, - "learning_rate": 0.0001902672374651359, - "loss": 0.0199, + "epoch": 0.34, + "learning_rate": 0.0002487894213741921, + "loss": 0.0204, "step": 67670 }, { - "epoch": 0.73, - "learning_rate": 0.00019025102159953299, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.0002487818536811781, + "loss": 0.0162, "step": 67680 }, { - "epoch": 0.73, - "learning_rate": 0.00019023480573393005, - "loss": 0.0193, + "epoch": 0.34, + "learning_rate": 0.0002487742859881641, + "loss": 0.0174, "step": 67690 }, { - "epoch": 0.73, - "learning_rate": 0.00019021858986832714, - "loss": 0.0164, + "epoch": 0.34, + "learning_rate": 0.00024876671829515007, + "loss": 0.0177, "step": 67700 }, { - "epoch": 0.73, - "learning_rate": 0.00019020237400272426, - "loss": 0.0215, + "epoch": 0.34, + "learning_rate": 0.0002487591506021361, + "loss": 0.0166, "step": 67710 }, { - "epoch": 0.73, - "learning_rate": 0.00019018615813712136, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.0002487515829091221, + "loss": 0.0178, "step": 67720 }, { - "epoch": 0.73, - "learning_rate": 0.00019016994227151842, - "loss": 0.0193, + "epoch": 0.34, + "learning_rate": 0.00024874401521610807, + "loss": 0.0189, "step": 67730 }, { - "epoch": 0.73, - "learning_rate": 0.00019015372640591554, - "loss": 0.0282, + "epoch": 0.34, + "learning_rate": 0.00024873644752309405, + "loss": 0.0148, "step": 67740 }, { - "epoch": 0.73, - "learning_rate": 0.00019013751054031263, - "loss": 0.017, + "epoch": 0.34, + "learning_rate": 0.00024872887983008003, + "loss": 0.0177, "step": 67750 }, { - "epoch": 0.73, - "learning_rate": 0.00019012129467470973, - "loss": 0.0169, + "epoch": 0.34, + "learning_rate": 0.000248721312137066, + "loss": 0.0181, "step": 67760 }, { - "epoch": 0.73, - "learning_rate": 0.0001901050788091068, - "loss": 0.0161, + "epoch": 0.34, + "learning_rate": 0.00024871374444405205, + "loss": 0.0165, "step": 67770 }, { - "epoch": 0.73, - "learning_rate": 0.0001900888629435039, - "loss": 0.0157, + "epoch": 0.34, + "learning_rate": 0.00024870617675103803, + "loss": 0.0261, "step": 67780 }, { - "epoch": 0.73, - "learning_rate": 0.000190072647077901, - "loss": 0.0194, + "epoch": 0.34, + "learning_rate": 0.000248698609058024, + "loss": 0.0199, "step": 67790 }, { - "epoch": 0.73, - "learning_rate": 0.0001900564312122981, - "loss": 0.0154, + "epoch": 0.34, + "learning_rate": 0.00024869104136501, + "loss": 0.02, "step": 67800 }, { - "epoch": 0.73, - "learning_rate": 0.0001900402153466952, - "loss": 0.0203, + "epoch": 0.34, + "learning_rate": 0.00024868347367199597, + "loss": 0.0217, "step": 67810 }, { - "epoch": 0.73, - "learning_rate": 0.00019002399948109228, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.00024867590597898195, + "loss": 0.0202, "step": 67820 }, { - "epoch": 0.73, - "learning_rate": 0.00019000778361548938, - "loss": 0.0202, + "epoch": 0.34, + "learning_rate": 0.00024866833828596793, + "loss": 0.0166, "step": 67830 }, { - "epoch": 0.73, - "learning_rate": 0.0001899915677498865, - "loss": 0.0171, + "epoch": 0.34, + "learning_rate": 0.00024866077059295397, + "loss": 0.0191, "step": 67840 }, { - "epoch": 0.73, - "learning_rate": 0.00018997535188428356, - "loss": 0.0192, + "epoch": 0.34, + "learning_rate": 0.00024865320289993995, + "loss": 0.0181, "step": 67850 }, { - "epoch": 0.73, - "learning_rate": 0.00018995913601868065, - "loss": 0.0136, + "epoch": 0.34, + "learning_rate": 0.00024864563520692593, + "loss": 0.0199, "step": 67860 }, { - "epoch": 0.73, - "learning_rate": 0.00018994292015307775, - "loss": 0.0155, + "epoch": 0.34, + "learning_rate": 0.0002486380675139119, + "loss": 0.019, "step": 67870 }, { - "epoch": 0.73, - "learning_rate": 0.00018992670428747487, - "loss": 0.0196, + "epoch": 0.34, + "learning_rate": 0.0002486304998208979, + "loss": 0.0182, "step": 67880 }, { - "epoch": 0.73, - "learning_rate": 0.00018991048842187193, + "epoch": 0.34, + "learning_rate": 0.0002486229321278839, "loss": 0.0155, "step": 67890 }, { - "epoch": 0.73, - "learning_rate": 0.00018989427255626903, - "loss": 0.0185, + "epoch": 0.34, + "learning_rate": 0.0002486153644348699, + "loss": 0.0169, "step": 67900 }, { - "epoch": 0.73, - "learning_rate": 0.00018987805669066615, - "loss": 0.0146, + "epoch": 0.34, + "learning_rate": 0.0002486077967418559, + "loss": 0.0171, "step": 67910 }, { - "epoch": 0.73, - "learning_rate": 0.00018986184082506324, - "loss": 0.0135, + "epoch": 0.34, + "learning_rate": 0.0002486002290488419, + "loss": 0.0227, "step": 67920 }, { - "epoch": 0.73, - "learning_rate": 0.0001898456249594603, - "loss": 0.016, + "epoch": 0.34, + "learning_rate": 0.00024859266135582786, + "loss": 0.0201, "step": 67930 }, { - "epoch": 0.73, - "learning_rate": 0.0001898294090938574, - "loss": 0.017, + "epoch": 0.34, + "learning_rate": 0.00024858509366281384, + "loss": 0.0165, "step": 67940 }, { - "epoch": 0.73, - "learning_rate": 0.00018981319322825452, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.0002485775259697998, + "loss": 0.0154, "step": 67950 }, { - "epoch": 0.73, - "learning_rate": 0.0001897969773626516, - "loss": 0.0192, + "epoch": 0.34, + "learning_rate": 0.00024856995827678586, + "loss": 0.0165, "step": 67960 }, { - "epoch": 0.73, - "learning_rate": 0.00018978076149704868, - "loss": 0.0138, + "epoch": 0.34, + "learning_rate": 0.00024856239058377184, + "loss": 0.0199, "step": 67970 }, { - "epoch": 0.73, - "learning_rate": 0.0001897645456314458, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.0002485548228907578, + "loss": 0.0166, "step": 67980 }, { - "epoch": 0.74, - "learning_rate": 0.0001897483297658429, - "loss": 0.0155, + "epoch": 0.34, + "learning_rate": 0.0002485472551977438, + "loss": 0.0178, "step": 67990 }, { - "epoch": 0.74, - "learning_rate": 0.00018973211390023998, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.0002485396875047298, + "loss": 0.0206, "step": 68000 }, { - "epoch": 0.74, - "eval_cer": 0.921535620538638, - "eval_loss": 0.010959140956401825, - "eval_runtime": 121.0862, - "eval_samples_per_second": 16.517, - "eval_steps_per_second": 4.129, + "epoch": 0.34, + "eval_cer": 0.9144692855070369, + "eval_loss": 0.013180240988731384, + "eval_runtime": 116.7123, + "eval_samples_per_second": 17.136, + "eval_steps_per_second": 4.284, "step": 68000 }, { - "epoch": 0.74, - "learning_rate": 0.00018971589803463705, - "loss": 0.0131, + "epoch": 0.34, + "learning_rate": 0.00024853211981171576, + "loss": 0.0169, "step": 68010 }, { - "epoch": 0.74, - "learning_rate": 0.00018969968216903417, - "loss": 0.0131, + "epoch": 0.34, + "learning_rate": 0.00024852455211870174, + "loss": 0.0189, "step": 68020 }, { - "epoch": 0.74, - "learning_rate": 0.00018968346630343126, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.0002485169844256878, + "loss": 0.0172, "step": 68030 }, { - "epoch": 0.74, - "learning_rate": 0.00018966725043782838, - "loss": 0.0119, + "epoch": 0.34, + "learning_rate": 0.00024850941673267376, + "loss": 0.019, "step": 68040 }, { - "epoch": 0.74, - "learning_rate": 0.00018965103457222544, - "loss": 0.0213, + "epoch": 0.34, + "learning_rate": 0.00024850184903965974, + "loss": 0.0184, "step": 68050 }, { - "epoch": 0.74, - "learning_rate": 0.00018963481870662254, - "loss": 0.0156, + "epoch": 0.34, + "learning_rate": 0.0002484942813466457, + "loss": 0.015, "step": 68060 }, { - "epoch": 0.74, - "learning_rate": 0.00018961860284101963, - "loss": 0.0166, + "epoch": 0.34, + "learning_rate": 0.0002484867136536317, + "loss": 0.0175, "step": 68070 }, { - "epoch": 0.74, - "learning_rate": 0.00018960238697541675, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.0002484791459606177, + "loss": 0.0203, "step": 68080 }, { - "epoch": 0.74, - "learning_rate": 0.00018958617110981382, - "loss": 0.0154, + "epoch": 0.34, + "learning_rate": 0.0002484715782676037, + "loss": 0.0184, "step": 68090 }, { - "epoch": 0.74, - "learning_rate": 0.0001895699552442109, - "loss": 0.0155, + "epoch": 0.34, + "learning_rate": 0.0002484640105745897, + "loss": 0.021, "step": 68100 }, { - "epoch": 0.74, - "learning_rate": 0.00018955373937860803, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.0002484564428815757, + "loss": 0.0204, "step": 68110 }, { - "epoch": 0.74, - "learning_rate": 0.00018953752351300512, - "loss": 0.0184, + "epoch": 0.34, + "learning_rate": 0.00024844887518856167, + "loss": 0.0199, "step": 68120 }, { - "epoch": 0.74, - "learning_rate": 0.00018952130764740219, - "loss": 0.012, + "epoch": 0.34, + "learning_rate": 0.00024844130749554765, + "loss": 0.0175, "step": 68130 }, { - "epoch": 0.74, - "learning_rate": 0.00018950509178179928, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.00024843373980253363, + "loss": 0.0201, "step": 68140 }, { - "epoch": 0.74, - "learning_rate": 0.0001894888759161964, - "loss": 0.016, + "epoch": 0.34, + "learning_rate": 0.0002484261721095196, + "loss": 0.0196, "step": 68150 }, { - "epoch": 0.74, - "learning_rate": 0.0001894726600505935, - "loss": 0.0124, + "epoch": 0.34, + "learning_rate": 0.00024841860441650565, + "loss": 0.0186, "step": 68160 }, { - "epoch": 0.74, - "learning_rate": 0.00018945644418499056, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024841103672349163, + "loss": 0.0208, "step": 68170 }, { - "epoch": 0.74, - "learning_rate": 0.00018944022831938768, - "loss": 0.0168, + "epoch": 0.34, + "learning_rate": 0.0002484034690304776, + "loss": 0.0244, "step": 68180 }, { - "epoch": 0.74, - "learning_rate": 0.00018942401245378477, - "loss": 0.0169, + "epoch": 0.34, + "learning_rate": 0.0002483959013374636, + "loss": 0.0239, "step": 68190 }, { - "epoch": 0.74, - "learning_rate": 0.00018940779658818186, - "loss": 0.0161, + "epoch": 0.34, + "learning_rate": 0.0002483883336444496, + "loss": 0.0216, "step": 68200 }, { - "epoch": 0.74, - "learning_rate": 0.00018939158072257893, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.00024838076595143555, + "loss": 0.0191, "step": 68210 }, { - "epoch": 0.74, - "learning_rate": 0.00018937536485697605, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.0002483731982584216, + "loss": 0.0216, "step": 68220 }, { - "epoch": 0.74, - "learning_rate": 0.00018935914899137314, - "loss": 0.0128, + "epoch": 0.34, + "learning_rate": 0.00024836563056540757, + "loss": 0.0223, "step": 68230 }, { - "epoch": 0.74, - "learning_rate": 0.00018934293312577023, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.00024835806287239355, + "loss": 0.0246, "step": 68240 }, { - "epoch": 0.74, - "learning_rate": 0.00018932671726016733, - "loss": 0.0142, + "epoch": 0.34, + "learning_rate": 0.00024835049517937953, + "loss": 0.0193, "step": 68250 }, { - "epoch": 0.74, - "learning_rate": 0.00018931050139456442, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.0002483429274863655, + "loss": 0.0206, "step": 68260 }, { - "epoch": 0.74, - "learning_rate": 0.0001892942855289615, - "loss": 0.0133, + "epoch": 0.34, + "learning_rate": 0.0002483353597933515, + "loss": 0.0176, "step": 68270 }, { - "epoch": 0.74, - "learning_rate": 0.00018927806966335863, - "loss": 0.0175, + "epoch": 0.34, + "learning_rate": 0.00024832779210033753, + "loss": 0.0206, "step": 68280 }, { - "epoch": 0.74, - "learning_rate": 0.0001892618537977557, - "loss": 0.0124, + "epoch": 0.34, + "learning_rate": 0.0002483202244073235, + "loss": 0.0177, "step": 68290 }, { - "epoch": 0.74, - "learning_rate": 0.0001892456379321528, - "loss": 0.0154, + "epoch": 0.34, + "learning_rate": 0.0002483126567143095, + "loss": 0.0207, "step": 68300 }, { - "epoch": 0.74, - "learning_rate": 0.0001892294220665499, - "loss": 0.0146, + "epoch": 0.34, + "learning_rate": 0.0002483050890212955, + "loss": 0.0214, "step": 68310 }, { - "epoch": 0.74, - "learning_rate": 0.000189213206200947, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024829752132828146, + "loss": 0.0199, "step": 68320 }, { - "epoch": 0.74, - "learning_rate": 0.00018919699033534407, - "loss": 0.015, + "epoch": 0.34, + "learning_rate": 0.00024828995363526744, + "loss": 0.0216, "step": 68330 }, { - "epoch": 0.74, - "learning_rate": 0.00018918077446974116, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.0002482823859422534, + "loss": 0.0187, "step": 68340 }, { - "epoch": 0.74, - "learning_rate": 0.00018916455860413828, - "loss": 0.0147, + "epoch": 0.34, + "learning_rate": 0.00024827481824923946, + "loss": 0.0205, "step": 68350 }, { - "epoch": 0.74, - "learning_rate": 0.00018914834273853537, - "loss": 0.0161, + "epoch": 0.34, + "learning_rate": 0.00024826725055622544, + "loss": 0.0198, "step": 68360 }, { - "epoch": 0.74, - "learning_rate": 0.00018913212687293247, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.0002482596828632114, + "loss": 0.0172, "step": 68370 }, { - "epoch": 0.74, - "learning_rate": 0.00018911591100732956, - "loss": 0.0176, + "epoch": 0.34, + "learning_rate": 0.0002482521151701974, + "loss": 0.0191, "step": 68380 }, { - "epoch": 0.74, - "learning_rate": 0.00018909969514172665, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.0002482445474771834, + "loss": 0.0183, "step": 68390 }, { - "epoch": 0.74, - "learning_rate": 0.00018908347927612374, - "loss": 0.0125, + "epoch": 0.35, + "learning_rate": 0.00024823697978416936, + "loss": 0.0167, "step": 68400 }, { - "epoch": 0.74, - "learning_rate": 0.00018906726341052086, - "loss": 0.0159, + "epoch": 0.35, + "learning_rate": 0.0002482294120911554, + "loss": 0.0175, "step": 68410 }, { - "epoch": 0.74, - "learning_rate": 0.00018905104754491793, - "loss": 0.0159, + "epoch": 0.35, + "learning_rate": 0.0002482218443981414, + "loss": 0.0226, "step": 68420 }, { - "epoch": 0.74, - "learning_rate": 0.00018903483167931502, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024821427670512736, + "loss": 0.0181, "step": 68430 }, { - "epoch": 0.74, - "learning_rate": 0.00018901861581371212, - "loss": 0.0204, + "epoch": 0.35, + "learning_rate": 0.00024820670901211334, + "loss": 0.0177, "step": 68440 }, { - "epoch": 0.74, - "learning_rate": 0.00018900239994810924, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.0002481991413190993, + "loss": 0.0178, "step": 68450 }, { - "epoch": 0.74, - "learning_rate": 0.0001889861840825063, - "loss": 0.0129, + "epoch": 0.35, + "learning_rate": 0.0002481915736260853, + "loss": 0.0184, "step": 68460 }, { - "epoch": 0.74, - "learning_rate": 0.0001889699682169034, - "loss": 0.0133, + "epoch": 0.35, + "learning_rate": 0.00024818400593307134, + "loss": 0.0159, "step": 68470 }, { - "epoch": 0.74, - "learning_rate": 0.0001889537523513005, - "loss": 0.0139, + "epoch": 0.35, + "learning_rate": 0.0002481764382400573, + "loss": 0.0201, "step": 68480 }, { - "epoch": 0.74, - "learning_rate": 0.0001889375364856976, - "loss": 0.0166, + "epoch": 0.35, + "learning_rate": 0.0002481688705470433, + "loss": 0.0196, "step": 68490 }, { - "epoch": 0.74, - "learning_rate": 0.00018892132062009467, - "loss": 0.018, + "epoch": 0.35, + "learning_rate": 0.0002481613028540293, + "loss": 0.0198, "step": 68500 }, { - "epoch": 0.74, - "learning_rate": 0.00018890510475449176, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.00024815373516101527, + "loss": 0.0162, "step": 68510 }, { - "epoch": 0.74, - "learning_rate": 0.00018888888888888888, - "loss": 0.0188, + "epoch": 0.35, + "learning_rate": 0.00024814616746800125, + "loss": 0.0233, "step": 68520 }, { - "epoch": 0.74, - "learning_rate": 0.00018887267302328598, - "loss": 0.0129, + "epoch": 0.35, + "learning_rate": 0.00024813859977498723, + "loss": 0.0157, "step": 68530 }, { - "epoch": 0.74, - "learning_rate": 0.00018885645715768304, - "loss": 0.0172, + "epoch": 0.35, + "learning_rate": 0.0002481310320819732, + "loss": 0.0198, "step": 68540 }, { - "epoch": 0.74, - "learning_rate": 0.00018884024129208016, - "loss": 0.0146, + "epoch": 0.35, + "learning_rate": 0.0002481234643889592, + "loss": 0.0187, "step": 68550 }, { - "epoch": 0.74, - "learning_rate": 0.00018882402542647726, - "loss": 0.015, + "epoch": 0.35, + "learning_rate": 0.0002481158966959452, + "loss": 0.0171, "step": 68560 }, { - "epoch": 0.74, - "learning_rate": 0.00018880780956087435, - "loss": 0.0154, + "epoch": 0.35, + "learning_rate": 0.00024810832900293116, + "loss": 0.014, "step": 68570 }, { - "epoch": 0.74, - "learning_rate": 0.00018879159369527141, - "loss": 0.0168, + "epoch": 0.35, + "learning_rate": 0.0002481007613099172, + "loss": 0.0164, "step": 68580 }, { - "epoch": 0.74, - "learning_rate": 0.00018877537782966853, + "epoch": 0.35, + "learning_rate": 0.0002480931936169032, "loss": 0.0158, "step": 68590 }, { - "epoch": 0.74, - "learning_rate": 0.00018875916196406563, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.00024808562592388916, + "loss": 0.0178, "step": 68600 }, { - "epoch": 0.74, - "learning_rate": 0.00018874294609846275, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.00024807805823087514, + "loss": 0.0215, "step": 68610 }, { - "epoch": 0.74, - "learning_rate": 0.0001887267302328598, - "loss": 0.0176, + "epoch": 0.35, + "learning_rate": 0.0002480704905378611, + "loss": 0.0182, "step": 68620 }, { - "epoch": 0.74, - "learning_rate": 0.0001887105143672569, - "loss": 0.0145, + "epoch": 0.35, + "learning_rate": 0.0002480629228448471, + "loss": 0.019, "step": 68630 }, { - "epoch": 0.74, - "learning_rate": 0.000188694298501654, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.00024805535515183314, + "loss": 0.0183, "step": 68640 }, { - "epoch": 0.74, - "learning_rate": 0.00018867808263605112, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.0002480477874588191, + "loss": 0.0185, "step": 68650 }, { - "epoch": 0.74, - "learning_rate": 0.00018866186677044818, - "loss": 0.0145, + "epoch": 0.35, + "learning_rate": 0.0002480402197658051, + "loss": 0.0205, "step": 68660 }, { - "epoch": 0.74, - "learning_rate": 0.00018864565090484528, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.0002480326520727911, + "loss": 0.019, "step": 68670 }, { - "epoch": 0.74, - "learning_rate": 0.0001886294350392424, - "loss": 0.0196, + "epoch": 0.35, + "learning_rate": 0.00024802508437977706, + "loss": 0.0174, "step": 68680 }, { - "epoch": 0.74, - "learning_rate": 0.0001886132191736395, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024801751668676304, + "loss": 0.0223, "step": 68690 }, { - "epoch": 0.74, - "learning_rate": 0.00018859700330803655, - "loss": 0.0159, + "epoch": 0.35, + "learning_rate": 0.0002480099489937491, + "loss": 0.0172, "step": 68700 }, { - "epoch": 0.74, - "learning_rate": 0.00018858078744243365, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.00024800238130073506, + "loss": 0.019, "step": 68710 }, { - "epoch": 0.74, - "learning_rate": 0.00018856457157683077, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.00024799481360772104, + "loss": 0.0165, "step": 68720 }, { - "epoch": 0.74, - "learning_rate": 0.00018854835571122786, - "loss": 0.0169, + "epoch": 0.35, + "learning_rate": 0.000247987245914707, + "loss": 0.0224, "step": 68730 }, { - "epoch": 0.74, - "learning_rate": 0.00018853213984562492, - "loss": 0.0155, + "epoch": 0.35, + "learning_rate": 0.000247979678221693, + "loss": 0.0159, "step": 68740 }, { - "epoch": 0.74, - "learning_rate": 0.00018851592398002204, - "loss": 0.0146, + "epoch": 0.35, + "learning_rate": 0.000247972110528679, + "loss": 0.0246, "step": 68750 }, { - "epoch": 0.74, - "learning_rate": 0.00018849970811441914, - "loss": 0.016, + "epoch": 0.35, + "learning_rate": 0.00024796454283566497, + "loss": 0.0189, "step": 68760 }, { - "epoch": 0.74, - "learning_rate": 0.00018848349224881623, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.000247956975142651, + "loss": 0.0204, "step": 68770 }, { - "epoch": 0.74, - "learning_rate": 0.0001884672763832133, - "loss": 0.0133, + "epoch": 0.35, + "learning_rate": 0.000247949407449637, + "loss": 0.0139, "step": 68780 }, { - "epoch": 0.74, - "learning_rate": 0.00018845106051761042, - "loss": 0.0172, + "epoch": 0.35, + "learning_rate": 0.00024794183975662297, + "loss": 0.0155, "step": 68790 }, { - "epoch": 0.74, - "learning_rate": 0.0001884348446520075, - "loss": 0.0179, + "epoch": 0.35, + "learning_rate": 0.00024793427206360895, + "loss": 0.0197, "step": 68800 }, { - "epoch": 0.74, - "learning_rate": 0.0001884186287864046, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.00024792670437059493, + "loss": 0.0176, "step": 68810 }, { - "epoch": 0.74, - "learning_rate": 0.0001884024129208017, - "loss": 0.0183, + "epoch": 0.35, + "learning_rate": 0.0002479191366775809, + "loss": 0.0352, "step": 68820 }, { - "epoch": 0.74, - "learning_rate": 0.0001883861970551988, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.00024791156898456695, + "loss": 0.021, "step": 68830 }, { - "epoch": 0.74, - "learning_rate": 0.00018836998118959588, - "loss": 0.0163, + "epoch": 0.35, + "learning_rate": 0.00024790400129155293, + "loss": 0.0193, "step": 68840 }, { - "epoch": 0.74, - "learning_rate": 0.000188353765323993, - "loss": 0.0145, + "epoch": 0.35, + "learning_rate": 0.0002478964335985389, + "loss": 0.0245, "step": 68850 }, { - "epoch": 0.74, - "learning_rate": 0.00018833754945839006, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.0002478888659055249, + "loss": 0.0221, "step": 68860 }, { - "epoch": 0.74, - "learning_rate": 0.00018832133359278716, - "loss": 0.0174, + "epoch": 0.35, + "learning_rate": 0.00024788129821251087, + "loss": 0.0198, "step": 68870 }, { - "epoch": 0.74, - "learning_rate": 0.00018830511772718425, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.00024787373051949685, + "loss": 0.022, "step": 68880 }, { - "epoch": 0.74, - "learning_rate": 0.00018828890186158137, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.00024786616282648283, + "loss": 0.0186, "step": 68890 }, { - "epoch": 0.74, - "learning_rate": 0.00018827268599597844, - "loss": 0.0133, + "epoch": 0.35, + "learning_rate": 0.00024785859513346887, + "loss": 0.0228, "step": 68900 }, { - "epoch": 0.74, - "learning_rate": 0.00018825647013037553, - "loss": 0.0162, + "epoch": 0.35, + "learning_rate": 0.00024785102744045485, + "loss": 0.0237, "step": 68910 }, { - "epoch": 0.75, - "learning_rate": 0.00018824025426477265, - "loss": 0.0163, + "epoch": 0.35, + "learning_rate": 0.00024784345974744083, + "loss": 0.0238, "step": 68920 }, { - "epoch": 0.75, - "learning_rate": 0.00018822403839916974, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.0002478358920544268, + "loss": 0.0186, "step": 68930 }, { - "epoch": 0.75, - "learning_rate": 0.0001882078225335668, - "loss": 0.0164, + "epoch": 0.35, + "learning_rate": 0.0002478283243614128, + "loss": 0.0199, "step": 68940 }, { - "epoch": 0.75, - "learning_rate": 0.0001881916066679639, - "loss": 0.0132, + "epoch": 0.35, + "learning_rate": 0.0002478207566683988, + "loss": 0.0207, "step": 68950 }, { - "epoch": 0.75, - "learning_rate": 0.00018817539080236102, - "loss": 0.0145, + "epoch": 0.35, + "learning_rate": 0.0002478131889753848, + "loss": 0.0246, "step": 68960 }, { - "epoch": 0.75, - "learning_rate": 0.0001881591749367581, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.0002478056212823708, + "loss": 0.0194, "step": 68970 }, { - "epoch": 0.75, - "learning_rate": 0.00018814295907115518, - "loss": 0.0165, + "epoch": 0.35, + "learning_rate": 0.0002477980535893568, + "loss": 0.0235, "step": 68980 }, { - "epoch": 0.75, - "learning_rate": 0.0001881267432055523, - "loss": 0.0175, + "epoch": 0.35, + "learning_rate": 0.00024779048589634276, + "loss": 0.0227, "step": 68990 }, { - "epoch": 0.75, - "learning_rate": 0.0001881105273399494, - "loss": 0.0168, + "epoch": 0.35, + "learning_rate": 0.00024778291820332874, + "loss": 0.0194, "step": 69000 }, { - "epoch": 0.75, - "eval_cer": 0.921567758848024, - "eval_loss": 0.010564006865024567, - "eval_runtime": 121.2365, - "eval_samples_per_second": 16.497, - "eval_steps_per_second": 4.124, + "epoch": 0.35, + "eval_cer": 0.9145119829365546, + "eval_loss": 0.014301990158855915, + "eval_runtime": 116.8153, + "eval_samples_per_second": 17.121, + "eval_steps_per_second": 4.28, "step": 69000 }, { - "epoch": 0.75, - "learning_rate": 0.00018809431147434648, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.0002477753505103147, + "loss": 0.0174, "step": 69010 }, { - "epoch": 0.75, - "learning_rate": 0.00018807809560874355, - "loss": 0.0152, + "epoch": 0.35, + "learning_rate": 0.00024776778281730076, + "loss": 0.0214, "step": 69020 }, { - "epoch": 0.75, - "learning_rate": 0.00018806187974314067, - "loss": 0.0165, + "epoch": 0.35, + "learning_rate": 0.00024776021512428674, + "loss": 0.0158, "step": 69030 }, { - "epoch": 0.75, - "learning_rate": 0.00018804566387753776, - "loss": 0.0118, + "epoch": 0.35, + "learning_rate": 0.0002477526474312727, + "loss": 0.0175, "step": 69040 }, { - "epoch": 0.75, - "learning_rate": 0.00018802944801193488, - "loss": 0.0188, + "epoch": 0.35, + "learning_rate": 0.0002477450797382587, + "loss": 0.0176, "step": 69050 }, { - "epoch": 0.75, - "learning_rate": 0.00018801323214633197, - "loss": 0.0162, + "epoch": 0.35, + "learning_rate": 0.0002477375120452447, + "loss": 0.0165, "step": 69060 }, { - "epoch": 0.75, - "learning_rate": 0.00018799701628072904, - "loss": 0.0165, + "epoch": 0.35, + "learning_rate": 0.00024772994435223066, + "loss": 0.0191, "step": 69070 }, { - "epoch": 0.75, - "learning_rate": 0.00018798080041512613, - "loss": 0.0153, + "epoch": 0.35, + "learning_rate": 0.00024772237665921665, + "loss": 0.019, "step": 69080 }, { - "epoch": 0.75, - "learning_rate": 0.00018796458454952325, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.0002477148089662027, + "loss": 0.0206, "step": 69090 }, { - "epoch": 0.75, - "learning_rate": 0.00018794836868392034, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024770724127318866, + "loss": 0.0244, "step": 69100 }, { - "epoch": 0.75, - "learning_rate": 0.0001879321528183174, - "loss": 0.0155, + "epoch": 0.35, + "learning_rate": 0.00024769967358017464, + "loss": 0.0197, "step": 69110 }, { - "epoch": 0.75, - "learning_rate": 0.00018791593695271453, - "loss": 0.0144, + "epoch": 0.35, + "learning_rate": 0.0002476921058871606, + "loss": 0.0204, "step": 69120 }, { - "epoch": 0.75, - "learning_rate": 0.00018789972108711162, - "loss": 0.0113, + "epoch": 0.35, + "learning_rate": 0.0002476845381941466, + "loss": 0.0234, "step": 69130 }, { - "epoch": 0.75, - "learning_rate": 0.00018788350522150872, - "loss": 0.0164, + "epoch": 0.35, + "learning_rate": 0.0002476769705011326, + "loss": 0.0166, "step": 69140 }, { - "epoch": 0.75, - "learning_rate": 0.00018786728935590578, - "loss": 0.0113, + "epoch": 0.35, + "learning_rate": 0.0002476694028081186, + "loss": 0.0201, "step": 69150 }, { - "epoch": 0.75, - "learning_rate": 0.0001878510734903029, - "loss": 0.0125, + "epoch": 0.35, + "learning_rate": 0.0002476618351151046, + "loss": 0.0182, "step": 69160 }, { - "epoch": 0.75, - "learning_rate": 0.0001878348576247, - "loss": 0.0128, + "epoch": 0.35, + "learning_rate": 0.0002476542674220906, + "loss": 0.0224, "step": 69170 }, { - "epoch": 0.75, - "learning_rate": 0.0001878186417590971, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.00024764669972907657, + "loss": 0.0181, "step": 69180 }, { - "epoch": 0.75, - "learning_rate": 0.00018780242589349418, - "loss": 0.0157, + "epoch": 0.35, + "learning_rate": 0.00024763913203606255, + "loss": 0.0172, "step": 69190 }, { - "epoch": 0.75, - "learning_rate": 0.00018778621002789127, - "loss": 0.0153, + "epoch": 0.35, + "learning_rate": 0.00024763156434304853, + "loss": 0.0215, "step": 69200 }, { - "epoch": 0.75, - "learning_rate": 0.00018776999416228837, - "loss": 0.0152, + "epoch": 0.35, + "learning_rate": 0.00024762399665003457, + "loss": 0.016, "step": 69210 }, { - "epoch": 0.75, - "learning_rate": 0.00018775377829668548, - "loss": 0.0146, + "epoch": 0.35, + "learning_rate": 0.00024761642895702055, + "loss": 0.019, "step": 69220 }, { - "epoch": 0.75, - "learning_rate": 0.00018773756243108255, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.00024760886126400653, + "loss": 0.0175, "step": 69230 }, { - "epoch": 0.75, - "learning_rate": 0.00018772134656547964, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.0002476012935709925, + "loss": 0.0192, "step": 69240 }, { - "epoch": 0.75, - "learning_rate": 0.00018770513069987674, - "loss": 0.0128, + "epoch": 0.35, + "learning_rate": 0.0002475937258779785, + "loss": 0.0171, "step": 69250 }, { - "epoch": 0.75, - "learning_rate": 0.00018768891483427386, - "loss": 0.0144, + "epoch": 0.35, + "learning_rate": 0.0002475861581849645, + "loss": 0.016, "step": 69260 }, { - "epoch": 0.75, - "learning_rate": 0.00018767269896867092, - "loss": 0.0141, + "epoch": 0.35, + "learning_rate": 0.00024757859049195046, + "loss": 0.0192, "step": 69270 }, { - "epoch": 0.75, - "learning_rate": 0.00018765648310306801, - "loss": 0.0178, + "epoch": 0.35, + "learning_rate": 0.0002475710227989365, + "loss": 0.0171, "step": 69280 }, { - "epoch": 0.75, - "learning_rate": 0.00018764026723746513, - "loss": 0.0162, + "epoch": 0.35, + "learning_rate": 0.00024756345510592247, + "loss": 0.0179, "step": 69290 }, { - "epoch": 0.75, - "learning_rate": 0.00018762405137186223, - "loss": 0.0154, + "epoch": 0.35, + "learning_rate": 0.00024755588741290845, + "loss": 0.0191, "step": 69300 }, { - "epoch": 0.75, - "learning_rate": 0.0001876078355062593, - "loss": 0.0121, + "epoch": 0.35, + "learning_rate": 0.00024754831971989444, + "loss": 0.0194, "step": 69310 }, { - "epoch": 0.75, - "learning_rate": 0.00018759161964065639, - "loss": 0.0127, + "epoch": 0.35, + "learning_rate": 0.0002475407520268804, + "loss": 0.0206, "step": 69320 }, { - "epoch": 0.75, - "learning_rate": 0.0001875754037750535, - "loss": 0.0154, + "epoch": 0.35, + "learning_rate": 0.0002475331843338664, + "loss": 0.0214, "step": 69330 }, { - "epoch": 0.75, - "learning_rate": 0.0001875591879094506, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.00024752561664085243, + "loss": 0.0208, "step": 69340 }, { - "epoch": 0.75, - "learning_rate": 0.00018754297204384766, - "loss": 0.0162, + "epoch": 0.35, + "learning_rate": 0.0002475180489478384, + "loss": 0.0184, "step": 69350 }, { - "epoch": 0.75, - "learning_rate": 0.00018752675617824478, - "loss": 0.0186, + "epoch": 0.35, + "learning_rate": 0.0002475104812548244, + "loss": 0.0172, "step": 69360 }, { - "epoch": 0.75, - "learning_rate": 0.00018751054031264188, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.0002475029135618104, + "loss": 0.0237, "step": 69370 }, { - "epoch": 0.75, - "learning_rate": 0.00018749432444703897, - "loss": 0.0158, + "epoch": 0.35, + "learning_rate": 0.00024749534586879636, + "loss": 0.0197, "step": 69380 }, { - "epoch": 0.75, - "learning_rate": 0.00018747810858143606, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.00024748777817578234, + "loss": 0.0217, "step": 69390 }, { - "epoch": 0.75, - "learning_rate": 0.00018746189271583315, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.0002474802104827683, + "loss": 0.0231, "step": 69400 }, { - "epoch": 0.75, - "learning_rate": 0.00018744567685023025, - "loss": 0.0152, + "epoch": 0.35, + "learning_rate": 0.00024747264278975436, + "loss": 0.0189, "step": 69410 }, { - "epoch": 0.75, - "learning_rate": 0.00018742946098462737, - "loss": 0.0161, + "epoch": 0.35, + "learning_rate": 0.00024746507509674034, + "loss": 0.0188, "step": 69420 }, { - "epoch": 0.75, - "learning_rate": 0.00018741324511902443, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.0002474575074037263, + "loss": 0.0446, "step": 69430 }, { - "epoch": 0.75, - "learning_rate": 0.00018739702925342153, - "loss": 0.0153, + "epoch": 0.35, + "learning_rate": 0.0002474499397107123, + "loss": 0.0461, "step": 69440 }, { - "epoch": 0.75, - "learning_rate": 0.00018738081338781862, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.0002474423720176983, + "loss": 0.0163, "step": 69450 }, { - "epoch": 0.75, - "learning_rate": 0.00018736459752221574, - "loss": 0.0211, + "epoch": 0.35, + "learning_rate": 0.00024743480432468427, + "loss": 0.0194, "step": 69460 }, { - "epoch": 0.75, - "learning_rate": 0.0001873483816566128, - "loss": 0.016, + "epoch": 0.35, + "learning_rate": 0.0002474272366316703, + "loss": 0.019, "step": 69470 }, { - "epoch": 0.75, - "learning_rate": 0.0001873321657910099, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.0002474196689386563, + "loss": 0.0231, "step": 69480 }, { - "epoch": 0.75, - "learning_rate": 0.00018731594992540702, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.00024741210124564226, + "loss": 0.017, "step": 69490 }, { - "epoch": 0.75, - "learning_rate": 0.0001872997340598041, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.00024740453355262825, + "loss": 0.0185, "step": 69500 }, { - "epoch": 0.75, - "learning_rate": 0.00018728351819420117, - "loss": 0.0178, + "epoch": 0.35, + "learning_rate": 0.0002473969658596142, + "loss": 0.0169, "step": 69510 }, { - "epoch": 0.75, - "learning_rate": 0.00018726730232859827, - "loss": 0.0198, + "epoch": 0.35, + "learning_rate": 0.0002473893981666002, + "loss": 0.0238, "step": 69520 }, { - "epoch": 0.75, - "learning_rate": 0.0001872510864629954, - "loss": 0.0145, + "epoch": 0.35, + "learning_rate": 0.00024738183047358624, + "loss": 0.021, "step": 69530 }, { - "epoch": 0.75, - "learning_rate": 0.00018723487059739248, - "loss": 0.0153, + "epoch": 0.35, + "learning_rate": 0.0002473742627805722, + "loss": 0.0167, "step": 69540 }, { - "epoch": 0.75, - "learning_rate": 0.00018721865473178955, - "loss": 0.0141, + "epoch": 0.35, + "learning_rate": 0.0002473666950875582, + "loss": 0.0204, "step": 69550 }, { - "epoch": 0.75, - "learning_rate": 0.00018720243886618667, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.0002473591273945442, + "loss": 0.0204, "step": 69560 }, { - "epoch": 0.75, - "learning_rate": 0.00018718622300058376, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.00024735155970153017, + "loss": 0.0176, "step": 69570 }, { - "epoch": 0.75, - "learning_rate": 0.00018717000713498085, - "loss": 0.0164, + "epoch": 0.35, + "learning_rate": 0.00024734399200851615, + "loss": 0.0191, "step": 69580 }, { - "epoch": 0.75, - "learning_rate": 0.00018715379126937792, - "loss": 0.0146, + "epoch": 0.35, + "learning_rate": 0.00024733642431550213, + "loss": 0.018, "step": 69590 }, { - "epoch": 0.75, - "learning_rate": 0.00018713757540377504, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.00024732885662248817, + "loss": 0.0189, "step": 69600 }, { - "epoch": 0.75, - "learning_rate": 0.00018712135953817213, - "loss": 0.0154, + "epoch": 0.35, + "learning_rate": 0.00024732128892947415, + "loss": 0.0174, "step": 69610 }, { - "epoch": 0.75, - "learning_rate": 0.00018710514367256925, - "loss": 0.0123, + "epoch": 0.35, + "learning_rate": 0.00024731372123646013, + "loss": 0.0189, "step": 69620 }, { - "epoch": 0.75, - "learning_rate": 0.00018708892780696631, - "loss": 0.0155, + "epoch": 0.35, + "learning_rate": 0.0002473061535434461, + "loss": 0.0193, "step": 69630 }, { - "epoch": 0.75, - "learning_rate": 0.0001870727119413634, - "loss": 0.0111, + "epoch": 0.35, + "learning_rate": 0.0002472985858504321, + "loss": 0.0202, "step": 69640 }, { - "epoch": 0.75, - "learning_rate": 0.0001870564960757605, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.0002472910181574181, + "loss": 0.0162, "step": 69650 }, { - "epoch": 0.75, - "learning_rate": 0.00018704028021015762, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.0002472834504644041, + "loss": 0.0184, "step": 69660 }, { - "epoch": 0.75, - "learning_rate": 0.00018702406434455469, - "loss": 0.0162, + "epoch": 0.35, + "learning_rate": 0.0002472758827713901, + "loss": 0.0182, "step": 69670 }, { - "epoch": 0.75, - "learning_rate": 0.00018700784847895178, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.0002472683150783761, + "loss": 0.0283, "step": 69680 }, { - "epoch": 0.75, - "learning_rate": 0.0001869916326133489, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.00024726074738536206, + "loss": 0.0173, "step": 69690 }, { - "epoch": 0.75, - "learning_rate": 0.000186975416747746, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.00024725317969234804, + "loss": 0.0178, "step": 69700 }, { - "epoch": 0.75, - "learning_rate": 0.00018695920088214306, - "loss": 0.0117, + "epoch": 0.35, + "learning_rate": 0.000247245611999334, + "loss": 0.0161, "step": 69710 }, { - "epoch": 0.75, - "learning_rate": 0.00018694298501654015, - "loss": 0.0152, + "epoch": 0.35, + "learning_rate": 0.00024723804430632005, + "loss": 0.0178, "step": 69720 }, { - "epoch": 0.75, - "learning_rate": 0.00018692676915093727, - "loss": 0.0207, + "epoch": 0.35, + "learning_rate": 0.00024723047661330604, + "loss": 0.0196, "step": 69730 }, { - "epoch": 0.75, - "learning_rate": 0.00018691055328533436, - "loss": 0.0164, + "epoch": 0.35, + "learning_rate": 0.000247222908920292, + "loss": 0.0208, "step": 69740 }, { - "epoch": 0.75, - "learning_rate": 0.00018689433741973143, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.000247215341227278, + "loss": 0.0175, "step": 69750 }, { - "epoch": 0.75, - "learning_rate": 0.00018687812155412855, - "loss": 0.0144, + "epoch": 0.35, + "learning_rate": 0.000247207773534264, + "loss": 0.021, "step": 69760 }, { - "epoch": 0.75, - "learning_rate": 0.00018686190568852564, - "loss": 0.0136, + "epoch": 0.35, + "learning_rate": 0.00024720020584124996, + "loss": 0.0157, "step": 69770 }, { - "epoch": 0.75, - "learning_rate": 0.00018684568982292273, - "loss": 0.0154, + "epoch": 0.35, + "learning_rate": 0.00024719263814823594, + "loss": 0.017, "step": 69780 }, { - "epoch": 0.75, - "learning_rate": 0.00018682947395731985, - "loss": 0.016, + "epoch": 0.35, + "learning_rate": 0.0002471850704552219, + "loss": 0.0225, "step": 69790 }, { - "epoch": 0.75, - "learning_rate": 0.00018681325809171692, - "loss": 0.0153, + "epoch": 0.35, + "learning_rate": 0.0002471775027622079, + "loss": 0.0189, "step": 69800 }, { - "epoch": 0.75, - "learning_rate": 0.000186797042226114, - "loss": 0.0161, + "epoch": 0.35, + "learning_rate": 0.0002471699350691939, + "loss": 0.0204, "step": 69810 }, { - "epoch": 0.75, - "learning_rate": 0.0001867808263605111, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.00024716236737617987, + "loss": 0.0194, "step": 69820 }, { - "epoch": 0.75, - "learning_rate": 0.00018676461049490822, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.0002471547996831659, + "loss": 0.0211, "step": 69830 }, { - "epoch": 0.76, - "learning_rate": 0.0001867483946293053, - "loss": 0.0126, + "epoch": 0.35, + "learning_rate": 0.0002471472319901519, + "loss": 0.0197, "step": 69840 }, { - "epoch": 0.76, - "learning_rate": 0.00018673217876370238, - "loss": 0.015, + "epoch": 0.35, + "learning_rate": 0.00024713966429713787, + "loss": 0.0183, "step": 69850 }, { - "epoch": 0.76, - "learning_rate": 0.0001867159628980995, - "loss": 0.0157, + "epoch": 0.35, + "learning_rate": 0.00024713209660412385, + "loss": 0.0153, "step": 69860 }, { - "epoch": 0.76, - "learning_rate": 0.0001866997470324966, - "loss": 0.0169, + "epoch": 0.35, + "learning_rate": 0.00024712452891110983, + "loss": 0.0213, "step": 69870 }, { - "epoch": 0.76, - "learning_rate": 0.00018668353116689366, - "loss": 0.0154, + "epoch": 0.35, + "learning_rate": 0.0002471169612180958, + "loss": 0.0205, "step": 69880 }, { - "epoch": 0.76, - "learning_rate": 0.00018666731530129075, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.00024710939352508185, + "loss": 0.0184, "step": 69890 }, { - "epoch": 0.76, - "learning_rate": 0.00018665109943568787, - "loss": 0.0166, + "epoch": 0.35, + "learning_rate": 0.00024710182583206783, + "loss": 0.0185, "step": 69900 }, { - "epoch": 0.76, - "learning_rate": 0.00018663488357008497, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.0002470942581390538, + "loss": 0.0186, "step": 69910 }, { - "epoch": 0.76, - "learning_rate": 0.00018661866770448203, - "loss": 0.0141, + "epoch": 0.35, + "learning_rate": 0.0002470866904460398, + "loss": 0.0167, "step": 69920 }, { - "epoch": 0.76, - "learning_rate": 0.00018660245183887915, - "loss": 0.0171, + "epoch": 0.35, + "learning_rate": 0.00024707912275302577, + "loss": 0.0193, "step": 69930 }, { - "epoch": 0.76, - "learning_rate": 0.00018658623597327624, - "loss": 0.0174, + "epoch": 0.35, + "learning_rate": 0.00024707155506001175, + "loss": 0.0223, "step": 69940 }, { - "epoch": 0.76, - "learning_rate": 0.00018657002010767334, - "loss": 0.0164, + "epoch": 0.35, + "learning_rate": 0.00024706398736699774, + "loss": 0.0167, "step": 69950 }, { - "epoch": 0.76, - "learning_rate": 0.0001865538042420704, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.00024705641967398377, + "loss": 0.0175, "step": 69960 }, { - "epoch": 0.76, - "learning_rate": 0.00018653758837646752, - "loss": 0.0146, + "epoch": 0.35, + "learning_rate": 0.00024704885198096975, + "loss": 0.0165, "step": 69970 }, { - "epoch": 0.76, - "learning_rate": 0.00018652137251086461, - "loss": 0.0164, + "epoch": 0.35, + "learning_rate": 0.00024704128428795573, + "loss": 0.0174, "step": 69980 }, { - "epoch": 0.76, - "learning_rate": 0.00018650515664526173, - "loss": 0.0153, + "epoch": 0.35, + "learning_rate": 0.0002470337165949417, + "loss": 0.0218, "step": 69990 }, { - "epoch": 0.76, - "learning_rate": 0.0001864889407796588, - "loss": 0.0136, + "epoch": 0.35, + "learning_rate": 0.0002470261489019277, + "loss": 0.018, "step": 70000 }, { - "epoch": 0.76, - "eval_cer": 0.9215364891415945, - "eval_loss": 0.010723001323640347, - "eval_runtime": 121.1995, - "eval_samples_per_second": 16.502, - "eval_steps_per_second": 4.125, + "epoch": 0.35, + "eval_cer": 0.9144508479806542, + "eval_loss": 0.013182277791202068, + "eval_runtime": 116.7197, + "eval_samples_per_second": 17.135, + "eval_steps_per_second": 4.284, "step": 70000 }, { - "epoch": 0.76, - "learning_rate": 0.0001864727249140559, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.0002470185812089137, + "loss": 0.0209, "step": 70010 }, { - "epoch": 0.76, - "learning_rate": 0.00018645650904845299, - "loss": 0.0163, + "epoch": 0.35, + "learning_rate": 0.0002470110135158997, + "loss": 0.0188, "step": 70020 }, { - "epoch": 0.76, - "learning_rate": 0.0001864402931828501, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.0002470034458228857, + "loss": 0.02, "step": 70030 }, { - "epoch": 0.76, - "learning_rate": 0.00018642407731724717, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.0002469958781298717, + "loss": 0.0319, "step": 70040 }, { - "epoch": 0.76, - "learning_rate": 0.00018640786145164426, - "loss": 0.0166, + "epoch": 0.35, + "learning_rate": 0.00024698831043685766, + "loss": 0.0164, "step": 70050 }, { - "epoch": 0.76, - "learning_rate": 0.00018639164558604138, - "loss": 0.0174, + "epoch": 0.35, + "learning_rate": 0.00024698074274384364, + "loss": 0.0206, "step": 70060 }, { - "epoch": 0.76, - "learning_rate": 0.00018637542972043848, - "loss": 0.0161, + "epoch": 0.35, + "learning_rate": 0.0002469731750508296, + "loss": 0.0208, "step": 70070 }, { - "epoch": 0.76, - "learning_rate": 0.00018635921385483554, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.00024696560735781566, + "loss": 0.0216, "step": 70080 }, { - "epoch": 0.76, - "learning_rate": 0.00018634299798923263, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.00024695803966480164, + "loss": 0.0189, "step": 70090 }, { - "epoch": 0.76, - "learning_rate": 0.00018632678212362975, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.0002469504719717876, + "loss": 0.024, "step": 70100 }, { - "epoch": 0.76, - "learning_rate": 0.00018631056625802685, - "loss": 0.0161, + "epoch": 0.35, + "learning_rate": 0.0002469429042787736, + "loss": 0.0176, "step": 70110 }, { - "epoch": 0.76, - "learning_rate": 0.0001862943503924239, - "loss": 0.0172, + "epoch": 0.35, + "learning_rate": 0.0002469353365857596, + "loss": 0.0181, "step": 70120 }, { - "epoch": 0.76, - "learning_rate": 0.00018627813452682103, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.00024692776889274556, + "loss": 0.0192, "step": 70130 }, { - "epoch": 0.76, - "learning_rate": 0.00018626191866121813, - "loss": 0.0158, + "epoch": 0.35, + "learning_rate": 0.00024692020119973155, + "loss": 0.0241, "step": 70140 }, { - "epoch": 0.76, - "learning_rate": 0.00018624570279561522, - "loss": 0.0157, + "epoch": 0.35, + "learning_rate": 0.0002469126335067176, + "loss": 0.0196, "step": 70150 }, { - "epoch": 0.76, - "learning_rate": 0.00018622948693001228, - "loss": 0.0167, + "epoch": 0.35, + "learning_rate": 0.00024690506581370356, + "loss": 0.0185, "step": 70160 }, { - "epoch": 0.76, - "learning_rate": 0.0001862132710644094, - "loss": 0.017, + "epoch": 0.35, + "learning_rate": 0.00024689749812068954, + "loss": 0.0178, "step": 70170 }, { - "epoch": 0.76, - "learning_rate": 0.0001861970551988065, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.0002468899304276755, + "loss": 0.0179, "step": 70180 }, { - "epoch": 0.76, - "learning_rate": 0.0001861808393332036, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.0002468823627346615, + "loss": 0.0232, "step": 70190 }, { - "epoch": 0.76, - "learning_rate": 0.00018616462346760068, - "loss": 0.0189, + "epoch": 0.35, + "learning_rate": 0.0002468747950416475, + "loss": 0.0184, "step": 70200 }, { - "epoch": 0.76, - "learning_rate": 0.00018614840760199777, - "loss": 0.0172, + "epoch": 0.35, + "learning_rate": 0.0002468672273486335, + "loss": 0.0163, "step": 70210 }, { - "epoch": 0.76, - "learning_rate": 0.00018613219173639487, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.0002468596596556195, + "loss": 0.0159, "step": 70220 }, { - "epoch": 0.76, - "learning_rate": 0.000186115975870792, - "loss": 0.0136, + "epoch": 0.35, + "learning_rate": 0.0002468520919626055, + "loss": 0.0198, "step": 70230 }, { - "epoch": 0.76, - "learning_rate": 0.00018609976000518905, - "loss": 0.0146, + "epoch": 0.35, + "learning_rate": 0.00024684452426959147, + "loss": 0.0188, "step": 70240 }, { - "epoch": 0.76, - "learning_rate": 0.00018608354413958615, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.00024683695657657745, + "loss": 0.0212, "step": 70250 }, { - "epoch": 0.76, - "learning_rate": 0.00018606732827398324, - "loss": 0.0163, + "epoch": 0.35, + "learning_rate": 0.00024682938888356343, + "loss": 0.0175, "step": 70260 }, { - "epoch": 0.76, - "learning_rate": 0.00018605111240838036, - "loss": 0.0161, + "epoch": 0.35, + "learning_rate": 0.00024682182119054947, + "loss": 0.0172, "step": 70270 }, { - "epoch": 0.76, - "learning_rate": 0.00018603489654277742, - "loss": 0.0162, + "epoch": 0.35, + "learning_rate": 0.00024681425349753545, + "loss": 0.0191, "step": 70280 }, { - "epoch": 0.76, - "learning_rate": 0.00018601868067717452, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.00024680668580452143, + "loss": 0.0196, "step": 70290 }, { - "epoch": 0.76, - "learning_rate": 0.00018600246481157164, - "loss": 0.0141, + "epoch": 0.35, + "learning_rate": 0.0002467991181115074, + "loss": 0.0184, "step": 70300 }, { - "epoch": 0.76, - "learning_rate": 0.00018598624894596873, + "epoch": 0.35, + "learning_rate": 0.0002467915504184934, "loss": 0.0172, "step": 70310 }, { - "epoch": 0.76, - "learning_rate": 0.0001859700330803658, - "loss": 0.0173, + "epoch": 0.35, + "learning_rate": 0.0002467839827254794, + "loss": 0.0198, "step": 70320 }, { - "epoch": 0.76, - "learning_rate": 0.0001859538172147629, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.00024677641503246536, + "loss": 0.0193, "step": 70330 }, { - "epoch": 0.76, - "learning_rate": 0.00018593760134916, - "loss": 0.0136, + "epoch": 0.35, + "learning_rate": 0.0002467688473394514, + "loss": 0.0177, "step": 70340 }, { - "epoch": 0.76, - "learning_rate": 0.0001859213854835571, - "loss": 0.0139, + "epoch": 0.35, + "learning_rate": 0.00024676127964643737, + "loss": 0.017, "step": 70350 }, { - "epoch": 0.76, - "learning_rate": 0.00018590516961795417, - "loss": 0.0133, + "epoch": 0.35, + "learning_rate": 0.00024675371195342335, + "loss": 0.0191, "step": 70360 }, { - "epoch": 0.76, - "learning_rate": 0.00018588895375235129, - "loss": 0.0153, + "epoch": 0.36, + "learning_rate": 0.00024674614426040934, + "loss": 0.0194, "step": 70370 }, { - "epoch": 0.76, - "learning_rate": 0.00018587273788674838, - "loss": 0.0122, + "epoch": 0.36, + "learning_rate": 0.0002467385765673953, + "loss": 0.0163, "step": 70380 }, { - "epoch": 0.76, - "learning_rate": 0.00018585652202114547, - "loss": 0.0164, + "epoch": 0.36, + "learning_rate": 0.0002467310088743813, + "loss": 0.0163, "step": 70390 }, { - "epoch": 0.76, - "learning_rate": 0.00018584030615554256, - "loss": 0.016, + "epoch": 0.36, + "learning_rate": 0.00024672344118136733, + "loss": 0.0186, "step": 70400 }, { - "epoch": 0.76, - "learning_rate": 0.00018582409028993966, - "loss": 0.0158, + "epoch": 0.36, + "learning_rate": 0.0002467158734883533, + "loss": 0.0175, "step": 70410 }, { - "epoch": 0.76, - "learning_rate": 0.00018580787442433675, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.0002467083057953393, + "loss": 0.0164, "step": 70420 }, { - "epoch": 0.76, - "learning_rate": 0.00018579165855873387, - "loss": 0.0167, + "epoch": 0.36, + "learning_rate": 0.0002467007381023253, + "loss": 0.0178, "step": 70430 }, { - "epoch": 0.76, - "learning_rate": 0.00018577544269313094, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.00024669317040931126, + "loss": 0.021, "step": 70440 }, { - "epoch": 0.76, - "learning_rate": 0.00018575922682752803, - "loss": 0.0166, + "epoch": 0.36, + "learning_rate": 0.00024668560271629724, + "loss": 0.0229, "step": 70450 }, { - "epoch": 0.76, - "learning_rate": 0.00018574301096192512, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.0002466780350232832, + "loss": 0.0205, "step": 70460 }, { - "epoch": 0.76, - "learning_rate": 0.00018572679509632224, - "loss": 0.0144, + "epoch": 0.36, + "learning_rate": 0.00024667046733026926, + "loss": 0.0169, "step": 70470 }, { - "epoch": 0.76, - "learning_rate": 0.0001857105792307193, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.00024666289963725524, + "loss": 0.0181, "step": 70480 }, { - "epoch": 0.76, - "learning_rate": 0.0001856943633651164, - "loss": 0.0162, + "epoch": 0.36, + "learning_rate": 0.0002466553319442412, + "loss": 0.0197, "step": 70490 }, { - "epoch": 0.76, - "learning_rate": 0.00018567814749951352, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.0002466477642512272, + "loss": 0.0183, "step": 70500 }, { - "epoch": 0.76, - "learning_rate": 0.0001856619316339106, - "loss": 0.0173, + "epoch": 0.36, + "learning_rate": 0.0002466401965582132, + "loss": 0.0198, "step": 70510 }, { - "epoch": 0.76, - "learning_rate": 0.0001856457157683077, - "loss": 0.0157, + "epoch": 0.36, + "learning_rate": 0.00024663262886519917, + "loss": 0.0174, "step": 70520 }, { - "epoch": 0.76, - "learning_rate": 0.00018562949990270477, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.0002466250611721852, + "loss": 0.0221, "step": 70530 }, { - "epoch": 0.76, - "learning_rate": 0.0001856132840371019, - "loss": 0.0154, + "epoch": 0.36, + "learning_rate": 0.0002466174934791712, + "loss": 0.0203, "step": 70540 }, { - "epoch": 0.76, - "learning_rate": 0.00018559706817149898, - "loss": 0.0152, + "epoch": 0.36, + "learning_rate": 0.00024660992578615716, + "loss": 0.0206, "step": 70550 }, { - "epoch": 0.76, - "learning_rate": 0.00018558085230589608, - "loss": 0.0151, + "epoch": 0.36, + "learning_rate": 0.00024660235809314315, + "loss": 0.0192, "step": 70560 }, { - "epoch": 0.76, - "learning_rate": 0.00018556463644029317, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.0002465947904001291, + "loss": 0.0157, "step": 70570 }, { - "epoch": 0.76, - "learning_rate": 0.00018554842057469026, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.0002465872227071151, + "loss": 0.0193, "step": 70580 }, { - "epoch": 0.76, - "learning_rate": 0.00018553220470908735, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.00024657965501410114, + "loss": 0.0199, "step": 70590 }, { - "epoch": 0.76, - "learning_rate": 0.00018551598884348447, - "loss": 0.0129, + "epoch": 0.36, + "learning_rate": 0.0002465720873210871, + "loss": 0.0168, "step": 70600 }, { - "epoch": 0.76, - "learning_rate": 0.00018549977297788154, - "loss": 0.0156, + "epoch": 0.36, + "learning_rate": 0.0002465645196280731, + "loss": 0.0155, "step": 70610 }, { - "epoch": 0.76, - "learning_rate": 0.00018548355711227863, - "loss": 0.0152, + "epoch": 0.36, + "learning_rate": 0.0002465569519350591, + "loss": 0.0235, "step": 70620 }, { - "epoch": 0.76, - "learning_rate": 0.00018546734124667575, - "loss": 0.0116, + "epoch": 0.36, + "learning_rate": 0.00024654938424204507, + "loss": 0.0158, "step": 70630 }, { - "epoch": 0.76, - "learning_rate": 0.00018545112538107284, - "loss": 0.0165, + "epoch": 0.36, + "learning_rate": 0.00024654181654903105, + "loss": 0.0199, "step": 70640 }, { - "epoch": 0.76, - "learning_rate": 0.0001854349095154699, - "loss": 0.012, + "epoch": 0.36, + "learning_rate": 0.00024653424885601703, + "loss": 0.02, "step": 70650 }, { - "epoch": 0.76, - "learning_rate": 0.000185418693649867, - "loss": 0.0157, + "epoch": 0.36, + "learning_rate": 0.00024652668116300307, + "loss": 0.0156, "step": 70660 }, { - "epoch": 0.76, - "learning_rate": 0.00018540247778426412, - "loss": 0.0145, + "epoch": 0.36, + "learning_rate": 0.00024651911346998905, + "loss": 0.02, "step": 70670 }, { - "epoch": 0.76, - "learning_rate": 0.00018538626191866122, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.00024651154577697503, + "loss": 0.0187, "step": 70680 }, { - "epoch": 0.76, - "learning_rate": 0.00018537004605305828, - "loss": 0.0147, + "epoch": 0.36, + "learning_rate": 0.000246503978083961, + "loss": 0.0175, "step": 70690 }, { - "epoch": 0.76, - "learning_rate": 0.0001853538301874554, - "loss": 0.0161, + "epoch": 0.36, + "learning_rate": 0.000246496410390947, + "loss": 0.0217, "step": 70700 }, { - "epoch": 0.76, - "learning_rate": 0.0001853376143218525, - "loss": 0.0144, + "epoch": 0.36, + "learning_rate": 0.000246488842697933, + "loss": 0.0209, "step": 70710 }, { - "epoch": 0.76, - "learning_rate": 0.00018532139845624959, - "loss": 0.016, + "epoch": 0.36, + "learning_rate": 0.000246481275004919, + "loss": 0.0165, "step": 70720 }, { - "epoch": 0.76, - "learning_rate": 0.00018530518259064665, - "loss": 0.0107, + "epoch": 0.36, + "learning_rate": 0.000246473707311905, + "loss": 0.0153, "step": 70730 }, { - "epoch": 0.76, - "learning_rate": 0.00018528896672504377, - "loss": 0.0158, + "epoch": 0.36, + "learning_rate": 0.000246466139618891, + "loss": 0.0177, "step": 70740 }, { - "epoch": 0.76, - "learning_rate": 0.00018527275085944086, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.00024645857192587696, + "loss": 0.0173, "step": 70750 }, { - "epoch": 0.76, - "learning_rate": 0.00018525653499383796, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.00024645100423286294, + "loss": 0.0176, "step": 70760 }, { - "epoch": 0.77, - "learning_rate": 0.00018524031912823505, - "loss": 0.0125, + "epoch": 0.36, + "learning_rate": 0.0002464434365398489, + "loss": 0.0163, "step": 70770 }, { - "epoch": 0.77, - "learning_rate": 0.00018522410326263214, - "loss": 0.0151, + "epoch": 0.36, + "learning_rate": 0.00024643586884683495, + "loss": 0.0202, "step": 70780 }, { - "epoch": 0.77, - "learning_rate": 0.00018520788739702924, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.00024642830115382094, + "loss": 0.0138, "step": 70790 }, { - "epoch": 0.77, - "learning_rate": 0.00018519167153142636, - "loss": 0.0172, + "epoch": 0.36, + "learning_rate": 0.0002464207334608069, + "loss": 0.0166, "step": 70800 }, { - "epoch": 0.77, - "learning_rate": 0.00018517545566582342, - "loss": 0.0178, + "epoch": 0.36, + "learning_rate": 0.0002464131657677929, + "loss": 0.0192, "step": 70810 }, { - "epoch": 0.77, - "learning_rate": 0.0001851592398002205, - "loss": 0.0118, + "epoch": 0.36, + "learning_rate": 0.0002464055980747789, + "loss": 0.0188, "step": 70820 }, { - "epoch": 0.77, - "learning_rate": 0.0001851430239346176, - "loss": 0.0157, + "epoch": 0.36, + "learning_rate": 0.00024639803038176486, + "loss": 0.0169, "step": 70830 }, { - "epoch": 0.77, - "learning_rate": 0.00018512680806901473, - "loss": 0.0154, + "epoch": 0.36, + "learning_rate": 0.00024639046268875084, + "loss": 0.0169, "step": 70840 }, { - "epoch": 0.77, - "learning_rate": 0.0001851105922034118, - "loss": 0.0144, + "epoch": 0.36, + "learning_rate": 0.0002463828949957369, + "loss": 0.0182, "step": 70850 }, { - "epoch": 0.77, - "learning_rate": 0.00018509437633780888, - "loss": 0.0143, + "epoch": 0.36, + "learning_rate": 0.00024637532730272286, + "loss": 0.0181, "step": 70860 }, { - "epoch": 0.77, - "learning_rate": 0.000185078160472206, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.00024636775960970884, + "loss": 0.0165, "step": 70870 }, { - "epoch": 0.77, - "learning_rate": 0.0001850619446066031, - "loss": 0.0169, + "epoch": 0.36, + "learning_rate": 0.0002463601919166948, + "loss": 0.0154, "step": 70880 }, { - "epoch": 0.77, - "learning_rate": 0.00018504572874100016, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.0002463526242236808, + "loss": 0.0171, "step": 70890 }, { - "epoch": 0.77, - "learning_rate": 0.00018502951287539726, - "loss": 0.0157, + "epoch": 0.36, + "learning_rate": 0.0002463450565306668, + "loss": 0.0183, "step": 70900 }, { - "epoch": 0.77, - "learning_rate": 0.00018501329700979438, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.0002463374888376528, + "loss": 0.0181, "step": 70910 }, { - "epoch": 0.77, - "learning_rate": 0.00018499708114419147, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.0002463299211446388, + "loss": 0.0174, "step": 70920 }, { - "epoch": 0.77, - "learning_rate": 0.00018498086527858853, - "loss": 0.0151, + "epoch": 0.36, + "learning_rate": 0.0002463223534516248, + "loss": 0.0202, "step": 70930 }, { - "epoch": 0.77, - "learning_rate": 0.00018496464941298565, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.00024631478575861077, + "loss": 0.0203, "step": 70940 }, { - "epoch": 0.77, - "learning_rate": 0.00018494843354738275, - "loss": 0.0191, + "epoch": 0.36, + "learning_rate": 0.00024630721806559675, + "loss": 0.0189, "step": 70950 }, { - "epoch": 0.77, - "learning_rate": 0.00018493221768177984, - "loss": 0.0166, + "epoch": 0.36, + "learning_rate": 0.00024629965037258273, + "loss": 0.0199, "step": 70960 }, { - "epoch": 0.77, - "learning_rate": 0.0001849160018161769, - "loss": 0.0152, + "epoch": 0.36, + "learning_rate": 0.0002462920826795687, + "loss": 0.0169, "step": 70970 }, { - "epoch": 0.77, - "learning_rate": 0.00018489978595057402, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.00024628451498655475, + "loss": 0.0166, "step": 70980 }, { - "epoch": 0.77, - "learning_rate": 0.00018488357008497112, - "loss": 0.0133, + "epoch": 0.36, + "learning_rate": 0.0002462769472935407, + "loss": 0.0164, "step": 70990 }, { - "epoch": 0.77, - "learning_rate": 0.00018486735421936824, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002462693796005267, + "loss": 0.0199, "step": 71000 }, { - "epoch": 0.77, - "eval_cer": 0.9215330147297689, - "eval_loss": 0.010413131676614285, - "eval_runtime": 121.2759, - "eval_samples_per_second": 16.491, - "eval_steps_per_second": 4.123, + "epoch": 0.36, + "eval_cer": 0.9145042197675514, + "eval_loss": 0.013640601187944412, + "eval_runtime": 116.7174, + "eval_samples_per_second": 17.135, + "eval_steps_per_second": 4.284, "step": 71000 }, { - "epoch": 0.77, - "learning_rate": 0.0001848511383537653, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.0002462618119075127, + "loss": 0.0179, "step": 71010 }, { - "epoch": 0.77, - "learning_rate": 0.0001848349224881624, - "loss": 0.0147, + "epoch": 0.36, + "learning_rate": 0.00024625424421449867, + "loss": 0.0169, "step": 71020 }, { - "epoch": 0.77, - "learning_rate": 0.0001848187066225595, - "loss": 0.0153, + "epoch": 0.36, + "learning_rate": 0.00024624667652148465, + "loss": 0.019, "step": 71030 }, { - "epoch": 0.77, - "learning_rate": 0.0001848024907569566, - "loss": 0.0136, + "epoch": 0.36, + "learning_rate": 0.00024623910882847063, + "loss": 0.0206, "step": 71040 }, { - "epoch": 0.77, - "learning_rate": 0.00018478627489135367, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.0002462315411354566, + "loss": 0.0143, "step": 71050 }, { - "epoch": 0.77, - "learning_rate": 0.00018477005902575077, - "loss": 0.0151, + "epoch": 0.36, + "learning_rate": 0.0002462239734424426, + "loss": 0.0205, "step": 71060 }, { - "epoch": 0.77, - "learning_rate": 0.00018475384316014789, - "loss": 0.0162, + "epoch": 0.36, + "learning_rate": 0.0002462164057494286, + "loss": 0.0194, "step": 71070 }, { - "epoch": 0.77, - "learning_rate": 0.00018473762729454498, - "loss": 0.0158, + "epoch": 0.36, + "learning_rate": 0.0002462088380564146, + "loss": 0.0177, "step": 71080 }, { - "epoch": 0.77, - "learning_rate": 0.00018472141142894204, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.0002462012703634006, + "loss": 0.0223, "step": 71090 }, { - "epoch": 0.77, - "learning_rate": 0.00018470519556333914, - "loss": 0.0165, + "epoch": 0.36, + "learning_rate": 0.0002461937026703866, + "loss": 0.0198, "step": 71100 }, { - "epoch": 0.77, - "learning_rate": 0.00018468897969773626, - "loss": 0.0152, + "epoch": 0.36, + "learning_rate": 0.00024618613497737256, + "loss": 0.0183, "step": 71110 }, { - "epoch": 0.77, - "learning_rate": 0.00018467276383213335, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.00024617856728435854, + "loss": 0.0222, "step": 71120 }, { - "epoch": 0.77, - "learning_rate": 0.00018465654796653042, - "loss": 0.0163, + "epoch": 0.36, + "learning_rate": 0.0002461709995913445, + "loss": 0.0175, "step": 71130 }, { - "epoch": 0.77, - "learning_rate": 0.00018464033210092754, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.00024616343189833056, + "loss": 0.0197, "step": 71140 }, { - "epoch": 0.77, - "learning_rate": 0.00018462411623532463, - "loss": 0.0123, + "epoch": 0.36, + "learning_rate": 0.00024615586420531654, + "loss": 0.0223, "step": 71150 }, { - "epoch": 0.77, - "learning_rate": 0.00018460790036972172, - "loss": 0.0162, + "epoch": 0.36, + "learning_rate": 0.0002461482965123025, + "loss": 0.0152, "step": 71160 }, { - "epoch": 0.77, - "learning_rate": 0.0001845916845041188, - "loss": 0.0157, + "epoch": 0.36, + "learning_rate": 0.0002461407288192885, + "loss": 0.0192, "step": 71170 }, { - "epoch": 0.77, - "learning_rate": 0.0001845754686385159, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.0002461331611262745, + "loss": 0.0223, "step": 71180 }, { - "epoch": 0.77, - "learning_rate": 0.000184559252772913, - "loss": 0.0132, + "epoch": 0.36, + "learning_rate": 0.00024612559343326046, + "loss": 0.0179, "step": 71190 }, { - "epoch": 0.77, - "learning_rate": 0.0001845430369073101, - "loss": 0.017, + "epoch": 0.36, + "learning_rate": 0.00024611802574024645, + "loss": 0.0198, "step": 71200 }, { - "epoch": 0.77, - "learning_rate": 0.00018452682104170718, - "loss": 0.0152, + "epoch": 0.36, + "learning_rate": 0.0002461104580472325, + "loss": 0.0182, "step": 71210 }, { - "epoch": 0.77, - "learning_rate": 0.00018451060517610428, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.00024610289035421846, + "loss": 0.0168, "step": 71220 }, { - "epoch": 0.77, - "learning_rate": 0.00018449438931050137, - "loss": 0.0169, + "epoch": 0.36, + "learning_rate": 0.00024609532266120444, + "loss": 0.0191, "step": 71230 }, { - "epoch": 0.77, - "learning_rate": 0.0001844781734448985, - "loss": 0.0155, + "epoch": 0.36, + "learning_rate": 0.0002460877549681904, + "loss": 0.0171, "step": 71240 }, { - "epoch": 0.77, - "learning_rate": 0.00018446195757929558, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.0002460801872751764, + "loss": 0.0154, "step": 71250 }, { - "epoch": 0.77, - "learning_rate": 0.00018444574171369265, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.0002460726195821624, + "loss": 0.0173, "step": 71260 }, { - "epoch": 0.77, - "learning_rate": 0.00018442952584808974, - "loss": 0.0162, + "epoch": 0.36, + "learning_rate": 0.0002460650518891484, + "loss": 0.018, "step": 71270 }, { - "epoch": 0.77, - "learning_rate": 0.00018441330998248686, - "loss": 0.0115, + "epoch": 0.36, + "learning_rate": 0.0002460574841961344, + "loss": 0.018, "step": 71280 }, { - "epoch": 0.77, - "learning_rate": 0.00018439709411688395, - "loss": 0.0136, + "epoch": 0.36, + "learning_rate": 0.0002460499165031204, + "loss": 0.0166, "step": 71290 }, { - "epoch": 0.77, - "learning_rate": 0.00018438087825128102, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.00024604234881010637, + "loss": 0.02, "step": 71300 }, { - "epoch": 0.77, - "learning_rate": 0.00018436466238567814, - "loss": 0.0166, + "epoch": 0.36, + "learning_rate": 0.00024603478111709235, + "loss": 0.0157, "step": 71310 }, { - "epoch": 0.77, - "learning_rate": 0.00018434844652007523, - "loss": 0.0154, + "epoch": 0.36, + "learning_rate": 0.00024602721342407833, + "loss": 0.0169, "step": 71320 }, { - "epoch": 0.77, - "learning_rate": 0.00018433223065447232, - "loss": 0.0149, + "epoch": 0.36, + "learning_rate": 0.00024601964573106437, + "loss": 0.0161, "step": 71330 }, { - "epoch": 0.77, - "learning_rate": 0.0001843160147888694, - "loss": 0.0158, + "epoch": 0.36, + "learning_rate": 0.00024601207803805035, + "loss": 0.0164, "step": 71340 }, { - "epoch": 0.77, - "learning_rate": 0.0001842997989232665, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.00024600451034503633, + "loss": 0.0193, "step": 71350 }, { - "epoch": 0.77, - "learning_rate": 0.0001842835830576636, - "loss": 0.0132, + "epoch": 0.36, + "learning_rate": 0.0002459969426520223, + "loss": 0.0161, "step": 71360 }, { - "epoch": 0.77, - "learning_rate": 0.00018426736719206072, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002459893749590083, + "loss": 0.0136, "step": 71370 }, { - "epoch": 0.77, - "learning_rate": 0.0001842511513264578, - "loss": 0.0122, + "epoch": 0.36, + "learning_rate": 0.0002459818072659943, + "loss": 0.0146, "step": 71380 }, { - "epoch": 0.77, - "learning_rate": 0.00018423493546085488, - "loss": 0.0127, + "epoch": 0.36, + "learning_rate": 0.00024597423957298026, + "loss": 0.0178, "step": 71390 }, { - "epoch": 0.77, - "learning_rate": 0.00018421871959525197, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.0002459666718799663, + "loss": 0.0177, "step": 71400 }, { - "epoch": 0.77, - "learning_rate": 0.0001842025037296491, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.00024595910418695227, + "loss": 0.015, "step": 71410 }, { - "epoch": 0.77, - "learning_rate": 0.00018418628786404616, - "loss": 0.0122, + "epoch": 0.36, + "learning_rate": 0.00024595153649393825, + "loss": 0.0234, "step": 71420 }, { - "epoch": 0.77, - "learning_rate": 0.00018417007199844325, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.00024594396880092424, + "loss": 0.0189, "step": 71430 }, { - "epoch": 0.77, - "learning_rate": 0.00018415385613284037, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.0002459364011079102, + "loss": 0.0195, "step": 71440 }, { - "epoch": 0.77, - "learning_rate": 0.00018413764026723746, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.0002459288334148962, + "loss": 0.018, "step": 71450 }, { - "epoch": 0.77, - "learning_rate": 0.00018412142440163453, - "loss": 0.0157, + "epoch": 0.36, + "learning_rate": 0.00024592126572188223, + "loss": 0.0142, "step": 71460 }, { - "epoch": 0.77, - "learning_rate": 0.00018410520853603162, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.0002459136980288682, + "loss": 0.0171, "step": 71470 }, { - "epoch": 0.77, - "learning_rate": 0.00018408899267042874, - "loss": 0.0154, + "epoch": 0.36, + "learning_rate": 0.0002459061303358542, + "loss": 0.018, "step": 71480 }, { - "epoch": 0.77, - "learning_rate": 0.00018407277680482584, - "loss": 0.0179, + "epoch": 0.36, + "learning_rate": 0.0002458985626428402, + "loss": 0.0163, "step": 71490 }, { - "epoch": 0.77, - "learning_rate": 0.0001840565609392229, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.00024589099494982616, + "loss": 0.0148, "step": 71500 }, { - "epoch": 0.77, - "learning_rate": 0.00018404034507362002, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.00024588342725681214, + "loss": 0.0154, "step": 71510 }, { - "epoch": 0.77, - "learning_rate": 0.00018402412920801711, - "loss": 0.0152, + "epoch": 0.36, + "learning_rate": 0.0002458758595637982, + "loss": 0.0158, "step": 71520 }, { - "epoch": 0.77, - "learning_rate": 0.0001840079133424142, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.00024586829187078416, + "loss": 0.0192, "step": 71530 }, { - "epoch": 0.77, - "learning_rate": 0.00018399169747681127, - "loss": 0.0168, + "epoch": 0.36, + "learning_rate": 0.00024586072417777014, + "loss": 0.0162, "step": 71540 }, { - "epoch": 0.77, - "learning_rate": 0.0001839754816112084, - "loss": 0.0175, + "epoch": 0.36, + "learning_rate": 0.0002458531564847561, + "loss": 0.0189, "step": 71550 }, { - "epoch": 0.77, - "learning_rate": 0.00018395926574560548, - "loss": 0.0143, + "epoch": 0.36, + "learning_rate": 0.0002458455887917421, + "loss": 0.0136, "step": 71560 }, { - "epoch": 0.77, - "learning_rate": 0.00018394304988000258, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.0002458380210987281, + "loss": 0.0169, "step": 71570 }, { - "epoch": 0.77, - "learning_rate": 0.00018392683401439967, - "loss": 0.0145, + "epoch": 0.36, + "learning_rate": 0.00024583045340571407, + "loss": 0.018, "step": 71580 }, { - "epoch": 0.77, - "learning_rate": 0.00018391061814879676, - "loss": 0.0165, + "epoch": 0.36, + "learning_rate": 0.0002458228857127001, + "loss": 0.0199, "step": 71590 }, { - "epoch": 0.77, - "learning_rate": 0.00018389440228319386, - "loss": 0.0147, + "epoch": 0.36, + "learning_rate": 0.0002458153180196861, + "loss": 0.0157, "step": 71600 }, { - "epoch": 0.77, - "learning_rate": 0.00018387818641759098, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.00024580775032667206, + "loss": 0.0174, "step": 71610 }, { - "epoch": 0.77, - "learning_rate": 0.00018386197055198804, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.00024580018263365805, + "loss": 0.0175, "step": 71620 }, { - "epoch": 0.77, - "learning_rate": 0.00018384575468638513, - "loss": 0.0119, + "epoch": 0.36, + "learning_rate": 0.000245792614940644, + "loss": 0.0184, "step": 71630 }, { - "epoch": 0.77, - "learning_rate": 0.00018382953882078225, - "loss": 0.0148, + "epoch": 0.36, + "learning_rate": 0.00024578504724763, + "loss": 0.0176, "step": 71640 }, { - "epoch": 0.77, - "learning_rate": 0.00018381332295517935, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.00024577747955461604, + "loss": 0.0222, "step": 71650 }, { - "epoch": 0.77, - "learning_rate": 0.0001837971070895764, - "loss": 0.0147, + "epoch": 0.36, + "learning_rate": 0.000245769911861602, + "loss": 0.0182, "step": 71660 }, { - "epoch": 0.77, - "learning_rate": 0.0001837808912239735, - "loss": 0.0112, + "epoch": 0.36, + "learning_rate": 0.000245762344168588, + "loss": 0.0146, "step": 71670 }, { - "epoch": 0.77, - "learning_rate": 0.00018376467535837062, - "loss": 0.0149, + "epoch": 0.36, + "learning_rate": 0.000245754776475574, + "loss": 0.018, "step": 71680 }, { - "epoch": 0.78, - "learning_rate": 0.00018374845949276772, - "loss": 0.0154, + "epoch": 0.36, + "learning_rate": 0.00024574720878255997, + "loss": 0.0151, "step": 71690 }, { - "epoch": 0.78, - "learning_rate": 0.00018373224362716478, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.00024573964108954595, + "loss": 0.0177, "step": 71700 }, { - "epoch": 0.78, - "learning_rate": 0.0001837160277615619, - "loss": 0.0164, + "epoch": 0.36, + "learning_rate": 0.00024573207339653193, + "loss": 0.0204, "step": 71710 }, { - "epoch": 0.78, - "learning_rate": 0.000183699811895959, - "loss": 0.016, + "epoch": 0.36, + "learning_rate": 0.00024572450570351797, + "loss": 0.0163, "step": 71720 }, { - "epoch": 0.78, - "learning_rate": 0.0001836835960303561, - "loss": 0.0151, + "epoch": 0.36, + "learning_rate": 0.00024571693801050395, + "loss": 0.0202, "step": 71730 }, { - "epoch": 0.78, - "learning_rate": 0.00018366738016475315, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.00024570937031748993, + "loss": 0.017, "step": 71740 }, { - "epoch": 0.78, - "learning_rate": 0.00018365116429915027, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002457018026244759, + "loss": 0.0207, "step": 71750 }, { - "epoch": 0.78, - "learning_rate": 0.00018363494843354737, - "loss": 0.0119, + "epoch": 0.36, + "learning_rate": 0.0002456942349314619, + "loss": 0.0169, "step": 71760 }, { - "epoch": 0.78, - "learning_rate": 0.00018361873256794446, - "loss": 0.0143, + "epoch": 0.36, + "learning_rate": 0.0002456866672384479, + "loss": 0.0184, "step": 71770 }, { - "epoch": 0.78, - "learning_rate": 0.00018360251670234155, - "loss": 0.0122, + "epoch": 0.36, + "learning_rate": 0.0002456790995454339, + "loss": 0.0186, "step": 71780 }, { - "epoch": 0.78, - "learning_rate": 0.00018358630083673865, - "loss": 0.0166, + "epoch": 0.36, + "learning_rate": 0.0002456715318524199, + "loss": 0.0152, "step": 71790 }, { - "epoch": 0.78, - "learning_rate": 0.00018357008497113574, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.0002456639641594059, + "loss": 0.0157, "step": 71800 }, { - "epoch": 0.78, - "learning_rate": 0.00018355386910553286, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.00024565639646639186, + "loss": 0.0204, "step": 71810 }, { - "epoch": 0.78, - "learning_rate": 0.00018353765323992992, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.00024564882877337784, + "loss": 0.0197, "step": 71820 }, { - "epoch": 0.78, - "learning_rate": 0.00018352143737432702, - "loss": 0.0165, + "epoch": 0.36, + "learning_rate": 0.0002456412610803638, + "loss": 0.0185, "step": 71830 }, { - "epoch": 0.78, - "learning_rate": 0.0001835052215087241, - "loss": 0.0159, + "epoch": 0.36, + "learning_rate": 0.00024563369338734985, + "loss": 0.0177, "step": 71840 }, { - "epoch": 0.78, - "learning_rate": 0.00018348900564312123, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.00024562612569433584, + "loss": 0.0259, "step": 71850 }, { - "epoch": 0.78, - "learning_rate": 0.0001834727897775183, - "loss": 0.015, + "epoch": 0.36, + "learning_rate": 0.0002456185580013218, + "loss": 0.0205, "step": 71860 }, { - "epoch": 0.78, - "learning_rate": 0.0001834565739119154, - "loss": 0.015, + "epoch": 0.36, + "learning_rate": 0.0002456109903083078, + "loss": 0.0149, "step": 71870 }, { - "epoch": 0.78, - "learning_rate": 0.0001834403580463125, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.0002456034226152938, + "loss": 0.018, "step": 71880 }, { - "epoch": 0.78, - "learning_rate": 0.0001834241421807096, - "loss": 0.0178, + "epoch": 0.36, + "learning_rate": 0.00024559585492227976, + "loss": 0.0192, "step": 71890 }, { - "epoch": 0.78, - "learning_rate": 0.00018340792631510667, - "loss": 0.0177, + "epoch": 0.36, + "learning_rate": 0.00024558828722926574, + "loss": 0.0223, "step": 71900 }, { - "epoch": 0.78, - "learning_rate": 0.00018339171044950376, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.0002455807195362518, + "loss": 0.0208, "step": 71910 }, { - "epoch": 0.78, - "learning_rate": 0.00018337549458390088, - "loss": 0.0163, + "epoch": 0.36, + "learning_rate": 0.00024557315184323776, + "loss": 0.0185, "step": 71920 }, { - "epoch": 0.78, - "learning_rate": 0.00018335927871829797, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.00024556558415022374, + "loss": 0.0226, "step": 71930 }, { - "epoch": 0.78, - "learning_rate": 0.0001833430628526951, - "loss": 0.0116, + "epoch": 0.36, + "learning_rate": 0.0002455580164572097, + "loss": 0.0202, "step": 71940 }, { - "epoch": 0.78, - "learning_rate": 0.00018332684698709216, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.0002455504487641957, + "loss": 0.0139, "step": 71950 }, { - "epoch": 0.78, - "learning_rate": 0.00018331063112148925, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.0002455428810711817, + "loss": 0.02, "step": 71960 }, { - "epoch": 0.78, - "learning_rate": 0.00018329441525588634, - "loss": 0.0154, + "epoch": 0.36, + "learning_rate": 0.0002455353133781677, + "loss": 0.0159, "step": 71970 }, { - "epoch": 0.78, - "learning_rate": 0.00018327819939028346, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.0002455277456851537, + "loss": 0.0186, "step": 71980 }, { - "epoch": 0.78, - "learning_rate": 0.00018326198352468053, - "loss": 0.0194, + "epoch": 0.36, + "learning_rate": 0.0002455201779921397, + "loss": 0.0174, "step": 71990 }, { - "epoch": 0.78, - "learning_rate": 0.00018324576765907762, - "loss": 0.0217, + "epoch": 0.36, + "learning_rate": 0.00024551261029912567, + "loss": 0.0187, "step": 72000 }, { - "epoch": 0.78, - "eval_cer": 0.9215503867888964, - "eval_loss": 0.011484924703836441, - "eval_runtime": 121.1843, - "eval_samples_per_second": 16.504, - "eval_steps_per_second": 4.126, + "epoch": 0.36, + "eval_cer": 0.9144828710527925, + "eval_loss": 0.013233224861323833, + "eval_runtime": 116.7335, + "eval_samples_per_second": 17.133, + "eval_steps_per_second": 4.283, "step": 72000 }, { - "epoch": 0.78, - "learning_rate": 0.00018322955179347474, - "loss": 0.0165, + "epoch": 0.36, + "learning_rate": 0.00024550504260611165, + "loss": 0.0232, "step": 72010 }, { - "epoch": 0.78, - "learning_rate": 0.00018321333592787183, - "loss": 0.0157, + "epoch": 0.36, + "learning_rate": 0.00024549747491309763, + "loss": 0.0183, "step": 72020 }, { - "epoch": 0.78, - "learning_rate": 0.0001831971200622689, - "loss": 0.0161, + "epoch": 0.36, + "learning_rate": 0.0002454899072200836, + "loss": 0.0155, "step": 72030 }, { - "epoch": 0.78, - "learning_rate": 0.000183180904196666, - "loss": 0.0182, + "epoch": 0.36, + "learning_rate": 0.00024548233952706965, + "loss": 0.0159, "step": 72040 }, { - "epoch": 0.78, - "learning_rate": 0.0001831646883310631, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.00024547477183405563, + "loss": 0.0276, "step": 72050 }, { - "epoch": 0.78, - "learning_rate": 0.0001831484724654602, - "loss": 0.0117, + "epoch": 0.36, + "learning_rate": 0.0002454672041410416, + "loss": 0.0188, "step": 72060 }, { - "epoch": 0.78, - "learning_rate": 0.00018313225659985727, - "loss": 0.0129, + "epoch": 0.36, + "learning_rate": 0.0002454596364480276, + "loss": 0.018, "step": 72070 }, { - "epoch": 0.78, - "learning_rate": 0.0001831160407342544, - "loss": 0.018, + "epoch": 0.36, + "learning_rate": 0.00024545206875501357, + "loss": 0.0171, "step": 72080 }, { - "epoch": 0.78, - "learning_rate": 0.00018309982486865148, - "loss": 0.012, + "epoch": 0.36, + "learning_rate": 0.00024544450106199955, + "loss": 0.0187, "step": 72090 }, { - "epoch": 0.78, - "learning_rate": 0.00018308360900304857, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002454369333689856, + "loss": 0.0166, "step": 72100 }, { - "epoch": 0.78, - "learning_rate": 0.00018306739313744564, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.00024542936567597157, + "loss": 0.0169, "step": 72110 }, { - "epoch": 0.78, - "learning_rate": 0.00018305117727184276, - "loss": 0.0104, + "epoch": 0.36, + "learning_rate": 0.00024542179798295755, + "loss": 0.0223, "step": 72120 }, { - "epoch": 0.78, - "learning_rate": 0.00018303496140623985, - "loss": 0.0118, + "epoch": 0.36, + "learning_rate": 0.00024541423028994353, + "loss": 0.016, "step": 72130 }, { - "epoch": 0.78, - "learning_rate": 0.00018301874554063695, - "loss": 0.0157, + "epoch": 0.36, + "learning_rate": 0.0002454066625969295, + "loss": 0.0205, "step": 72140 }, { - "epoch": 0.78, - "learning_rate": 0.00018300252967503404, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.0002453990949039155, + "loss": 0.0174, "step": 72150 }, { - "epoch": 0.78, - "learning_rate": 0.00018298631380943113, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.00024539152721090153, + "loss": 0.0176, "step": 72160 }, { - "epoch": 0.78, - "learning_rate": 0.00018297009794382822, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.0002453839595178875, + "loss": 0.0159, "step": 72170 }, { - "epoch": 0.78, - "learning_rate": 0.00018295388207822534, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.0002453763918248735, + "loss": 0.0234, "step": 72180 }, { - "epoch": 0.78, - "learning_rate": 0.0001829376662126224, - "loss": 0.0152, + "epoch": 0.36, + "learning_rate": 0.0002453688241318595, + "loss": 0.0204, "step": 72190 }, { - "epoch": 0.78, - "learning_rate": 0.0001829214503470195, - "loss": 0.0129, + "epoch": 0.36, + "learning_rate": 0.00024536125643884546, + "loss": 0.0193, "step": 72200 }, { - "epoch": 0.78, - "learning_rate": 0.0001829052344814166, - "loss": 0.0163, + "epoch": 0.36, + "learning_rate": 0.00024535368874583144, + "loss": 0.0159, "step": 72210 }, { - "epoch": 0.78, - "learning_rate": 0.00018288901861581371, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.0002453461210528174, + "loss": 0.0206, "step": 72220 }, { - "epoch": 0.78, - "learning_rate": 0.00018287280275021078, - "loss": 0.0114, + "epoch": 0.36, + "learning_rate": 0.00024533855335980346, + "loss": 0.0177, "step": 72230 }, { - "epoch": 0.78, - "learning_rate": 0.00018285658688460787, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.00024533098566678944, + "loss": 0.0162, "step": 72240 }, { - "epoch": 0.78, - "learning_rate": 0.000182840371019005, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.0002453234179737754, + "loss": 0.0202, "step": 72250 }, { - "epoch": 0.78, - "learning_rate": 0.00018282415515340209, - "loss": 0.016, + "epoch": 0.36, + "learning_rate": 0.0002453158502807614, + "loss": 0.0214, "step": 72260 }, { - "epoch": 0.78, - "learning_rate": 0.00018280793928779915, - "loss": 0.016, + "epoch": 0.36, + "learning_rate": 0.0002453082825877474, + "loss": 0.0204, "step": 72270 }, { - "epoch": 0.78, - "learning_rate": 0.00018279172342219624, - "loss": 0.0175, + "epoch": 0.36, + "learning_rate": 0.00024530071489473336, + "loss": 0.022, "step": 72280 }, { - "epoch": 0.78, - "learning_rate": 0.00018277550755659336, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.00024529314720171934, + "loss": 0.018, "step": 72290 }, { - "epoch": 0.78, - "learning_rate": 0.00018275929169099046, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.0002452855795087053, + "loss": 0.0162, "step": 72300 }, { - "epoch": 0.78, - "learning_rate": 0.00018274307582538752, - "loss": 0.0104, + "epoch": 0.36, + "learning_rate": 0.0002452780118156913, + "loss": 0.0165, "step": 72310 }, { - "epoch": 0.78, - "learning_rate": 0.00018272685995978464, - "loss": 0.0152, + "epoch": 0.36, + "learning_rate": 0.0002452704441226773, + "loss": 0.0187, "step": 72320 }, { - "epoch": 0.78, - "learning_rate": 0.00018271064409418173, - "loss": 0.0158, + "epoch": 0.36, + "learning_rate": 0.0002452628764296633, + "loss": 0.0176, "step": 72330 }, { - "epoch": 0.78, - "learning_rate": 0.00018269442822857883, - "loss": 0.016, + "epoch": 0.36, + "learning_rate": 0.0002452553087366493, + "loss": 0.0206, "step": 72340 }, { - "epoch": 0.78, - "learning_rate": 0.0001826782123629759, - "loss": 0.0131, + "epoch": 0.37, + "learning_rate": 0.0002452477410436353, + "loss": 0.0183, "step": 72350 }, { - "epoch": 0.78, - "learning_rate": 0.000182661996497373, - "loss": 0.0259, + "epoch": 0.37, + "learning_rate": 0.00024524017335062127, + "loss": 0.0208, "step": 72360 }, { - "epoch": 0.78, - "learning_rate": 0.0001826457806317701, - "loss": 0.0172, + "epoch": 0.37, + "learning_rate": 0.00024523260565760725, + "loss": 0.0177, "step": 72370 }, { - "epoch": 0.78, - "learning_rate": 0.00018262956476616723, - "loss": 0.0156, + "epoch": 0.37, + "learning_rate": 0.00024522503796459323, + "loss": 0.0196, "step": 72380 }, { - "epoch": 0.78, - "learning_rate": 0.0001826133489005643, - "loss": 0.0194, + "epoch": 0.37, + "learning_rate": 0.00024521747027157927, + "loss": 0.0188, "step": 72390 }, { - "epoch": 0.78, - "learning_rate": 0.00018259713303496138, - "loss": 0.0151, + "epoch": 0.37, + "learning_rate": 0.00024520990257856525, + "loss": 0.0192, "step": 72400 }, { - "epoch": 0.78, - "learning_rate": 0.00018258091716935848, - "loss": 0.0188, + "epoch": 0.37, + "learning_rate": 0.00024520233488555123, + "loss": 0.0187, "step": 72410 }, { - "epoch": 0.78, - "learning_rate": 0.0001825647013037556, - "loss": 0.0157, + "epoch": 0.37, + "learning_rate": 0.0002451947671925372, + "loss": 0.0208, "step": 72420 }, { - "epoch": 0.78, - "learning_rate": 0.00018254848543815266, - "loss": 0.0165, + "epoch": 0.37, + "learning_rate": 0.0002451871994995232, + "loss": 0.0172, "step": 72430 }, { - "epoch": 0.78, - "learning_rate": 0.00018253226957254975, - "loss": 0.0153, + "epoch": 0.37, + "learning_rate": 0.0002451796318065092, + "loss": 0.014, "step": 72440 }, { - "epoch": 0.78, - "learning_rate": 0.00018251605370694687, - "loss": 0.0157, + "epoch": 0.37, + "learning_rate": 0.00024517206411349516, + "loss": 0.0155, "step": 72450 }, { - "epoch": 0.78, - "learning_rate": 0.00018249983784134397, - "loss": 0.0193, + "epoch": 0.37, + "learning_rate": 0.0002451644964204812, + "loss": 0.0216, "step": 72460 }, { - "epoch": 0.78, - "learning_rate": 0.00018248362197574103, - "loss": 0.017, + "epoch": 0.37, + "learning_rate": 0.0002451569287274672, + "loss": 0.0186, "step": 72470 }, { - "epoch": 0.78, - "learning_rate": 0.00018246740611013813, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.00024514936103445315, + "loss": 0.0172, "step": 72480 }, { - "epoch": 0.78, - "learning_rate": 0.00018245119024453525, - "loss": 0.0187, + "epoch": 0.37, + "learning_rate": 0.00024514179334143914, + "loss": 0.0171, "step": 72490 }, { - "epoch": 0.78, - "learning_rate": 0.00018243497437893234, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.0002451342256484251, + "loss": 0.0176, "step": 72500 }, { - "epoch": 0.78, - "learning_rate": 0.0001824187585133294, - "loss": 0.0145, + "epoch": 0.37, + "learning_rate": 0.0002451266579554111, + "loss": 0.0187, "step": 72510 }, { - "epoch": 0.78, - "learning_rate": 0.00018240254264772652, - "loss": 0.0134, + "epoch": 0.37, + "learning_rate": 0.00024511909026239713, + "loss": 0.0176, "step": 72520 }, { - "epoch": 0.78, - "learning_rate": 0.00018238632678212362, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.0002451115225693831, + "loss": 0.0181, "step": 72530 }, { - "epoch": 0.78, - "learning_rate": 0.0001823701109165207, - "loss": 0.0142, + "epoch": 0.37, + "learning_rate": 0.0002451039548763691, + "loss": 0.017, "step": 72540 }, { - "epoch": 0.78, - "learning_rate": 0.00018235389505091777, - "loss": 0.016, + "epoch": 0.37, + "learning_rate": 0.0002450963871833551, + "loss": 0.0195, "step": 72550 }, { - "epoch": 0.78, - "learning_rate": 0.0001823376791853149, - "loss": 0.0154, + "epoch": 0.37, + "learning_rate": 0.00024508881949034106, + "loss": 0.017, "step": 72560 }, { - "epoch": 0.78, - "learning_rate": 0.000182321463319712, - "loss": 0.0116, + "epoch": 0.37, + "learning_rate": 0.00024508125179732704, + "loss": 0.0172, "step": 72570 }, { - "epoch": 0.78, - "learning_rate": 0.00018230524745410908, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.0002450736841043131, + "loss": 0.0167, "step": 72580 }, { - "epoch": 0.78, - "learning_rate": 0.00018228903158850617, - "loss": 0.0131, + "epoch": 0.37, + "learning_rate": 0.00024506611641129906, + "loss": 0.0177, "step": 72590 }, { - "epoch": 0.78, - "learning_rate": 0.00018227281572290327, - "loss": 0.015, + "epoch": 0.37, + "learning_rate": 0.00024505854871828504, + "loss": 0.0207, "step": 72600 }, { - "epoch": 0.78, - "learning_rate": 0.00018225659985730036, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.000245050981025271, + "loss": 0.0173, "step": 72610 }, { - "epoch": 0.79, - "learning_rate": 0.00018224038399169748, - "loss": 0.0185, + "epoch": 0.37, + "learning_rate": 0.000245043413332257, + "loss": 0.0189, "step": 72620 }, { - "epoch": 0.79, - "learning_rate": 0.00018222416812609454, - "loss": 0.013, + "epoch": 0.37, + "learning_rate": 0.000245035845639243, + "loss": 0.0203, "step": 72630 }, { - "epoch": 0.79, - "learning_rate": 0.00018220795226049164, - "loss": 0.0173, + "epoch": 0.37, + "learning_rate": 0.00024502827794622897, + "loss": 0.0175, "step": 72640 }, { - "epoch": 0.79, - "learning_rate": 0.00018219173639488876, - "loss": 0.0124, + "epoch": 0.37, + "learning_rate": 0.000245020710253215, + "loss": 0.0169, "step": 72650 }, { - "epoch": 0.79, - "learning_rate": 0.00018217552052928585, - "loss": 0.0136, + "epoch": 0.37, + "learning_rate": 0.000245013142560201, + "loss": 0.0185, "step": 72660 }, { - "epoch": 0.79, - "learning_rate": 0.00018215930466368294, - "loss": 0.0142, + "epoch": 0.37, + "learning_rate": 0.00024500557486718696, + "loss": 0.0178, "step": 72670 }, { - "epoch": 0.79, - "learning_rate": 0.00018214308879808, - "loss": 0.0168, + "epoch": 0.37, + "learning_rate": 0.00024499800717417295, + "loss": 0.0239, "step": 72680 }, { - "epoch": 0.79, - "learning_rate": 0.00018212687293247713, - "loss": 0.0155, + "epoch": 0.37, + "learning_rate": 0.00024499043948115893, + "loss": 0.017, "step": 72690 }, { - "epoch": 0.79, - "learning_rate": 0.00018211065706687422, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.0002449828717881449, + "loss": 0.0188, "step": 72700 }, { - "epoch": 0.79, - "learning_rate": 0.0001820944412012713, - "loss": 0.0136, + "epoch": 0.37, + "learning_rate": 0.00024497530409513094, + "loss": 0.0202, "step": 72710 }, { - "epoch": 0.79, - "learning_rate": 0.0001820782253356684, - "loss": 0.018, + "epoch": 0.37, + "learning_rate": 0.0002449677364021169, + "loss": 0.019, "step": 72720 }, { - "epoch": 0.79, - "learning_rate": 0.0001820620094700655, - "loss": 0.0166, + "epoch": 0.37, + "learning_rate": 0.0002449601687091029, + "loss": 0.0186, "step": 72730 }, { - "epoch": 0.79, - "learning_rate": 0.0001820457936044626, - "loss": 0.0131, + "epoch": 0.37, + "learning_rate": 0.0002449526010160889, + "loss": 0.0184, "step": 72740 }, { - "epoch": 0.79, - "learning_rate": 0.0001820295777388597, - "loss": 0.0169, + "epoch": 0.37, + "learning_rate": 0.00024494503332307487, + "loss": 0.019, "step": 72750 }, { - "epoch": 0.79, - "learning_rate": 0.00018201336187325678, - "loss": 0.0125, + "epoch": 0.37, + "learning_rate": 0.00024493746563006085, + "loss": 0.0173, "step": 72760 }, { - "epoch": 0.79, - "learning_rate": 0.00018199714600765387, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.00024492989793704683, + "loss": 0.0173, "step": 72770 }, { - "epoch": 0.79, - "learning_rate": 0.00018198093014205096, - "loss": 0.024, + "epoch": 0.37, + "learning_rate": 0.00024492233024403287, + "loss": 0.0162, "step": 72780 }, { - "epoch": 0.79, - "learning_rate": 0.00018196471427644808, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.00024491476255101885, + "loss": 0.0173, "step": 72790 }, { - "epoch": 0.79, - "learning_rate": 0.00018194849841084515, - "loss": 0.0148, + "epoch": 0.37, + "learning_rate": 0.00024490719485800483, + "loss": 0.0195, "step": 72800 }, { - "epoch": 0.79, - "learning_rate": 0.00018193228254524224, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.0002448996271649908, + "loss": 0.0162, "step": 72810 }, { - "epoch": 0.79, - "learning_rate": 0.00018191606667963936, - "loss": 0.0152, + "epoch": 0.37, + "learning_rate": 0.0002448920594719768, + "loss": 0.0175, "step": 72820 }, { - "epoch": 0.79, - "learning_rate": 0.00018189985081403645, - "loss": 0.0176, + "epoch": 0.37, + "learning_rate": 0.0002448844917789628, + "loss": 0.018, "step": 72830 }, { - "epoch": 0.79, - "learning_rate": 0.00018188363494843352, - "loss": 0.0162, + "epoch": 0.37, + "learning_rate": 0.0002448769240859488, + "loss": 0.0211, "step": 72840 }, { - "epoch": 0.79, - "learning_rate": 0.0001818674190828306, - "loss": 0.0173, + "epoch": 0.37, + "learning_rate": 0.0002448693563929348, + "loss": 0.0163, "step": 72850 }, { - "epoch": 0.79, - "learning_rate": 0.00018185120321722773, - "loss": 0.0161, + "epoch": 0.37, + "learning_rate": 0.0002448617886999208, + "loss": 0.0193, "step": 72860 }, { - "epoch": 0.79, - "learning_rate": 0.00018183498735162482, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.00024485422100690676, + "loss": 0.0187, "step": 72870 }, { - "epoch": 0.79, - "learning_rate": 0.0001818187714860219, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024484665331389274, + "loss": 0.0232, "step": 72880 }, { - "epoch": 0.79, - "learning_rate": 0.000181802555620419, - "loss": 0.0127, + "epoch": 0.37, + "learning_rate": 0.0002448390856208787, + "loss": 0.0195, "step": 72890 }, { - "epoch": 0.79, - "learning_rate": 0.0001817863397548161, - "loss": 0.0158, + "epoch": 0.37, + "learning_rate": 0.00024483151792786475, + "loss": 0.0167, "step": 72900 }, { - "epoch": 0.79, - "learning_rate": 0.0001817701238892132, - "loss": 0.0156, + "epoch": 0.37, + "learning_rate": 0.00024482395023485074, + "loss": 0.0166, "step": 72910 }, { - "epoch": 0.79, - "learning_rate": 0.00018175390802361026, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.0002448163825418367, + "loss": 0.0203, "step": 72920 }, { - "epoch": 0.79, - "learning_rate": 0.00018173769215800738, - "loss": 0.0174, + "epoch": 0.37, + "learning_rate": 0.0002448088148488227, + "loss": 0.0204, "step": 72930 }, { - "epoch": 0.79, - "learning_rate": 0.00018172147629240447, - "loss": 0.0161, + "epoch": 0.37, + "learning_rate": 0.0002448012471558087, + "loss": 0.0184, "step": 72940 }, { - "epoch": 0.79, - "learning_rate": 0.0001817052604268016, - "loss": 0.0156, + "epoch": 0.37, + "learning_rate": 0.00024479367946279466, + "loss": 0.0207, "step": 72950 }, { - "epoch": 0.79, - "learning_rate": 0.00018168904456119866, - "loss": 0.0165, + "epoch": 0.37, + "learning_rate": 0.00024478611176978064, + "loss": 0.0193, "step": 72960 }, { - "epoch": 0.79, - "learning_rate": 0.00018167282869559575, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.0002447785440767667, + "loss": 0.0165, "step": 72970 }, { - "epoch": 0.79, - "learning_rate": 0.00018165661282999284, - "loss": 0.0191, + "epoch": 0.37, + "learning_rate": 0.00024477097638375266, + "loss": 0.0158, "step": 72980 }, { - "epoch": 0.79, - "learning_rate": 0.00018164039696438996, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.00024476340869073864, + "loss": 0.0159, "step": 72990 }, { - "epoch": 0.79, - "learning_rate": 0.00018162418109878703, - "loss": 0.012, + "epoch": 0.37, + "learning_rate": 0.0002447558409977246, + "loss": 0.02, "step": 73000 }, { - "epoch": 0.79, - "eval_cer": 0.9215382263475072, - "eval_loss": 0.01048470288515091, - "eval_runtime": 121.1149, - "eval_samples_per_second": 16.513, - "eval_steps_per_second": 4.128, + "epoch": 0.37, + "eval_cer": 0.9145197461055578, + "eval_loss": 0.013241157867014408, + "eval_runtime": 116.696, + "eval_samples_per_second": 17.139, + "eval_steps_per_second": 4.285, "step": 73000 }, { - "epoch": 0.79, - "learning_rate": 0.00018160796523318412, - "loss": 0.0164, + "epoch": 0.37, + "learning_rate": 0.0002447482733047106, + "loss": 0.019, "step": 73010 }, { - "epoch": 0.79, - "learning_rate": 0.00018159174936758124, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.0002447407056116966, + "loss": 0.0194, "step": 73020 }, { - "epoch": 0.79, - "learning_rate": 0.00018157553350197834, - "loss": 0.016, + "epoch": 0.37, + "learning_rate": 0.0002447331379186826, + "loss": 0.0166, "step": 73030 }, { - "epoch": 0.79, - "learning_rate": 0.0001815593176363754, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.0002447255702256686, + "loss": 0.0193, "step": 73040 }, { - "epoch": 0.79, - "learning_rate": 0.0001815431017707725, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.0002447180025326546, + "loss": 0.0232, "step": 73050 }, { - "epoch": 0.79, - "learning_rate": 0.0001815268859051696, - "loss": 0.0162, + "epoch": 0.37, + "learning_rate": 0.00024471043483964057, + "loss": 0.0167, "step": 73060 }, { - "epoch": 0.79, - "learning_rate": 0.0001815106700395667, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.00024470286714662655, + "loss": 0.0205, "step": 73070 }, { - "epoch": 0.79, - "learning_rate": 0.00018149445417396377, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024469529945361253, + "loss": 0.0195, "step": 73080 }, { - "epoch": 0.79, - "learning_rate": 0.0001814782383083609, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024468773176059856, + "loss": 0.0181, "step": 73090 }, { - "epoch": 0.79, - "learning_rate": 0.00018146202244275798, - "loss": 0.0133, + "epoch": 0.37, + "learning_rate": 0.00024468016406758455, + "loss": 0.018, "step": 73100 }, { - "epoch": 0.79, - "learning_rate": 0.00018144580657715508, - "loss": 0.0148, + "epoch": 0.37, + "learning_rate": 0.00024467259637457053, + "loss": 0.0291, "step": 73110 }, { - "epoch": 0.79, - "learning_rate": 0.00018142959071155214, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.0002446650286815565, + "loss": 0.0198, "step": 73120 }, { - "epoch": 0.79, - "learning_rate": 0.00018141337484594926, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.0002446574609885425, + "loss": 0.0162, "step": 73130 }, { - "epoch": 0.79, - "learning_rate": 0.00018139715898034636, - "loss": 0.0159, + "epoch": 0.37, + "learning_rate": 0.00024464989329552847, + "loss": 0.0184, "step": 73140 }, { - "epoch": 0.79, - "learning_rate": 0.00018138094311474345, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.00024464232560251445, + "loss": 0.0188, "step": 73150 }, { - "epoch": 0.79, - "learning_rate": 0.00018136472724914054, - "loss": 0.0154, + "epoch": 0.37, + "learning_rate": 0.0002446347579095005, + "loss": 0.0174, "step": 73160 }, { - "epoch": 0.79, - "learning_rate": 0.00018134851138353763, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024462719021648647, + "loss": 0.0233, "step": 73170 }, { - "epoch": 0.79, - "learning_rate": 0.00018133229551793473, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.00024461962252347245, + "loss": 0.0152, "step": 73180 }, { - "epoch": 0.79, - "learning_rate": 0.00018131607965233185, - "loss": 0.0133, + "epoch": 0.37, + "learning_rate": 0.00024461205483045843, + "loss": 0.0173, "step": 73190 }, { - "epoch": 0.79, - "learning_rate": 0.0001812998637867289, - "loss": 0.0138, + "epoch": 0.37, + "learning_rate": 0.0002446044871374444, + "loss": 0.0244, "step": 73200 }, { - "epoch": 0.79, - "learning_rate": 0.000181283647921126, - "loss": 0.0159, + "epoch": 0.37, + "learning_rate": 0.0002445969194444304, + "loss": 0.0183, "step": 73210 }, { - "epoch": 0.79, - "learning_rate": 0.0001812674320555231, - "loss": 0.0156, + "epoch": 0.37, + "learning_rate": 0.00024458935175141643, + "loss": 0.0193, "step": 73220 }, { - "epoch": 0.79, - "learning_rate": 0.00018125121618992022, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.0002445817840584024, + "loss": 0.0149, "step": 73230 }, { - "epoch": 0.79, - "learning_rate": 0.00018123500032431728, - "loss": 0.018, + "epoch": 0.37, + "learning_rate": 0.0002445742163653884, + "loss": 0.0188, "step": 73240 }, { - "epoch": 0.79, - "learning_rate": 0.00018121878445871438, - "loss": 0.0208, + "epoch": 0.37, + "learning_rate": 0.0002445666486723744, + "loss": 0.0194, "step": 73250 }, { - "epoch": 0.79, - "learning_rate": 0.0001812025685931115, - "loss": 0.0182, + "epoch": 0.37, + "learning_rate": 0.00024455908097936036, + "loss": 0.0158, "step": 73260 }, { - "epoch": 0.79, - "learning_rate": 0.0001811863527275086, - "loss": 0.0142, + "epoch": 0.37, + "learning_rate": 0.00024455151328634634, + "loss": 0.0166, "step": 73270 }, { - "epoch": 0.79, - "learning_rate": 0.00018117013686190565, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.0002445439455933323, + "loss": 0.014, "step": 73280 }, { - "epoch": 0.79, - "learning_rate": 0.00018115392099630275, - "loss": 0.0186, + "epoch": 0.37, + "learning_rate": 0.00024453637790031836, + "loss": 0.0207, "step": 73290 }, { - "epoch": 0.79, - "learning_rate": 0.00018113770513069987, - "loss": 0.023, + "epoch": 0.37, + "learning_rate": 0.00024452881020730434, + "loss": 0.0232, "step": 73300 }, { - "epoch": 0.79, - "learning_rate": 0.00018112148926509696, - "loss": 0.0159, + "epoch": 0.37, + "learning_rate": 0.0002445212425142903, + "loss": 0.0151, "step": 73310 }, { - "epoch": 0.79, - "learning_rate": 0.00018110527339949402, - "loss": 0.0157, + "epoch": 0.37, + "learning_rate": 0.0002445136748212763, + "loss": 0.0191, "step": 73320 }, { - "epoch": 0.79, - "learning_rate": 0.00018108905753389114, - "loss": 0.0155, + "epoch": 0.37, + "learning_rate": 0.0002445061071282623, + "loss": 0.021, "step": 73330 }, { - "epoch": 0.79, - "learning_rate": 0.00018107284166828824, - "loss": 0.0153, + "epoch": 0.37, + "learning_rate": 0.00024449853943524826, + "loss": 0.0165, "step": 73340 }, { - "epoch": 0.79, - "learning_rate": 0.00018105662580268533, - "loss": 0.0161, + "epoch": 0.37, + "learning_rate": 0.0002444909717422343, + "loss": 0.0135, "step": 73350 }, { - "epoch": 0.79, - "learning_rate": 0.0001810404099370824, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.0002444834040492203, + "loss": 0.0145, "step": 73360 }, { - "epoch": 0.79, - "learning_rate": 0.00018102419407147952, - "loss": 0.0157, + "epoch": 0.37, + "learning_rate": 0.00024447583635620626, + "loss": 0.0177, "step": 73370 }, { - "epoch": 0.79, - "learning_rate": 0.0001810079782058766, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.00024446826866319224, + "loss": 0.0165, "step": 73380 }, { - "epoch": 0.79, - "learning_rate": 0.00018099176234027373, - "loss": 0.0164, + "epoch": 0.37, + "learning_rate": 0.0002444607009701782, + "loss": 0.0203, "step": 73390 }, { - "epoch": 0.79, - "learning_rate": 0.00018097554647467082, - "loss": 0.0162, + "epoch": 0.37, + "learning_rate": 0.0002444531332771642, + "loss": 0.0139, "step": 73400 }, { - "epoch": 0.79, - "learning_rate": 0.0001809593306090679, - "loss": 0.0111, + "epoch": 0.37, + "learning_rate": 0.00024444556558415024, + "loss": 0.014, "step": 73410 }, { - "epoch": 0.79, - "learning_rate": 0.00018094311474346498, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.0002444379978911362, + "loss": 0.019, "step": 73420 }, { - "epoch": 0.79, - "learning_rate": 0.0001809268988778621, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.0002444304301981222, + "loss": 0.0149, "step": 73430 }, { - "epoch": 0.79, - "learning_rate": 0.0001809106830122592, - "loss": 0.0171, + "epoch": 0.37, + "learning_rate": 0.0002444228625051082, + "loss": 0.0173, "step": 73440 }, { - "epoch": 0.79, - "learning_rate": 0.00018089446714665626, - "loss": 0.013, + "epoch": 0.37, + "learning_rate": 0.00024441529481209417, + "loss": 0.0219, "step": 73450 }, { - "epoch": 0.79, - "learning_rate": 0.00018087825128105338, - "loss": 0.0158, + "epoch": 0.37, + "learning_rate": 0.00024440772711908015, + "loss": 0.0178, "step": 73460 }, { - "epoch": 0.79, - "learning_rate": 0.00018086203541545047, - "loss": 0.0125, + "epoch": 0.37, + "learning_rate": 0.00024440015942606613, + "loss": 0.0198, "step": 73470 }, { - "epoch": 0.79, - "learning_rate": 0.00018084581954984756, - "loss": 0.0136, + "epoch": 0.37, + "learning_rate": 0.00024439259173305217, + "loss": 0.0182, "step": 73480 }, { - "epoch": 0.79, - "learning_rate": 0.00018082960368424463, - "loss": 0.0148, + "epoch": 0.37, + "learning_rate": 0.00024438502404003815, + "loss": 0.0175, "step": 73490 }, { - "epoch": 0.79, - "learning_rate": 0.00018081338781864175, - "loss": 0.0134, + "epoch": 0.37, + "learning_rate": 0.00024437745634702413, + "loss": 0.024, "step": 73500 }, { - "epoch": 0.79, - "learning_rate": 0.00018079717195303884, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.0002443698886540101, + "loss": 0.0177, "step": 73510 }, { - "epoch": 0.79, - "learning_rate": 0.00018078095608743593, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.0002443623209609961, + "loss": 0.0212, "step": 73520 }, { - "epoch": 0.79, - "learning_rate": 0.00018076474022183303, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.0002443547532679821, + "loss": 0.0182, "step": 73530 }, { - "epoch": 0.8, - "learning_rate": 0.00018074852435623012, - "loss": 0.0164, + "epoch": 0.37, + "learning_rate": 0.00024434718557496805, + "loss": 0.0156, "step": 73540 }, { - "epoch": 0.8, - "learning_rate": 0.0001807323084906272, - "loss": 0.0164, + "epoch": 0.37, + "learning_rate": 0.00024433961788195404, + "loss": 0.0179, "step": 73550 }, { - "epoch": 0.8, - "learning_rate": 0.00018071609262502433, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.00024433205018894, + "loss": 0.0374, "step": 73560 }, { - "epoch": 0.8, - "learning_rate": 0.0001806998767594214, - "loss": 0.0133, + "epoch": 0.37, + "learning_rate": 0.000244324482495926, + "loss": 0.0162, "step": 73570 }, { - "epoch": 0.8, - "learning_rate": 0.0001806836608938185, - "loss": 0.0228, + "epoch": 0.37, + "learning_rate": 0.00024431691480291203, + "loss": 0.0173, "step": 73580 }, { - "epoch": 0.8, - "learning_rate": 0.00018066744502821558, - "loss": 0.0159, + "epoch": 0.37, + "learning_rate": 0.000244309347109898, + "loss": 0.0174, "step": 73590 }, { - "epoch": 0.8, - "learning_rate": 0.0001806512291626127, - "loss": 0.0158, + "epoch": 0.37, + "learning_rate": 0.000244301779416884, + "loss": 0.0173, "step": 73600 }, { - "epoch": 0.8, - "learning_rate": 0.00018063501329700977, - "loss": 0.017, + "epoch": 0.37, + "learning_rate": 0.00024429421172387, + "loss": 0.0218, "step": 73610 }, { - "epoch": 0.8, - "learning_rate": 0.00018061879743140686, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024428664403085596, + "loss": 0.019, "step": 73620 }, { - "epoch": 0.8, - "learning_rate": 0.00018060258156580398, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.00024427907633784194, + "loss": 0.0197, "step": 73630 }, { - "epoch": 0.8, - "learning_rate": 0.00018058636570020107, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.000244271508644828, + "loss": 0.0195, "step": 73640 }, { - "epoch": 0.8, - "learning_rate": 0.00018057014983459814, - "loss": 0.0179, + "epoch": 0.37, + "learning_rate": 0.00024426394095181396, + "loss": 0.0201, "step": 73650 }, { - "epoch": 0.8, - "learning_rate": 0.00018055393396899526, - "loss": 0.0205, + "epoch": 0.37, + "learning_rate": 0.00024425637325879994, + "loss": 0.0203, "step": 73660 }, { - "epoch": 0.8, - "learning_rate": 0.00018053771810339235, - "loss": 0.0151, + "epoch": 0.37, + "learning_rate": 0.0002442488055657859, + "loss": 0.02, "step": 73670 }, { - "epoch": 0.8, - "learning_rate": 0.00018052150223778944, - "loss": 0.011, + "epoch": 0.37, + "learning_rate": 0.0002442412378727719, + "loss": 0.0148, "step": 73680 }, { - "epoch": 0.8, - "learning_rate": 0.0001805052863721865, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.0002442336701797579, + "loss": 0.0149, "step": 73690 }, { - "epoch": 0.8, - "learning_rate": 0.00018048907050658363, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.00024422610248674387, + "loss": 0.0186, "step": 73700 }, { - "epoch": 0.8, - "learning_rate": 0.00018047285464098072, - "loss": 0.013, + "epoch": 0.37, + "learning_rate": 0.0002442185347937299, + "loss": 0.0163, "step": 73710 }, { - "epoch": 0.8, - "learning_rate": 0.00018045663877537782, - "loss": 0.0107, + "epoch": 0.37, + "learning_rate": 0.0002442109671007159, + "loss": 0.0183, "step": 73720 }, { - "epoch": 0.8, - "learning_rate": 0.0001804404229097749, - "loss": 0.0156, + "epoch": 0.37, + "learning_rate": 0.00024420339940770186, + "loss": 0.0192, "step": 73730 }, { - "epoch": 0.8, - "learning_rate": 0.000180424207044172, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024419583171468785, + "loss": 0.0192, "step": 73740 }, { - "epoch": 0.8, - "learning_rate": 0.0001804079911785691, - "loss": 0.0157, + "epoch": 0.37, + "learning_rate": 0.00024418826402167383, + "loss": 0.0179, "step": 73750 }, { - "epoch": 0.8, - "learning_rate": 0.00018039177531296621, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.0002441806963286598, + "loss": 0.0192, "step": 73760 }, { - "epoch": 0.8, - "learning_rate": 0.00018037555944736328, - "loss": 0.0164, + "epoch": 0.37, + "learning_rate": 0.00024417312863564584, + "loss": 0.0169, "step": 73770 }, { - "epoch": 0.8, - "learning_rate": 0.00018035934358176037, - "loss": 0.0133, + "epoch": 0.37, + "learning_rate": 0.0002441655609426318, + "loss": 0.0166, "step": 73780 }, { - "epoch": 0.8, - "learning_rate": 0.00018034312771615746, - "loss": 0.0169, + "epoch": 0.37, + "learning_rate": 0.0002441579932496178, + "loss": 0.0153, "step": 73790 }, { - "epoch": 0.8, - "learning_rate": 0.00018032691185055458, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.0002441504255566038, + "loss": 0.0178, "step": 73800 }, { - "epoch": 0.8, - "learning_rate": 0.00018031069598495165, - "loss": 0.0164, + "epoch": 0.37, + "learning_rate": 0.00024414285786358977, + "loss": 0.0184, "step": 73810 }, { - "epoch": 0.8, - "learning_rate": 0.00018029448011934874, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.00024413529017057578, + "loss": 0.0177, "step": 73820 }, { - "epoch": 0.8, - "learning_rate": 0.00018027826425374586, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.00024412772247756176, + "loss": 0.0185, "step": 73830 }, { - "epoch": 0.8, - "learning_rate": 0.00018026204838814296, - "loss": 0.017, + "epoch": 0.37, + "learning_rate": 0.00024412015478454774, + "loss": 0.0203, "step": 73840 }, { - "epoch": 0.8, - "learning_rate": 0.00018024583252254002, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.00024411258709153375, + "loss": 0.0168, "step": 73850 }, { - "epoch": 0.8, - "learning_rate": 0.00018022961665693711, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.00024410501939851973, + "loss": 0.0186, "step": 73860 }, { - "epoch": 0.8, - "learning_rate": 0.00018021340079133423, - "loss": 0.0156, + "epoch": 0.37, + "learning_rate": 0.0002440974517055057, + "loss": 0.0192, "step": 73870 }, { - "epoch": 0.8, - "learning_rate": 0.00018019718492573133, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024408988401249172, + "loss": 0.019, "step": 73880 }, { - "epoch": 0.8, - "learning_rate": 0.0001801809690601284, - "loss": 0.0148, + "epoch": 0.37, + "learning_rate": 0.0002440823163194777, + "loss": 0.015, "step": 73890 }, { - "epoch": 0.8, - "learning_rate": 0.0001801647531945255, - "loss": 0.0125, + "epoch": 0.37, + "learning_rate": 0.00024407474862646368, + "loss": 0.0198, "step": 73900 }, { - "epoch": 0.8, - "learning_rate": 0.0001801485373289226, - "loss": 0.0146, + "epoch": 0.37, + "learning_rate": 0.00024406718093344967, + "loss": 0.0203, "step": 73910 }, { - "epoch": 0.8, - "learning_rate": 0.0001801323214633197, - "loss": 0.0161, + "epoch": 0.37, + "learning_rate": 0.00024405961324043567, + "loss": 0.0176, "step": 73920 }, { - "epoch": 0.8, - "learning_rate": 0.00018011610559771676, - "loss": 0.0117, + "epoch": 0.37, + "learning_rate": 0.00024405204554742166, + "loss": 0.0169, "step": 73930 }, { - "epoch": 0.8, - "learning_rate": 0.00018009988973211388, - "loss": 0.0155, + "epoch": 0.37, + "learning_rate": 0.00024404447785440764, + "loss": 0.017, "step": 73940 }, { - "epoch": 0.8, - "learning_rate": 0.00018008367386651098, - "loss": 0.017, + "epoch": 0.37, + "learning_rate": 0.00024403691016139365, + "loss": 0.0188, "step": 73950 }, { - "epoch": 0.8, - "learning_rate": 0.0001800674580009081, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.00024402934246837963, + "loss": 0.0181, "step": 73960 }, { - "epoch": 0.8, - "learning_rate": 0.00018005124213530516, - "loss": 0.0106, + "epoch": 0.37, + "learning_rate": 0.0002440217747753656, + "loss": 0.0174, "step": 73970 }, { - "epoch": 0.8, - "learning_rate": 0.00018003502626970225, - "loss": 0.0153, + "epoch": 0.37, + "learning_rate": 0.00024401420708235162, + "loss": 0.0171, "step": 73980 }, { - "epoch": 0.8, - "learning_rate": 0.00018001881040409935, - "loss": 0.0124, + "epoch": 0.37, + "learning_rate": 0.0002440066393893376, + "loss": 0.0221, "step": 73990 }, { - "epoch": 0.8, - "learning_rate": 0.00018000259453849647, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.00024399907169632358, + "loss": 0.02, "step": 74000 }, { - "epoch": 0.8, - "eval_cer": 0.9215460437741146, - "eval_loss": 0.010000753216445446, - "eval_runtime": 121.1084, - "eval_samples_per_second": 16.514, - "eval_steps_per_second": 4.129, + "epoch": 0.37, + "eval_cer": 0.9144848118450433, + "eval_loss": 0.012880527414381504, + "eval_runtime": 116.6543, + "eval_samples_per_second": 17.145, + "eval_steps_per_second": 4.286, "step": 74000 }, { - "epoch": 0.8, - "learning_rate": 0.00017998637867289353, - "loss": 0.011, + "epoch": 0.37, + "learning_rate": 0.0002439915040033096, + "loss": 0.0215, "step": 74010 }, { - "epoch": 0.8, - "learning_rate": 0.00017997016280729063, - "loss": 0.0165, + "epoch": 0.37, + "learning_rate": 0.00024398393631029557, + "loss": 0.0181, "step": 74020 }, { - "epoch": 0.8, - "learning_rate": 0.00017995394694168774, - "loss": 0.0151, + "epoch": 0.37, + "learning_rate": 0.00024397636861728155, + "loss": 0.0187, "step": 74030 }, { - "epoch": 0.8, - "learning_rate": 0.00017993773107608484, - "loss": 0.0138, + "epoch": 0.37, + "learning_rate": 0.00024396880092426756, + "loss": 0.0162, "step": 74040 }, { - "epoch": 0.8, - "learning_rate": 0.0001799215152104819, - "loss": 0.016, + "epoch": 0.37, + "learning_rate": 0.00024396123323125354, + "loss": 0.0164, "step": 74050 }, { - "epoch": 0.8, - "learning_rate": 0.000179905299344879, + "epoch": 0.37, + "learning_rate": 0.00024395366553823952, "loss": 0.0189, "step": 74060 }, { - "epoch": 0.8, - "learning_rate": 0.00017988908347927612, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024394609784522553, + "loss": 0.016, "step": 74070 }, { - "epoch": 0.8, - "learning_rate": 0.0001798728676136732, - "loss": 0.012, + "epoch": 0.37, + "learning_rate": 0.0002439385301522115, + "loss": 0.0193, "step": 74080 }, { - "epoch": 0.8, - "learning_rate": 0.0001798566517480703, - "loss": 0.0175, + "epoch": 0.37, + "learning_rate": 0.0002439309624591975, + "loss": 0.0194, "step": 74090 }, { - "epoch": 0.8, - "learning_rate": 0.0001798404358824674, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024392339476618348, + "loss": 0.0184, "step": 74100 }, { - "epoch": 0.8, - "learning_rate": 0.0001798242200168645, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.00024391582707316948, + "loss": 0.0196, "step": 74110 }, { - "epoch": 0.8, - "learning_rate": 0.00017980800415126158, - "loss": 0.0154, + "epoch": 0.37, + "learning_rate": 0.00024390825938015547, + "loss": 0.0197, "step": 74120 }, { - "epoch": 0.8, - "learning_rate": 0.0001797917882856587, - "loss": 0.0173, + "epoch": 0.37, + "learning_rate": 0.00024390069168714145, + "loss": 0.0172, "step": 74130 }, { - "epoch": 0.8, - "learning_rate": 0.00017977557242005577, - "loss": 0.0162, + "epoch": 0.37, + "learning_rate": 0.00024389312399412746, + "loss": 0.0189, "step": 74140 }, { - "epoch": 0.8, - "learning_rate": 0.00017975935655445286, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.00024388555630111344, + "loss": 0.0165, "step": 74150 }, { - "epoch": 0.8, - "learning_rate": 0.00017974314068884995, - "loss": 0.0167, + "epoch": 0.37, + "learning_rate": 0.00024387798860809942, + "loss": 0.0179, "step": 74160 }, { - "epoch": 0.8, - "learning_rate": 0.00017972692482324707, - "loss": 0.0181, + "epoch": 0.37, + "learning_rate": 0.00024387042091508543, + "loss": 0.015, "step": 74170 }, { - "epoch": 0.8, - "learning_rate": 0.00017971070895764414, - "loss": 0.0157, + "epoch": 0.37, + "learning_rate": 0.0002438628532220714, + "loss": 0.0181, "step": 74180 }, { - "epoch": 0.8, - "learning_rate": 0.00017969449309204123, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.0002438552855290574, + "loss": 0.0204, "step": 74190 }, { - "epoch": 0.8, - "learning_rate": 0.00017967827722643835, - "loss": 0.0154, + "epoch": 0.37, + "learning_rate": 0.0002438477178360434, + "loss": 0.0181, "step": 74200 }, { - "epoch": 0.8, - "learning_rate": 0.00017966206136083544, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.00024384015014302938, + "loss": 0.0182, "step": 74210 }, { - "epoch": 0.8, - "learning_rate": 0.0001796458454952325, - "loss": 0.0159, + "epoch": 0.37, + "learning_rate": 0.00024383258245001536, + "loss": 0.0188, "step": 74220 }, { - "epoch": 0.8, - "learning_rate": 0.0001796296296296296, - "loss": 0.017, + "epoch": 0.37, + "learning_rate": 0.00024382501475700137, + "loss": 0.0242, "step": 74230 }, { - "epoch": 0.8, - "learning_rate": 0.00017961341376402672, - "loss": 0.0146, + "epoch": 0.37, + "learning_rate": 0.00024381744706398735, + "loss": 0.0171, "step": 74240 }, { - "epoch": 0.8, - "learning_rate": 0.0001795971978984238, - "loss": 0.013, + "epoch": 0.37, + "learning_rate": 0.00024380987937097333, + "loss": 0.0187, "step": 74250 }, { - "epoch": 0.8, - "learning_rate": 0.00017958098203282088, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.00024380231167795931, + "loss": 0.0171, "step": 74260 }, { - "epoch": 0.8, - "learning_rate": 0.000179564766167218, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.00024379474398494532, + "loss": 0.0148, "step": 74270 }, { - "epoch": 0.8, - "learning_rate": 0.0001795485503016151, - "loss": 0.0154, + "epoch": 0.37, + "learning_rate": 0.0002437871762919313, + "loss": 0.0187, "step": 74280 }, { - "epoch": 0.8, - "learning_rate": 0.00017953233443601218, - "loss": 0.0116, + "epoch": 0.37, + "learning_rate": 0.00024377960859891729, + "loss": 0.0166, "step": 74290 }, { - "epoch": 0.8, - "learning_rate": 0.00017951611857040925, - "loss": 0.0173, + "epoch": 0.37, + "learning_rate": 0.0002437720409059033, + "loss": 0.018, "step": 74300 }, { - "epoch": 0.8, - "learning_rate": 0.00017949990270480637, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.00024376447321288928, + "loss": 0.0141, "step": 74310 }, { - "epoch": 0.8, - "learning_rate": 0.00017948368683920346, - "loss": 0.0136, + "epoch": 0.37, + "learning_rate": 0.00024375690551987526, + "loss": 0.0173, "step": 74320 }, { - "epoch": 0.8, - "learning_rate": 0.00017946747097360058, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024374933782686127, + "loss": 0.0209, "step": 74330 }, { - "epoch": 0.8, - "learning_rate": 0.00017945125510799765, - "loss": 0.0199, + "epoch": 0.38, + "learning_rate": 0.00024374177013384725, + "loss": 0.0183, "step": 74340 }, { - "epoch": 0.8, - "learning_rate": 0.00017943503924239474, - "loss": 0.0141, + "epoch": 0.38, + "learning_rate": 0.00024373420244083323, + "loss": 0.0157, "step": 74350 }, { - "epoch": 0.8, - "learning_rate": 0.00017941882337679183, - "loss": 0.0153, + "epoch": 0.38, + "learning_rate": 0.00024372663474781924, + "loss": 0.0167, "step": 74360 }, { - "epoch": 0.8, - "learning_rate": 0.00017940260751118895, - "loss": 0.014, + "epoch": 0.38, + "learning_rate": 0.00024371906705480522, + "loss": 0.0168, "step": 74370 }, { - "epoch": 0.8, - "learning_rate": 0.00017938639164558602, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.0002437114993617912, + "loss": 0.0158, "step": 74380 }, { - "epoch": 0.8, - "learning_rate": 0.0001793701757799831, - "loss": 0.0147, + "epoch": 0.38, + "learning_rate": 0.0002437039316687772, + "loss": 0.0216, "step": 74390 }, { - "epoch": 0.8, - "learning_rate": 0.00017935395991438023, - "loss": 0.021, + "epoch": 0.38, + "learning_rate": 0.0002436963639757632, + "loss": 0.0217, "step": 74400 }, { - "epoch": 0.8, - "learning_rate": 0.00017933774404877732, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024368879628274917, + "loss": 0.0187, "step": 74410 }, { - "epoch": 0.8, - "learning_rate": 0.0001793215281831744, - "loss": 0.0154, + "epoch": 0.38, + "learning_rate": 0.00024368122858973515, + "loss": 0.0217, "step": 74420 }, { - "epoch": 0.8, - "learning_rate": 0.00017930531231757148, - "loss": 0.0106, + "epoch": 0.38, + "learning_rate": 0.00024367366089672116, + "loss": 0.0231, "step": 74430 }, { - "epoch": 0.8, - "learning_rate": 0.0001792890964519686, - "loss": 0.0155, + "epoch": 0.38, + "learning_rate": 0.00024366609320370714, + "loss": 0.0163, "step": 74440 }, { - "epoch": 0.8, - "learning_rate": 0.0001792728805863657, - "loss": 0.0154, + "epoch": 0.38, + "learning_rate": 0.00024365852551069312, + "loss": 0.0169, "step": 74450 }, { - "epoch": 0.8, - "learning_rate": 0.00017925666472076276, - "loss": 0.0131, + "epoch": 0.38, + "learning_rate": 0.00024365095781767913, + "loss": 0.0225, "step": 74460 }, { - "epoch": 0.81, - "learning_rate": 0.00017924044885515988, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024364339012466511, + "loss": 0.0206, "step": 74470 }, { - "epoch": 0.81, - "learning_rate": 0.00017922423298955697, - "loss": 0.0124, + "epoch": 0.38, + "learning_rate": 0.0002436358224316511, + "loss": 0.0202, "step": 74480 }, { - "epoch": 0.81, - "learning_rate": 0.00017920801712395407, - "loss": 0.0109, + "epoch": 0.38, + "learning_rate": 0.0002436282547386371, + "loss": 0.0168, "step": 74490 }, { - "epoch": 0.81, - "learning_rate": 0.00017919180125835113, - "loss": 0.0102, + "epoch": 0.38, + "learning_rate": 0.00024362068704562309, + "loss": 0.0195, "step": 74500 }, { - "epoch": 0.81, - "learning_rate": 0.00017917558539274825, - "loss": 0.0135, + "epoch": 0.38, + "learning_rate": 0.00024361311935260907, + "loss": 0.0196, "step": 74510 }, { - "epoch": 0.81, - "learning_rate": 0.00017915936952714534, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024360555165959508, + "loss": 0.0178, "step": 74520 }, { - "epoch": 0.81, - "learning_rate": 0.00017914315366154244, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024359798396658106, + "loss": 0.0168, "step": 74530 }, { - "epoch": 0.81, - "learning_rate": 0.00017912693779593953, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024359041627356704, + "loss": 0.0194, "step": 74540 }, { - "epoch": 0.81, - "learning_rate": 0.00017911072193033662, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.00024358284858055305, + "loss": 0.0216, "step": 74550 }, { - "epoch": 0.81, - "learning_rate": 0.00017909450606473371, - "loss": 0.0168, + "epoch": 0.38, + "learning_rate": 0.00024357528088753903, + "loss": 0.0178, "step": 74560 }, { - "epoch": 0.81, - "learning_rate": 0.00017907829019913083, - "loss": 0.0161, + "epoch": 0.38, + "learning_rate": 0.000243567713194525, + "loss": 0.0204, "step": 74570 }, { - "epoch": 0.81, - "learning_rate": 0.0001790620743335279, - "loss": 0.0118, + "epoch": 0.38, + "learning_rate": 0.00024356014550151102, + "loss": 0.0185, "step": 74580 }, { - "epoch": 0.81, - "learning_rate": 0.000179045858467925, - "loss": 0.0152, + "epoch": 0.38, + "learning_rate": 0.000243552577808497, + "loss": 0.0173, "step": 74590 }, { - "epoch": 0.81, - "learning_rate": 0.00017902964260232209, - "loss": 0.0177, + "epoch": 0.38, + "learning_rate": 0.00024354501011548298, + "loss": 0.0183, "step": 74600 }, { - "epoch": 0.81, - "learning_rate": 0.0001790134267367192, - "loss": 0.0139, + "epoch": 0.38, + "learning_rate": 0.00024353744242246896, + "loss": 0.0188, "step": 74610 }, { - "epoch": 0.81, - "learning_rate": 0.00017899721087111627, - "loss": 0.0184, + "epoch": 0.38, + "learning_rate": 0.00024352987472945497, + "loss": 0.0213, "step": 74620 }, { - "epoch": 0.81, - "learning_rate": 0.00017898099500551336, - "loss": 0.0124, + "epoch": 0.38, + "learning_rate": 0.00024352230703644095, + "loss": 0.0171, "step": 74630 }, { - "epoch": 0.81, - "learning_rate": 0.00017896477913991048, - "loss": 0.0125, + "epoch": 0.38, + "learning_rate": 0.00024351473934342693, + "loss": 0.0194, "step": 74640 }, { - "epoch": 0.81, - "learning_rate": 0.00017894856327430758, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.00024350717165041294, + "loss": 0.0204, "step": 74650 }, { - "epoch": 0.81, - "learning_rate": 0.00017893234740870464, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024349960395739892, + "loss": 0.0214, "step": 74660 }, { - "epoch": 0.81, - "learning_rate": 0.00017891613154310176, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.0002434920362643849, + "loss": 0.0178, "step": 74670 }, { - "epoch": 0.81, - "learning_rate": 0.00017889991567749885, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.00024348446857137091, + "loss": 0.0173, "step": 74680 }, { - "epoch": 0.81, - "learning_rate": 0.00017888369981189595, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.0002434769008783569, + "loss": 0.0165, "step": 74690 }, { - "epoch": 0.81, - "learning_rate": 0.000178867483946293, - "loss": 0.0129, + "epoch": 0.38, + "learning_rate": 0.00024346933318534288, + "loss": 0.0181, "step": 74700 }, { - "epoch": 0.81, - "learning_rate": 0.00017885126808069013, - "loss": 0.012, + "epoch": 0.38, + "learning_rate": 0.00024346176549232889, + "loss": 0.0171, "step": 74710 }, { - "epoch": 0.81, - "learning_rate": 0.00017883505221508723, - "loss": 0.0117, + "epoch": 0.38, + "learning_rate": 0.00024345419779931487, + "loss": 0.0178, "step": 74720 }, { - "epoch": 0.81, - "learning_rate": 0.00017881883634948432, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024344663010630085, + "loss": 0.017, "step": 74730 }, { - "epoch": 0.81, - "learning_rate": 0.0001788026204838814, - "loss": 0.0113, + "epoch": 0.38, + "learning_rate": 0.00024343906241328686, + "loss": 0.0205, "step": 74740 }, { - "epoch": 0.81, - "learning_rate": 0.0001787864046182785, - "loss": 0.016, + "epoch": 0.38, + "learning_rate": 0.00024343149472027284, + "loss": 0.0173, "step": 74750 }, { - "epoch": 0.81, - "learning_rate": 0.0001787701887526756, - "loss": 0.0116, + "epoch": 0.38, + "learning_rate": 0.00024342392702725882, + "loss": 0.0185, "step": 74760 }, { - "epoch": 0.81, - "learning_rate": 0.00017875397288707272, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.0002434163593342448, + "loss": 0.0179, "step": 74770 }, { - "epoch": 0.81, - "learning_rate": 0.00017873775702146978, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.0002434087916412308, + "loss": 0.0176, "step": 74780 }, { - "epoch": 0.81, - "learning_rate": 0.00017872154115586687, - "loss": 0.0135, + "epoch": 0.38, + "learning_rate": 0.00024340122394821676, + "loss": 0.0205, "step": 74790 }, { - "epoch": 0.81, - "learning_rate": 0.00017870532529026397, - "loss": 0.014, + "epoch": 0.38, + "learning_rate": 0.00024339365625520275, + "loss": 0.0175, "step": 74800 }, { - "epoch": 0.81, - "learning_rate": 0.0001786891094246611, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024338608856218873, + "loss": 0.0168, "step": 74810 }, { - "epoch": 0.81, - "learning_rate": 0.00017867289355905818, - "loss": 0.0118, + "epoch": 0.38, + "learning_rate": 0.00024337852086917474, + "loss": 0.0211, "step": 74820 }, { - "epoch": 0.81, - "learning_rate": 0.00017865667769345525, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024337095317616072, + "loss": 0.0186, "step": 74830 }, { - "epoch": 0.81, - "learning_rate": 0.00017864046182785237, - "loss": 0.0148, + "epoch": 0.38, + "learning_rate": 0.0002433633854831467, + "loss": 0.0184, "step": 74840 }, { - "epoch": 0.81, - "learning_rate": 0.00017862424596224946, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.0002433558177901327, + "loss": 0.0167, "step": 74850 }, { - "epoch": 0.81, - "learning_rate": 0.00017860803009664655, - "loss": 0.0144, + "epoch": 0.38, + "learning_rate": 0.0002433482500971187, + "loss": 0.0211, "step": 74860 }, { - "epoch": 0.81, - "learning_rate": 0.00017859181423104362, - "loss": 0.0109, + "epoch": 0.38, + "learning_rate": 0.00024334068240410467, + "loss": 0.0193, "step": 74870 }, { - "epoch": 0.81, - "learning_rate": 0.00017857559836544074, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024333311471109068, + "loss": 0.0197, "step": 74880 }, { - "epoch": 0.81, - "learning_rate": 0.00017855938249983783, - "loss": 0.012, + "epoch": 0.38, + "learning_rate": 0.00024332554701807666, + "loss": 0.0151, "step": 74890 }, { - "epoch": 0.81, - "learning_rate": 0.00017854316663423492, - "loss": 0.0141, + "epoch": 0.38, + "learning_rate": 0.00024331797932506264, + "loss": 0.0191, "step": 74900 }, { - "epoch": 0.81, - "learning_rate": 0.00017852695076863201, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.00024331041163204865, + "loss": 0.0204, "step": 74910 }, { - "epoch": 0.81, - "learning_rate": 0.0001785107349030291, - "loss": 0.0172, + "epoch": 0.38, + "learning_rate": 0.00024330284393903463, + "loss": 0.0217, "step": 74920 }, { - "epoch": 0.81, - "learning_rate": 0.0001784945190374262, - "loss": 0.0129, + "epoch": 0.38, + "learning_rate": 0.00024329527624602061, + "loss": 0.0208, "step": 74930 }, { - "epoch": 0.81, - "learning_rate": 0.00017847830317182332, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024328770855300662, + "loss": 0.0187, "step": 74940 }, { - "epoch": 0.81, - "learning_rate": 0.00017846208730622039, - "loss": 0.0146, + "epoch": 0.38, + "learning_rate": 0.0002432801408599926, + "loss": 0.0184, "step": 74950 }, { - "epoch": 0.81, - "learning_rate": 0.00017844587144061748, - "loss": 0.014, + "epoch": 0.38, + "learning_rate": 0.00024327257316697859, + "loss": 0.0186, "step": 74960 }, { - "epoch": 0.81, - "learning_rate": 0.0001784296555750146, - "loss": 0.0151, + "epoch": 0.38, + "learning_rate": 0.0002432650054739646, + "loss": 0.0217, "step": 74970 }, { - "epoch": 0.81, - "learning_rate": 0.0001784134397094117, - "loss": 0.0129, + "epoch": 0.38, + "learning_rate": 0.00024325743778095058, + "loss": 0.0188, "step": 74980 }, { - "epoch": 0.81, - "learning_rate": 0.00017839722384380876, - "loss": 0.014, + "epoch": 0.38, + "learning_rate": 0.00024324987008793656, + "loss": 0.02, "step": 74990 }, { - "epoch": 0.81, - "learning_rate": 0.00017838100797820585, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024324230239492254, + "loss": 0.0191, "step": 75000 }, { - "epoch": 0.81, - "eval_cer": 0.9215417007593327, - "eval_loss": 0.009637880139052868, - "eval_runtime": 121.078, - "eval_samples_per_second": 16.518, - "eval_steps_per_second": 4.13, + "epoch": 0.38, + "eval_cer": 0.9144935454101719, + "eval_loss": 0.013869182206690311, + "eval_runtime": 116.7861, + "eval_samples_per_second": 17.125, + "eval_steps_per_second": 4.281, "step": 75000 }, { - "epoch": 0.81, - "learning_rate": 0.00017836479211260297, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.00024323473470190855, + "loss": 0.0208, "step": 75010 }, { - "epoch": 0.81, - "learning_rate": 0.00017834857624700006, - "loss": 0.0102, + "epoch": 0.38, + "learning_rate": 0.00024322716700889453, + "loss": 0.0217, "step": 75020 }, { - "epoch": 0.81, - "learning_rate": 0.00017833236038139713, - "loss": 0.0158, + "epoch": 0.38, + "learning_rate": 0.0002432195993158805, + "loss": 0.0162, "step": 75030 }, { - "epoch": 0.81, - "learning_rate": 0.00017831614451579425, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024321203162286652, + "loss": 0.0162, "step": 75040 }, { - "epoch": 0.81, - "learning_rate": 0.00017829992865019134, - "loss": 0.0108, + "epoch": 0.38, + "learning_rate": 0.0002432044639298525, + "loss": 0.0242, "step": 75050 }, { - "epoch": 0.81, - "learning_rate": 0.00017828371278458843, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024319689623683848, + "loss": 0.019, "step": 75060 }, { - "epoch": 0.81, - "learning_rate": 0.0001782674969189855, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.0002431893285438245, + "loss": 0.0189, "step": 75070 }, { - "epoch": 0.81, - "learning_rate": 0.00017825128105338262, - "loss": 0.0113, + "epoch": 0.38, + "learning_rate": 0.00024318176085081047, + "loss": 0.0169, "step": 75080 }, { - "epoch": 0.81, - "learning_rate": 0.0001782350651877797, - "loss": 0.0162, + "epoch": 0.38, + "learning_rate": 0.00024317419315779645, + "loss": 0.0173, "step": 75090 }, { - "epoch": 0.81, - "learning_rate": 0.0001782188493221768, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024316662546478246, + "loss": 0.0189, "step": 75100 }, { - "epoch": 0.81, - "learning_rate": 0.0001782026334565739, - "loss": 0.0131, + "epoch": 0.38, + "learning_rate": 0.00024315905777176844, + "loss": 0.0181, "step": 75110 }, { - "epoch": 0.81, - "learning_rate": 0.000178186417590971, - "loss": 0.0137, + "epoch": 0.38, + "learning_rate": 0.00024315149007875442, + "loss": 0.0204, "step": 75120 }, { - "epoch": 0.81, - "learning_rate": 0.00017817020172536808, - "loss": 0.0118, + "epoch": 0.38, + "learning_rate": 0.00024314392238574043, + "loss": 0.0199, "step": 75130 }, { - "epoch": 0.81, - "learning_rate": 0.0001781539858597652, - "loss": 0.0129, + "epoch": 0.38, + "learning_rate": 0.00024313635469272641, + "loss": 0.0169, "step": 75140 }, { - "epoch": 0.81, - "learning_rate": 0.00017813776999416227, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.0002431287869997124, + "loss": 0.0174, "step": 75150 }, { - "epoch": 0.81, - "learning_rate": 0.00017812155412855936, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024312121930669838, + "loss": 0.02, "step": 75160 }, { - "epoch": 0.81, - "learning_rate": 0.00017810533826295645, - "loss": 0.0151, + "epoch": 0.38, + "learning_rate": 0.00024311365161368439, + "loss": 0.0205, "step": 75170 }, { - "epoch": 0.81, - "learning_rate": 0.00017808912239735357, - "loss": 0.0147, + "epoch": 0.38, + "learning_rate": 0.00024310608392067037, + "loss": 0.0188, "step": 75180 }, { - "epoch": 0.81, - "learning_rate": 0.00017807290653175064, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024309851622765635, + "loss": 0.0221, "step": 75190 }, { - "epoch": 0.81, - "learning_rate": 0.00017805669066614773, - "loss": 0.0118, + "epoch": 0.38, + "learning_rate": 0.00024309094853464236, + "loss": 0.0181, "step": 75200 }, { - "epoch": 0.81, - "learning_rate": 0.00017804047480054485, - "loss": 0.0151, + "epoch": 0.38, + "learning_rate": 0.00024308338084162834, + "loss": 0.018, "step": 75210 }, { - "epoch": 0.81, - "learning_rate": 0.00017802425893494194, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.00024307581314861432, + "loss": 0.0225, "step": 75220 }, { - "epoch": 0.81, - "learning_rate": 0.000178008043069339, - "loss": 0.0151, + "epoch": 0.38, + "learning_rate": 0.00024306824545560033, + "loss": 0.0168, "step": 75230 }, { - "epoch": 0.81, - "learning_rate": 0.0001779918272037361, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.0002430606777625863, + "loss": 0.0179, "step": 75240 }, { - "epoch": 0.81, - "learning_rate": 0.00017797561133813322, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.0002430531100695723, + "loss": 0.0173, "step": 75250 }, { - "epoch": 0.81, - "learning_rate": 0.00017795939547253032, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.0002430455423765583, + "loss": 0.0203, "step": 75260 }, { - "epoch": 0.81, - "learning_rate": 0.00017794317960692738, - "loss": 0.0176, + "epoch": 0.38, + "learning_rate": 0.00024303797468354428, + "loss": 0.0186, "step": 75270 }, { - "epoch": 0.81, - "learning_rate": 0.0001779269637413245, - "loss": 0.011, + "epoch": 0.38, + "learning_rate": 0.00024303040699053026, + "loss": 0.0168, "step": 75280 }, { - "epoch": 0.81, - "learning_rate": 0.0001779107478757216, - "loss": 0.0159, + "epoch": 0.38, + "learning_rate": 0.00024302283929751627, + "loss": 0.019, "step": 75290 }, { - "epoch": 0.81, - "learning_rate": 0.00017789453201011869, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.00024301527160450225, + "loss": 0.0194, "step": 75300 }, { - "epoch": 0.81, - "learning_rate": 0.00017787831614451575, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024300770391148823, + "loss": 0.0195, "step": 75310 }, { - "epoch": 0.81, - "learning_rate": 0.00017786210027891287, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.00024300013621847422, + "loss": 0.0145, "step": 75320 }, { - "epoch": 0.81, - "learning_rate": 0.00017784588441330996, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024299256852546022, + "loss": 0.0141, "step": 75330 }, { - "epoch": 0.81, - "learning_rate": 0.00017782966854770708, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.0002429850008324462, + "loss": 0.0206, "step": 75340 }, { - "epoch": 0.81, - "learning_rate": 0.00017781345268210415, - "loss": 0.0151, + "epoch": 0.38, + "learning_rate": 0.0002429774331394322, + "loss": 0.0232, "step": 75350 }, { - "epoch": 0.81, - "learning_rate": 0.00017779723681650124, - "loss": 0.0139, + "epoch": 0.38, + "learning_rate": 0.0002429698654464182, + "loss": 0.0177, "step": 75360 }, { - "epoch": 0.81, - "learning_rate": 0.00017778102095089834, - "loss": 0.0174, + "epoch": 0.38, + "learning_rate": 0.00024296229775340418, + "loss": 0.0148, "step": 75370 }, { - "epoch": 0.81, - "learning_rate": 0.00017776480508529546, - "loss": 0.0153, + "epoch": 0.38, + "learning_rate": 0.00024295473006039016, + "loss": 0.0182, "step": 75380 }, { - "epoch": 0.82, - "learning_rate": 0.00017774858921969252, - "loss": 0.0114, + "epoch": 0.38, + "learning_rate": 0.00024294716236737617, + "loss": 0.0197, "step": 75390 }, { - "epoch": 0.82, - "learning_rate": 0.0001777323733540896, - "loss": 0.015, + "epoch": 0.38, + "learning_rate": 0.00024293959467436215, + "loss": 0.0162, "step": 75400 }, { - "epoch": 0.82, - "learning_rate": 0.00017771615748848673, - "loss": 0.0139, + "epoch": 0.38, + "learning_rate": 0.00024293202698134813, + "loss": 0.0181, "step": 75410 }, { - "epoch": 0.82, - "learning_rate": 0.00017769994162288383, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024292445928833414, + "loss": 0.0198, "step": 75420 }, { - "epoch": 0.82, - "learning_rate": 0.0001776837257572809, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024291689159532012, + "loss": 0.0172, "step": 75430 }, { - "epoch": 0.82, - "learning_rate": 0.00017766750989167798, - "loss": 0.0161, + "epoch": 0.38, + "learning_rate": 0.0002429093239023061, + "loss": 0.0187, "step": 75440 }, { - "epoch": 0.82, - "learning_rate": 0.0001776512940260751, - "loss": 0.0125, + "epoch": 0.38, + "learning_rate": 0.0002429017562092921, + "loss": 0.0137, "step": 75450 }, { - "epoch": 0.82, - "learning_rate": 0.0001776350781604722, - "loss": 0.0155, + "epoch": 0.38, + "learning_rate": 0.0002428941885162781, + "loss": 0.0202, "step": 75460 }, { - "epoch": 0.82, - "learning_rate": 0.00017761886229486926, - "loss": 0.0119, + "epoch": 0.38, + "learning_rate": 0.00024288662082326407, + "loss": 0.0159, "step": 75470 }, { - "epoch": 0.82, - "learning_rate": 0.00017760264642926638, - "loss": 0.0159, + "epoch": 0.38, + "learning_rate": 0.00024287905313025008, + "loss": 0.0231, "step": 75480 }, { - "epoch": 0.82, - "learning_rate": 0.00017758643056366348, - "loss": 0.0124, + "epoch": 0.38, + "learning_rate": 0.00024287148543723606, + "loss": 0.0209, "step": 75490 }, { - "epoch": 0.82, - "learning_rate": 0.00017757021469806057, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.00024286391774422204, + "loss": 0.0184, "step": 75500 }, { - "epoch": 0.82, - "learning_rate": 0.00017755399883245763, - "loss": 0.0131, + "epoch": 0.38, + "learning_rate": 0.00024285635005120803, + "loss": 0.0173, "step": 75510 }, { - "epoch": 0.82, - "learning_rate": 0.00017753778296685475, - "loss": 0.0108, + "epoch": 0.38, + "learning_rate": 0.00024284878235819403, + "loss": 0.0181, "step": 75520 }, { - "epoch": 0.82, - "learning_rate": 0.00017752156710125185, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.00024284121466518002, + "loss": 0.0188, "step": 75530 }, { - "epoch": 0.82, - "learning_rate": 0.00017750535123564894, - "loss": 0.015, + "epoch": 0.38, + "learning_rate": 0.000242833646972166, + "loss": 0.0179, "step": 75540 }, { - "epoch": 0.82, - "learning_rate": 0.00017748913537004606, - "loss": 0.0155, + "epoch": 0.38, + "learning_rate": 0.000242826079279152, + "loss": 0.0158, "step": 75550 }, { - "epoch": 0.82, - "learning_rate": 0.00017747291950444312, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.000242818511586138, + "loss": 0.0201, "step": 75560 }, { - "epoch": 0.82, - "learning_rate": 0.00017745670363884022, - "loss": 0.014, + "epoch": 0.38, + "learning_rate": 0.00024281094389312397, + "loss": 0.0166, "step": 75570 }, { - "epoch": 0.82, - "learning_rate": 0.00017744048777323734, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.00024280337620010998, + "loss": 0.0168, "step": 75580 }, { - "epoch": 0.82, - "learning_rate": 0.00017742427190763443, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024279580850709596, + "loss": 0.0188, "step": 75590 }, { - "epoch": 0.82, - "learning_rate": 0.0001774080560420315, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024278824081408194, + "loss": 0.018, "step": 75600 }, { - "epoch": 0.82, - "learning_rate": 0.0001773918401764286, - "loss": 0.0169, + "epoch": 0.38, + "learning_rate": 0.00024278067312106795, + "loss": 0.0191, "step": 75610 }, { - "epoch": 0.82, - "learning_rate": 0.0001773756243108257, - "loss": 0.0149, + "epoch": 0.38, + "learning_rate": 0.00024277310542805393, + "loss": 0.0172, "step": 75620 }, { - "epoch": 0.82, - "learning_rate": 0.0001773594084452228, - "loss": 0.0161, + "epoch": 0.38, + "learning_rate": 0.0002427655377350399, + "loss": 0.0191, "step": 75630 }, { - "epoch": 0.82, - "learning_rate": 0.00017734319257961987, - "loss": 0.0129, + "epoch": 0.38, + "learning_rate": 0.00024275797004202592, + "loss": 0.0216, "step": 75640 }, { - "epoch": 0.82, - "learning_rate": 0.00017732697671401699, - "loss": 0.0161, + "epoch": 0.38, + "learning_rate": 0.0002427504023490119, + "loss": 0.018, "step": 75650 }, { - "epoch": 0.82, - "learning_rate": 0.00017731076084841408, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024274283465599788, + "loss": 0.0179, "step": 75660 }, { - "epoch": 0.82, - "learning_rate": 0.00017729454498281117, - "loss": 0.0147, + "epoch": 0.38, + "learning_rate": 0.00024273526696298386, + "loss": 0.0238, "step": 75670 }, { - "epoch": 0.82, - "learning_rate": 0.00017727832911720826, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.00024272769926996987, + "loss": 0.0177, "step": 75680 }, { - "epoch": 0.82, - "learning_rate": 0.00017726211325160536, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.00024272013157695585, + "loss": 0.0169, "step": 75690 }, { - "epoch": 0.82, - "learning_rate": 0.00017724589738600245, - "loss": 0.0147, + "epoch": 0.38, + "learning_rate": 0.00024271256388394184, + "loss": 0.02, "step": 75700 }, { - "epoch": 0.82, - "learning_rate": 0.00017722968152039957, - "loss": 0.0164, + "epoch": 0.38, + "learning_rate": 0.00024270499619092784, + "loss": 0.0188, "step": 75710 }, { - "epoch": 0.82, - "learning_rate": 0.00017721346565479664, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024269742849791383, + "loss": 0.0197, "step": 75720 }, { - "epoch": 0.82, - "learning_rate": 0.00017719724978919373, - "loss": 0.0151, + "epoch": 0.38, + "learning_rate": 0.0002426898608048998, + "loss": 0.0168, "step": 75730 }, { - "epoch": 0.82, - "learning_rate": 0.00017718103392359082, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024268229311188582, + "loss": 0.018, "step": 75740 }, { - "epoch": 0.82, - "learning_rate": 0.00017716481805798794, - "loss": 0.0185, + "epoch": 0.38, + "learning_rate": 0.0002426747254188718, + "loss": 0.0186, "step": 75750 }, { - "epoch": 0.82, - "learning_rate": 0.000177148602192385, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024266715772585778, + "loss": 0.019, "step": 75760 }, { - "epoch": 0.82, - "learning_rate": 0.0001771323863267821, - "loss": 0.016, + "epoch": 0.38, + "learning_rate": 0.0002426595900328438, + "loss": 0.0165, "step": 75770 }, { - "epoch": 0.82, - "learning_rate": 0.00017711617046117922, - "loss": 0.0157, + "epoch": 0.38, + "learning_rate": 0.00024265202233982977, + "loss": 0.0161, "step": 75780 }, { - "epoch": 0.82, - "learning_rate": 0.0001770999545955763, - "loss": 0.0155, + "epoch": 0.38, + "learning_rate": 0.00024264445464681575, + "loss": 0.0233, "step": 75790 }, { - "epoch": 0.82, - "learning_rate": 0.00017708373872997338, - "loss": 0.0152, + "epoch": 0.38, + "learning_rate": 0.00024263688695380176, + "loss": 0.0207, "step": 75800 }, { - "epoch": 0.82, - "learning_rate": 0.00017706752286437047, - "loss": 0.0119, + "epoch": 0.38, + "learning_rate": 0.00024262931926078774, + "loss": 0.0291, "step": 75810 }, { - "epoch": 0.82, - "learning_rate": 0.0001770513069987676, - "loss": 0.0144, + "epoch": 0.38, + "learning_rate": 0.00024262175156777372, + "loss": 0.0234, "step": 75820 }, { - "epoch": 0.82, - "learning_rate": 0.00017703509113316468, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.0002426141838747597, + "loss": 0.0198, "step": 75830 }, { - "epoch": 0.82, - "learning_rate": 0.00017701887526756175, - "loss": 0.0135, + "epoch": 0.38, + "learning_rate": 0.0002426066161817457, + "loss": 0.0192, "step": 75840 }, { - "epoch": 0.82, - "learning_rate": 0.00017700265940195887, - "loss": 0.0162, + "epoch": 0.38, + "learning_rate": 0.0002425990484887317, + "loss": 0.0206, "step": 75850 }, { - "epoch": 0.82, - "learning_rate": 0.00017698644353635596, - "loss": 0.0155, + "epoch": 0.38, + "learning_rate": 0.00024259148079571767, + "loss": 0.0199, "step": 75860 }, { - "epoch": 0.82, - "learning_rate": 0.00017697022767075305, - "loss": 0.0162, + "epoch": 0.38, + "learning_rate": 0.00024258391310270368, + "loss": 0.014, "step": 75870 }, { - "epoch": 0.82, - "learning_rate": 0.00017695401180515012, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024257634540968966, + "loss": 0.0183, "step": 75880 }, { - "epoch": 0.82, - "learning_rate": 0.00017693779593954724, - "loss": 0.0137, + "epoch": 0.38, + "learning_rate": 0.00024256877771667565, + "loss": 0.0204, "step": 75890 }, { - "epoch": 0.82, - "learning_rate": 0.00017692158007394433, - "loss": 0.0124, + "epoch": 0.38, + "learning_rate": 0.00024256121002366165, + "loss": 0.017, "step": 75900 }, { - "epoch": 0.82, - "learning_rate": 0.00017690536420834142, - "loss": 0.0131, + "epoch": 0.38, + "learning_rate": 0.00024255364233064764, + "loss": 0.0169, "step": 75910 }, { - "epoch": 0.82, - "learning_rate": 0.00017688914834273852, - "loss": 0.0111, + "epoch": 0.38, + "learning_rate": 0.00024254607463763362, + "loss": 0.0174, "step": 75920 }, { - "epoch": 0.82, - "learning_rate": 0.0001768729324771356, - "loss": 0.0108, + "epoch": 0.38, + "learning_rate": 0.00024253850694461963, + "loss": 0.0183, "step": 75930 }, { - "epoch": 0.82, - "learning_rate": 0.0001768567166115327, - "loss": 0.0144, + "epoch": 0.38, + "learning_rate": 0.0002425309392516056, + "loss": 0.0181, "step": 75940 }, { - "epoch": 0.82, - "learning_rate": 0.00017684050074592982, - "loss": 0.0115, + "epoch": 0.38, + "learning_rate": 0.0002425233715585916, + "loss": 0.0183, "step": 75950 }, { - "epoch": 0.82, - "learning_rate": 0.0001768242848803269, - "loss": 0.0123, + "epoch": 0.38, + "learning_rate": 0.0002425158038655776, + "loss": 0.0183, "step": 75960 }, { - "epoch": 0.82, - "learning_rate": 0.00017680806901472398, - "loss": 0.0141, + "epoch": 0.38, + "learning_rate": 0.00024250823617256358, + "loss": 0.0203, "step": 75970 }, { - "epoch": 0.82, - "learning_rate": 0.0001767918531491211, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.00024250066847954956, + "loss": 0.0179, "step": 75980 }, { - "epoch": 0.82, - "learning_rate": 0.0001767756372835182, - "loss": 0.0178, + "epoch": 0.38, + "learning_rate": 0.00024249310078653557, + "loss": 0.0203, "step": 75990 }, { - "epoch": 0.82, - "learning_rate": 0.00017675942141791526, - "loss": 0.0106, + "epoch": 0.38, + "learning_rate": 0.00024248553309352155, + "loss": 0.0175, "step": 76000 }, { - "epoch": 0.82, - "eval_cer": 0.9215929483337589, - "eval_loss": 0.010436671786010265, - "eval_runtime": 121.1923, - "eval_samples_per_second": 16.503, - "eval_steps_per_second": 4.126, + "epoch": 0.38, + "eval_cer": 0.9144925750140465, + "eval_loss": 0.012879201211035252, + "eval_runtime": 116.6021, + "eval_samples_per_second": 17.152, + "eval_steps_per_second": 4.288, "step": 76000 }, { - "epoch": 0.82, - "learning_rate": 0.00017674320555231235, - "loss": 0.0147, + "epoch": 0.38, + "learning_rate": 0.00024247796540050753, + "loss": 0.0189, "step": 76010 }, { - "epoch": 0.82, - "learning_rate": 0.00017672698968670947, - "loss": 0.0184, + "epoch": 0.38, + "learning_rate": 0.0002424703977074935, + "loss": 0.0175, "step": 76020 }, { - "epoch": 0.82, - "learning_rate": 0.00017671077382110656, - "loss": 0.0247, + "epoch": 0.38, + "learning_rate": 0.00024246283001447952, + "loss": 0.0171, "step": 76030 }, { - "epoch": 0.82, - "learning_rate": 0.00017669455795550363, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.0002424552623214655, + "loss": 0.0174, "step": 76040 }, { - "epoch": 0.82, - "learning_rate": 0.00017667834208990075, - "loss": 0.0135, + "epoch": 0.38, + "learning_rate": 0.00024244769462845146, + "loss": 0.0159, "step": 76050 }, { - "epoch": 0.82, - "learning_rate": 0.00017666212622429784, - "loss": 0.0151, + "epoch": 0.38, + "learning_rate": 0.00024244012693543744, + "loss": 0.0189, "step": 76060 }, { - "epoch": 0.82, - "learning_rate": 0.00017664591035869494, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024243255924242345, + "loss": 0.0171, "step": 76070 }, { - "epoch": 0.82, - "learning_rate": 0.000176629694493092, - "loss": 0.016, + "epoch": 0.38, + "learning_rate": 0.00024242499154940943, + "loss": 0.0219, "step": 76080 }, { - "epoch": 0.82, - "learning_rate": 0.00017661347862748912, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.0002424174238563954, + "loss": 0.0165, "step": 76090 }, { - "epoch": 0.82, - "learning_rate": 0.00017659726276188621, - "loss": 0.0135, + "epoch": 0.38, + "learning_rate": 0.00024240985616338142, + "loss": 0.0196, "step": 76100 }, { - "epoch": 0.82, - "learning_rate": 0.0001765810468962833, - "loss": 0.0165, + "epoch": 0.38, + "learning_rate": 0.0002424022884703674, + "loss": 0.0203, "step": 76110 }, { - "epoch": 0.82, - "learning_rate": 0.0001765648310306804, - "loss": 0.016, + "epoch": 0.38, + "learning_rate": 0.00024239472077735338, + "loss": 0.0205, "step": 76120 }, { - "epoch": 0.82, - "learning_rate": 0.0001765486151650775, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.0002423871530843394, + "loss": 0.0197, "step": 76130 }, { - "epoch": 0.82, - "learning_rate": 0.00017653239929947458, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024237958539132537, + "loss": 0.0179, "step": 76140 }, { - "epoch": 0.82, - "learning_rate": 0.0001765161834338717, - "loss": 0.0153, + "epoch": 0.38, + "learning_rate": 0.00024237201769831135, + "loss": 0.0143, "step": 76150 }, { - "epoch": 0.82, - "learning_rate": 0.00017649996756826877, - "loss": 0.016, + "epoch": 0.38, + "learning_rate": 0.00024236445000529736, + "loss": 0.0198, "step": 76160 }, { - "epoch": 0.82, - "learning_rate": 0.00017648375170266586, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024235688231228334, + "loss": 0.019, "step": 76170 }, { - "epoch": 0.82, - "learning_rate": 0.00017646753583706296, - "loss": 0.0148, + "epoch": 0.38, + "learning_rate": 0.00024234931461926932, + "loss": 0.0217, "step": 76180 }, { - "epoch": 0.82, - "learning_rate": 0.00017645131997146008, - "loss": 0.017, + "epoch": 0.38, + "learning_rate": 0.00024234174692625533, + "loss": 0.0185, "step": 76190 }, { - "epoch": 0.82, - "learning_rate": 0.00017643510410585714, - "loss": 0.0166, + "epoch": 0.38, + "learning_rate": 0.00024233417923324131, + "loss": 0.0181, "step": 76200 }, { - "epoch": 0.82, - "learning_rate": 0.00017641888824025423, - "loss": 0.0155, + "epoch": 0.38, + "learning_rate": 0.0002423266115402273, + "loss": 0.0206, "step": 76210 }, { - "epoch": 0.82, - "learning_rate": 0.00017640267237465135, - "loss": 0.0167, + "epoch": 0.38, + "learning_rate": 0.00024231904384721328, + "loss": 0.0172, "step": 76220 }, { - "epoch": 0.82, - "learning_rate": 0.00017638645650904845, - "loss": 0.0202, + "epoch": 0.38, + "learning_rate": 0.00024231147615419929, + "loss": 0.0185, "step": 76230 }, { - "epoch": 0.82, - "learning_rate": 0.0001763702406434455, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024230390846118527, + "loss": 0.0209, "step": 76240 }, { - "epoch": 0.82, - "learning_rate": 0.0001763540247778426, - "loss": 0.0181, + "epoch": 0.38, + "learning_rate": 0.00024229634076817125, + "loss": 0.0186, "step": 76250 }, { - "epoch": 0.82, - "learning_rate": 0.00017633780891223972, - "loss": 0.0112, + "epoch": 0.38, + "learning_rate": 0.00024228877307515726, + "loss": 0.0212, "step": 76260 }, { - "epoch": 0.82, - "learning_rate": 0.00017632159304663682, - "loss": 0.0164, + "epoch": 0.38, + "learning_rate": 0.00024228120538214324, + "loss": 0.0172, "step": 76270 }, { - "epoch": 0.82, - "learning_rate": 0.00017630537718103394, - "loss": 0.0131, + "epoch": 0.38, + "learning_rate": 0.00024227363768912922, + "loss": 0.0169, "step": 76280 }, { - "epoch": 0.82, - "learning_rate": 0.000176289161315431, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.00024226606999611523, + "loss": 0.0176, "step": 76290 }, { - "epoch": 0.82, - "learning_rate": 0.0001762729454498281, - "loss": 0.0149, + "epoch": 0.38, + "learning_rate": 0.0002422585023031012, + "loss": 0.0183, "step": 76300 }, { - "epoch": 0.82, - "learning_rate": 0.0001762567295842252, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.0002422509346100872, + "loss": 0.0154, "step": 76310 }, { - "epoch": 0.83, - "learning_rate": 0.0001762405137186223, - "loss": 0.015, + "epoch": 0.39, + "learning_rate": 0.0002422433669170732, + "loss": 0.0204, "step": 76320 }, { - "epoch": 0.83, - "learning_rate": 0.00017622429785301937, - "loss": 0.0149, + "epoch": 0.39, + "learning_rate": 0.00024223579922405918, + "loss": 0.018, "step": 76330 }, { - "epoch": 0.83, - "learning_rate": 0.00017620808198741647, - "loss": 0.0138, + "epoch": 0.39, + "learning_rate": 0.00024222823153104516, + "loss": 0.0238, "step": 76340 }, { - "epoch": 0.83, - "learning_rate": 0.0001761918661218136, - "loss": 0.0187, + "epoch": 0.39, + "learning_rate": 0.00024222066383803117, + "loss": 0.0168, "step": 76350 }, { - "epoch": 0.83, - "learning_rate": 0.00017617565025621068, - "loss": 0.0154, + "epoch": 0.39, + "learning_rate": 0.00024221309614501715, + "loss": 0.0149, "step": 76360 }, { - "epoch": 0.83, - "learning_rate": 0.00017615943439060775, - "loss": 0.0169, + "epoch": 0.39, + "learning_rate": 0.00024220552845200313, + "loss": 0.0194, "step": 76370 }, { - "epoch": 0.83, - "learning_rate": 0.00017614321852500484, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024219796075898914, + "loss": 0.0177, "step": 76380 }, { - "epoch": 0.83, - "learning_rate": 0.00017612700265940196, - "loss": 0.0165, + "epoch": 0.39, + "learning_rate": 0.00024219039306597512, + "loss": 0.0185, "step": 76390 }, { - "epoch": 0.83, - "learning_rate": 0.00017611078679379905, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.0002421828253729611, + "loss": 0.0173, "step": 76400 }, { - "epoch": 0.83, - "learning_rate": 0.00017609457092819612, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.0002421752576799471, + "loss": 0.0188, "step": 76410 }, { - "epoch": 0.83, - "learning_rate": 0.00017607835506259324, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.0002421676899869331, + "loss": 0.0212, "step": 76420 }, { - "epoch": 0.83, - "learning_rate": 0.00017606213919699033, - "loss": 0.0145, + "epoch": 0.39, + "learning_rate": 0.00024216012229391908, + "loss": 0.0176, "step": 76430 }, { - "epoch": 0.83, - "learning_rate": 0.00017604592333138742, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024215255460090506, + "loss": 0.0186, "step": 76440 }, { - "epoch": 0.83, - "learning_rate": 0.0001760297074657845, - "loss": 0.0135, + "epoch": 0.39, + "learning_rate": 0.00024214498690789107, + "loss": 0.0174, "step": 76450 }, { - "epoch": 0.83, - "learning_rate": 0.0001760134916001816, - "loss": 0.0128, + "epoch": 0.39, + "learning_rate": 0.00024213741921487705, + "loss": 0.0178, "step": 76460 }, { - "epoch": 0.83, - "learning_rate": 0.0001759972757345787, - "loss": 0.013, + "epoch": 0.39, + "learning_rate": 0.00024212985152186303, + "loss": 0.0196, "step": 76470 }, { - "epoch": 0.83, - "learning_rate": 0.0001759810598689758, - "loss": 0.0151, + "epoch": 0.39, + "learning_rate": 0.00024212228382884904, + "loss": 0.0174, "step": 76480 }, { - "epoch": 0.83, - "learning_rate": 0.00017596484400337289, - "loss": 0.0106, + "epoch": 0.39, + "learning_rate": 0.00024211471613583502, + "loss": 0.016, "step": 76490 }, { - "epoch": 0.83, - "learning_rate": 0.00017594862813776998, - "loss": 0.0135, + "epoch": 0.39, + "learning_rate": 0.000242107148442821, + "loss": 0.0139, "step": 76500 }, { - "epoch": 0.83, - "learning_rate": 0.00017593241227216707, - "loss": 0.0172, + "epoch": 0.39, + "learning_rate": 0.000242099580749807, + "loss": 0.0174, "step": 76510 }, { - "epoch": 0.83, - "learning_rate": 0.0001759161964065642, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.000242092013056793, + "loss": 0.0215, "step": 76520 }, { - "epoch": 0.83, - "learning_rate": 0.00017589998054096126, - "loss": 0.0116, + "epoch": 0.39, + "learning_rate": 0.00024208444536377897, + "loss": 0.0173, "step": 76530 }, { - "epoch": 0.83, - "learning_rate": 0.00017588376467535835, - "loss": 0.0169, + "epoch": 0.39, + "learning_rate": 0.00024207687767076498, + "loss": 0.0189, "step": 76540 }, { - "epoch": 0.83, - "learning_rate": 0.00017586754880975544, - "loss": 0.0142, + "epoch": 0.39, + "learning_rate": 0.00024206930997775096, + "loss": 0.0173, "step": 76550 }, { - "epoch": 0.83, - "learning_rate": 0.00017585133294415256, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.00024206174228473694, + "loss": 0.018, "step": 76560 }, { - "epoch": 0.83, - "learning_rate": 0.00017583511707854963, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024205417459172293, + "loss": 0.055, "step": 76570 }, { - "epoch": 0.83, - "learning_rate": 0.00017581890121294672, - "loss": 0.0128, + "epoch": 0.39, + "learning_rate": 0.00024204660689870893, + "loss": 0.0154, "step": 76580 }, { - "epoch": 0.83, - "learning_rate": 0.00017580268534734384, - "loss": 0.0113, + "epoch": 0.39, + "learning_rate": 0.00024203903920569492, + "loss": 0.0182, "step": 76590 }, { - "epoch": 0.83, - "learning_rate": 0.00017578646948174093, - "loss": 0.0116, + "epoch": 0.39, + "learning_rate": 0.0002420314715126809, + "loss": 0.0171, "step": 76600 }, { - "epoch": 0.83, - "learning_rate": 0.000175770253616138, - "loss": 0.0126, + "epoch": 0.39, + "learning_rate": 0.0002420239038196669, + "loss": 0.0193, "step": 76610 }, { - "epoch": 0.83, - "learning_rate": 0.0001757540377505351, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.0002420163361266529, + "loss": 0.0184, "step": 76620 }, { - "epoch": 0.83, - "learning_rate": 0.0001757378218849322, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024200876843363887, + "loss": 0.0205, "step": 76630 }, { - "epoch": 0.83, - "learning_rate": 0.0001757216060193293, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.00024200120074062488, + "loss": 0.0199, "step": 76640 }, { - "epoch": 0.83, - "learning_rate": 0.00017570539015372637, - "loss": 0.0119, + "epoch": 0.39, + "learning_rate": 0.00024199363304761086, + "loss": 0.0182, "step": 76650 }, { - "epoch": 0.83, - "learning_rate": 0.0001756891742881235, - "loss": 0.0127, + "epoch": 0.39, + "learning_rate": 0.00024198606535459684, + "loss": 0.0166, "step": 76660 }, { - "epoch": 0.83, - "learning_rate": 0.00017567295842252058, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.00024197849766158285, + "loss": 0.0187, "step": 76670 }, { - "epoch": 0.83, - "learning_rate": 0.00017565674255691767, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024197092996856883, + "loss": 0.0168, "step": 76680 }, { - "epoch": 0.83, - "learning_rate": 0.00017564052669131474, - "loss": 0.0148, + "epoch": 0.39, + "learning_rate": 0.0002419633622755548, + "loss": 0.0145, "step": 76690 }, { - "epoch": 0.83, - "learning_rate": 0.00017562431082571186, - "loss": 0.013, + "epoch": 0.39, + "learning_rate": 0.00024195579458254082, + "loss": 0.0157, "step": 76700 }, { - "epoch": 0.83, - "learning_rate": 0.00017560809496010895, - "loss": 0.0151, + "epoch": 0.39, + "learning_rate": 0.0002419482268895268, + "loss": 0.0168, "step": 76710 }, { - "epoch": 0.83, - "learning_rate": 0.00017559187909450607, - "loss": 0.0105, + "epoch": 0.39, + "learning_rate": 0.00024194065919651278, + "loss": 0.0172, "step": 76720 }, { - "epoch": 0.83, - "learning_rate": 0.00017557566322890314, - "loss": 0.0156, + "epoch": 0.39, + "learning_rate": 0.00024193309150349876, + "loss": 0.0186, "step": 76730 }, { - "epoch": 0.83, - "learning_rate": 0.00017555944736330023, - "loss": 0.0158, + "epoch": 0.39, + "learning_rate": 0.00024192552381048477, + "loss": 0.0141, "step": 76740 }, { - "epoch": 0.83, - "learning_rate": 0.00017554323149769732, - "loss": 0.0158, + "epoch": 0.39, + "learning_rate": 0.00024191795611747075, + "loss": 0.0183, "step": 76750 }, { - "epoch": 0.83, - "learning_rate": 0.00017552701563209444, - "loss": 0.0175, + "epoch": 0.39, + "learning_rate": 0.00024191038842445674, + "loss": 0.0196, "step": 76760 }, { - "epoch": 0.83, - "learning_rate": 0.0001755107997664915, - "loss": 0.0163, + "epoch": 0.39, + "learning_rate": 0.00024190282073144274, + "loss": 0.0201, "step": 76770 }, { - "epoch": 0.83, - "learning_rate": 0.0001754945839008886, - "loss": 0.0167, + "epoch": 0.39, + "learning_rate": 0.00024189525303842873, + "loss": 0.0201, "step": 76780 }, { - "epoch": 0.83, - "learning_rate": 0.00017547836803528572, - "loss": 0.0137, + "epoch": 0.39, + "learning_rate": 0.0002418876853454147, + "loss": 0.0148, "step": 76790 }, { - "epoch": 0.83, - "learning_rate": 0.00017546215216968281, - "loss": 0.0138, + "epoch": 0.39, + "learning_rate": 0.00024188011765240072, + "loss": 0.0211, "step": 76800 }, { - "epoch": 0.83, - "learning_rate": 0.00017544593630407988, - "loss": 0.0118, + "epoch": 0.39, + "learning_rate": 0.0002418725499593867, + "loss": 0.0213, "step": 76810 }, { - "epoch": 0.83, - "learning_rate": 0.00017542972043847697, - "loss": 0.0181, + "epoch": 0.39, + "learning_rate": 0.00024186498226637268, + "loss": 0.0161, "step": 76820 }, { - "epoch": 0.83, - "learning_rate": 0.0001754135045728741, - "loss": 0.0137, + "epoch": 0.39, + "learning_rate": 0.0002418574145733587, + "loss": 0.0179, "step": 76830 }, { - "epoch": 0.83, - "learning_rate": 0.00017539728870727119, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024184984688034467, + "loss": 0.0152, "step": 76840 }, { - "epoch": 0.83, - "learning_rate": 0.00017538107284166825, - "loss": 0.0143, + "epoch": 0.39, + "learning_rate": 0.00024184227918733065, + "loss": 0.0195, "step": 76850 }, { - "epoch": 0.83, - "learning_rate": 0.00017536485697606537, - "loss": 0.0152, + "epoch": 0.39, + "learning_rate": 0.00024183471149431666, + "loss": 0.0214, "step": 76860 }, { - "epoch": 0.83, - "learning_rate": 0.00017534864111046246, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.00024182714380130264, + "loss": 0.0268, "step": 76870 }, { - "epoch": 0.83, - "learning_rate": 0.00017533242524485956, - "loss": 0.0156, + "epoch": 0.39, + "learning_rate": 0.00024181957610828862, + "loss": 0.0213, "step": 76880 }, { - "epoch": 0.83, - "learning_rate": 0.00017531620937925662, - "loss": 0.0157, + "epoch": 0.39, + "learning_rate": 0.00024181200841527463, + "loss": 0.0185, "step": 76890 }, { - "epoch": 0.83, - "learning_rate": 0.00017529999351365374, - "loss": 0.0175, + "epoch": 0.39, + "learning_rate": 0.0002418044407222606, + "loss": 0.0198, "step": 76900 }, { - "epoch": 0.83, - "learning_rate": 0.00017528377764805083, - "loss": 0.0119, + "epoch": 0.39, + "learning_rate": 0.0002417968730292466, + "loss": 0.0206, "step": 76910 }, { - "epoch": 0.83, - "learning_rate": 0.00017526756178244793, - "loss": 0.0145, + "epoch": 0.39, + "learning_rate": 0.00024178930533623257, + "loss": 0.0165, "step": 76920 }, { - "epoch": 0.83, - "learning_rate": 0.00017525134591684502, - "loss": 0.0162, + "epoch": 0.39, + "learning_rate": 0.00024178173764321858, + "loss": 0.0171, "step": 76930 }, { - "epoch": 0.83, - "learning_rate": 0.0001752351300512421, - "loss": 0.0158, + "epoch": 0.39, + "learning_rate": 0.00024177416995020456, + "loss": 0.0183, "step": 76940 }, { - "epoch": 0.83, - "learning_rate": 0.0001752189141856392, - "loss": 0.0135, + "epoch": 0.39, + "learning_rate": 0.00024176660225719055, + "loss": 0.0224, "step": 76950 }, { - "epoch": 0.83, - "learning_rate": 0.00017520269832003633, - "loss": 0.0145, + "epoch": 0.39, + "learning_rate": 0.00024175903456417655, + "loss": 0.0219, "step": 76960 }, { - "epoch": 0.83, - "learning_rate": 0.00017518648245443342, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024175146687116254, + "loss": 0.0175, "step": 76970 }, { - "epoch": 0.83, - "learning_rate": 0.00017517026658883048, - "loss": 0.0156, + "epoch": 0.39, + "learning_rate": 0.00024174389917814852, + "loss": 0.0131, "step": 76980 }, { - "epoch": 0.83, - "learning_rate": 0.0001751540507232276, - "loss": 0.0163, + "epoch": 0.39, + "learning_rate": 0.00024173633148513453, + "loss": 0.0148, "step": 76990 }, { - "epoch": 0.83, - "learning_rate": 0.0001751378348576247, - "loss": 0.0176, + "epoch": 0.39, + "learning_rate": 0.0002417287637921205, + "loss": 0.0143, "step": 77000 }, { - "epoch": 0.83, - "eval_cer": 0.9215825250982824, - "eval_loss": 0.010247960686683655, - "eval_runtime": 121.2734, - "eval_samples_per_second": 16.492, - "eval_steps_per_second": 4.123, + "epoch": 0.39, + "eval_cer": 0.9144974269946735, + "eval_loss": 0.012495556846261024, + "eval_runtime": 116.5435, + "eval_samples_per_second": 17.161, + "eval_steps_per_second": 4.29, "step": 77000 }, { - "epoch": 0.83, - "learning_rate": 0.0001751216189920218, - "loss": 0.0163, + "epoch": 0.39, + "learning_rate": 0.0002417211960991065, + "loss": 0.0195, "step": 77010 }, { - "epoch": 0.83, - "learning_rate": 0.00017510540312641885, - "loss": 0.0138, + "epoch": 0.39, + "learning_rate": 0.0002417136284060925, + "loss": 0.0186, "step": 77020 }, { - "epoch": 0.83, - "learning_rate": 0.00017508918726081597, - "loss": 0.0126, + "epoch": 0.39, + "learning_rate": 0.00024170606071307848, + "loss": 0.0197, "step": 77030 }, { - "epoch": 0.83, - "learning_rate": 0.00017507297139521307, - "loss": 0.013, + "epoch": 0.39, + "learning_rate": 0.00024169849302006446, + "loss": 0.0182, "step": 77040 }, { - "epoch": 0.83, - "learning_rate": 0.00017505675552961016, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024169092532705047, + "loss": 0.0164, "step": 77050 }, { - "epoch": 0.83, - "learning_rate": 0.00017504053966400725, - "loss": 0.0128, + "epoch": 0.39, + "learning_rate": 0.00024168335763403645, + "loss": 0.0151, "step": 77060 }, { - "epoch": 0.83, - "learning_rate": 0.00017502432379840435, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024167578994102243, + "loss": 0.0165, "step": 77070 }, { - "epoch": 0.83, - "learning_rate": 0.00017500810793280144, - "loss": 0.0147, + "epoch": 0.39, + "learning_rate": 0.0002416682222480084, + "loss": 0.019, "step": 77080 }, { - "epoch": 0.83, - "learning_rate": 0.00017499189206719856, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.00024166065455499442, + "loss": 0.0179, "step": 77090 }, { - "epoch": 0.83, - "learning_rate": 0.00017497567620159562, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.0002416530868619804, + "loss": 0.0245, "step": 77100 }, { - "epoch": 0.83, - "learning_rate": 0.00017495946033599272, - "loss": 0.0174, + "epoch": 0.39, + "learning_rate": 0.00024164551916896638, + "loss": 0.0208, "step": 77110 }, { - "epoch": 0.83, - "learning_rate": 0.0001749432444703898, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.0002416379514759524, + "loss": 0.0195, "step": 77120 }, { - "epoch": 0.83, - "learning_rate": 0.00017492702860478693, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.00024163038378293837, + "loss": 0.018, "step": 77130 }, { - "epoch": 0.83, - "learning_rate": 0.000174910812739184, - "loss": 0.0107, + "epoch": 0.39, + "learning_rate": 0.00024162281608992436, + "loss": 0.0153, "step": 77140 }, { - "epoch": 0.83, - "learning_rate": 0.0001748945968735811, - "loss": 0.0128, + "epoch": 0.39, + "learning_rate": 0.00024161524839691036, + "loss": 0.0219, "step": 77150 }, { - "epoch": 0.83, - "learning_rate": 0.0001748783810079782, - "loss": 0.0147, + "epoch": 0.39, + "learning_rate": 0.00024160768070389635, + "loss": 0.0184, "step": 77160 }, { - "epoch": 0.83, - "learning_rate": 0.0001748621651423753, - "loss": 0.0121, + "epoch": 0.39, + "learning_rate": 0.00024160011301088233, + "loss": 0.0222, "step": 77170 }, { - "epoch": 0.83, - "learning_rate": 0.00017484594927677237, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.00024159254531786834, + "loss": 0.0227, "step": 77180 }, { - "epoch": 0.83, - "learning_rate": 0.00017482973341116946, - "loss": 0.0143, + "epoch": 0.39, + "learning_rate": 0.00024158497762485432, + "loss": 0.0192, "step": 77190 }, { - "epoch": 0.83, - "learning_rate": 0.00017481351754556658, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.0002415774099318403, + "loss": 0.0174, "step": 77200 }, { - "epoch": 0.83, - "learning_rate": 0.00017479730167996367, - "loss": 0.0143, + "epoch": 0.39, + "learning_rate": 0.0002415698422388263, + "loss": 0.0127, "step": 77210 }, { - "epoch": 0.83, - "learning_rate": 0.00017478108581436074, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.0002415622745458123, + "loss": 0.0152, "step": 77220 }, { - "epoch": 0.83, - "learning_rate": 0.00017476486994875786, - "loss": 0.0149, + "epoch": 0.39, + "learning_rate": 0.00024155470685279827, + "loss": 0.0163, "step": 77230 }, { - "epoch": 0.84, - "learning_rate": 0.00017474865408315495, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.00024154713915978425, + "loss": 0.0172, "step": 77240 }, { - "epoch": 0.84, - "learning_rate": 0.00017473243821755204, - "loss": 0.0166, + "epoch": 0.39, + "learning_rate": 0.00024153957146677026, + "loss": 0.0155, "step": 77250 }, { - "epoch": 0.84, - "learning_rate": 0.0001747162223519491, - "loss": 0.015, + "epoch": 0.39, + "learning_rate": 0.00024153200377375624, + "loss": 0.0181, "step": 77260 }, { - "epoch": 0.84, - "learning_rate": 0.00017470000648634623, - "loss": 0.015, + "epoch": 0.39, + "learning_rate": 0.00024152443608074222, + "loss": 0.0185, "step": 77270 }, { - "epoch": 0.84, - "learning_rate": 0.00017468379062074332, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.00024151686838772823, + "loss": 0.0179, "step": 77280 }, { - "epoch": 0.84, - "learning_rate": 0.00017466757475514044, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.0002415093006947142, + "loss": 0.0157, "step": 77290 }, { - "epoch": 0.84, - "learning_rate": 0.0001746513588895375, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024150173300170017, + "loss": 0.0166, "step": 77300 }, { - "epoch": 0.84, - "learning_rate": 0.0001746351430239346, - "loss": 0.0168, + "epoch": 0.39, + "learning_rate": 0.00024149416530868615, + "loss": 0.0131, "step": 77310 }, { - "epoch": 0.84, - "learning_rate": 0.0001746189271583317, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.00024148659761567216, + "loss": 0.0155, "step": 77320 }, { - "epoch": 0.84, - "learning_rate": 0.0001746027112927288, - "loss": 0.0118, + "epoch": 0.39, + "learning_rate": 0.00024147902992265814, + "loss": 0.0166, "step": 77330 }, { - "epoch": 0.84, - "learning_rate": 0.00017458649542712588, - "loss": 0.0151, + "epoch": 0.39, + "learning_rate": 0.00024147146222964412, + "loss": 0.0178, "step": 77340 }, { - "epoch": 0.84, - "learning_rate": 0.00017457027956152297, - "loss": 0.0148, + "epoch": 0.39, + "learning_rate": 0.00024146389453663013, + "loss": 0.0167, "step": 77350 }, { - "epoch": 0.84, - "learning_rate": 0.0001745540636959201, - "loss": 0.0147, + "epoch": 0.39, + "learning_rate": 0.0002414563268436161, + "loss": 0.0167, "step": 77360 }, { - "epoch": 0.84, - "learning_rate": 0.00017453784783031718, - "loss": 0.0174, + "epoch": 0.39, + "learning_rate": 0.0002414487591506021, + "loss": 0.0177, "step": 77370 }, { - "epoch": 0.84, - "learning_rate": 0.00017452163196471425, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.0002414411914575881, + "loss": 0.0204, "step": 77380 }, { - "epoch": 0.84, - "learning_rate": 0.00017450541609911134, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024143362376457408, + "loss": 0.0167, "step": 77390 }, { - "epoch": 0.84, - "learning_rate": 0.00017448920023350846, - "loss": 0.0165, + "epoch": 0.39, + "learning_rate": 0.00024142605607156006, + "loss": 0.0173, "step": 77400 }, { - "epoch": 0.84, - "learning_rate": 0.00017447298436790555, - "loss": 0.0157, + "epoch": 0.39, + "learning_rate": 0.00024141848837854607, + "loss": 0.0181, "step": 77410 }, { - "epoch": 0.84, - "learning_rate": 0.00017445676850230262, - "loss": 0.0169, + "epoch": 0.39, + "learning_rate": 0.00024141092068553205, + "loss": 0.0166, "step": 77420 }, { - "epoch": 0.84, - "learning_rate": 0.00017444055263669974, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024140335299251803, + "loss": 0.0169, "step": 77430 }, { - "epoch": 0.84, - "learning_rate": 0.00017442433677109683, - "loss": 0.0154, + "epoch": 0.39, + "learning_rate": 0.00024139578529950404, + "loss": 0.0234, "step": 77440 }, { - "epoch": 0.84, - "learning_rate": 0.00017440812090549392, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.00024138821760649002, + "loss": 0.0164, "step": 77450 }, { - "epoch": 0.84, - "learning_rate": 0.000174391905039891, - "loss": 0.0138, + "epoch": 0.39, + "learning_rate": 0.000241380649913476, + "loss": 0.0178, "step": 77460 }, { - "epoch": 0.84, - "learning_rate": 0.0001743756891742881, - "loss": 0.0147, + "epoch": 0.39, + "learning_rate": 0.000241373082220462, + "loss": 0.0183, "step": 77470 }, { - "epoch": 0.84, - "learning_rate": 0.0001743594733086852, - "loss": 0.0138, + "epoch": 0.39, + "learning_rate": 0.000241365514527448, + "loss": 0.0161, "step": 77480 }, { - "epoch": 0.84, - "learning_rate": 0.0001743432574430823, - "loss": 0.0176, + "epoch": 0.39, + "learning_rate": 0.00024135794683443398, + "loss": 0.0137, "step": 77490 }, { - "epoch": 0.84, - "learning_rate": 0.0001743270415774794, - "loss": 0.0119, + "epoch": 0.39, + "learning_rate": 0.00024135037914141996, + "loss": 0.0194, "step": 77500 }, { - "epoch": 0.84, - "learning_rate": 0.00017431082571187648, - "loss": 0.0148, + "epoch": 0.39, + "learning_rate": 0.00024134281144840597, + "loss": 0.021, "step": 77510 }, { - "epoch": 0.84, - "learning_rate": 0.00017429460984627357, - "loss": 0.0106, + "epoch": 0.39, + "learning_rate": 0.00024133524375539195, + "loss": 0.0157, "step": 77520 }, { - "epoch": 0.84, - "learning_rate": 0.0001742783939806707, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.00024132767606237793, + "loss": 0.0172, "step": 77530 }, { - "epoch": 0.84, - "learning_rate": 0.00017426217811506776, - "loss": 0.017, + "epoch": 0.39, + "learning_rate": 0.00024132010836936394, + "loss": 0.0174, "step": 77540 }, { - "epoch": 0.84, - "learning_rate": 0.00017424596224946485, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.00024131254067634992, + "loss": 0.017, "step": 77550 }, { - "epoch": 0.84, - "learning_rate": 0.00017422974638386194, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.0002413049729833359, + "loss": 0.0159, "step": 77560 }, { - "epoch": 0.84, - "learning_rate": 0.00017421353051825906, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.0002412974052903219, + "loss": 0.0197, "step": 77570 }, { - "epoch": 0.84, - "learning_rate": 0.00017419731465265613, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.0002412898375973079, + "loss": 0.0176, "step": 77580 }, { - "epoch": 0.84, - "learning_rate": 0.00017418109878705322, - "loss": 0.0158, + "epoch": 0.39, + "learning_rate": 0.00024128226990429387, + "loss": 0.0166, "step": 77590 }, { - "epoch": 0.84, - "learning_rate": 0.00017416488292145034, - "loss": 0.0143, + "epoch": 0.39, + "learning_rate": 0.00024127470221127988, + "loss": 0.019, "step": 77600 }, { - "epoch": 0.84, - "learning_rate": 0.00017414866705584744, - "loss": 0.0166, + "epoch": 0.39, + "learning_rate": 0.00024126713451826586, + "loss": 0.018, "step": 77610 }, { - "epoch": 0.84, - "learning_rate": 0.0001741324511902445, - "loss": 0.0116, + "epoch": 0.39, + "learning_rate": 0.00024125956682525184, + "loss": 0.0185, "step": 77620 }, { - "epoch": 0.84, - "learning_rate": 0.0001741162353246416, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024125199913223783, + "loss": 0.0178, "step": 77630 }, { - "epoch": 0.84, - "learning_rate": 0.0001741000194590387, - "loss": 0.0148, + "epoch": 0.39, + "learning_rate": 0.00024124443143922383, + "loss": 0.02, "step": 77640 }, { - "epoch": 0.84, - "learning_rate": 0.0001740838035934358, - "loss": 0.011, + "epoch": 0.39, + "learning_rate": 0.00024123686374620982, + "loss": 0.0173, "step": 77650 }, { - "epoch": 0.84, - "learning_rate": 0.00017406758772783287, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.0002412292960531958, + "loss": 0.019, "step": 77660 }, { - "epoch": 0.84, - "learning_rate": 0.00017405137186223, - "loss": 0.0132, + "epoch": 0.39, + "learning_rate": 0.0002412217283601818, + "loss": 0.0242, "step": 77670 }, { - "epoch": 0.84, - "learning_rate": 0.00017403515599662708, - "loss": 0.0162, + "epoch": 0.39, + "learning_rate": 0.0002412141606671678, + "loss": 0.0186, "step": 77680 }, { - "epoch": 0.84, - "learning_rate": 0.00017401894013102418, - "loss": 0.0156, + "epoch": 0.39, + "learning_rate": 0.00024120659297415377, + "loss": 0.0184, "step": 77690 }, { - "epoch": 0.84, - "learning_rate": 0.0001740027242654213, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024119902528113978, + "loss": 0.0165, "step": 77700 }, { - "epoch": 0.84, - "learning_rate": 0.00017398650839981836, - "loss": 0.0116, + "epoch": 0.39, + "learning_rate": 0.00024119145758812576, + "loss": 0.0163, "step": 77710 }, { - "epoch": 0.84, - "learning_rate": 0.00017397029253421546, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.00024118388989511174, + "loss": 0.0174, "step": 77720 }, { - "epoch": 0.84, - "learning_rate": 0.00017395407666861258, - "loss": 0.0177, + "epoch": 0.39, + "learning_rate": 0.00024117632220209775, + "loss": 0.0169, "step": 77730 }, { - "epoch": 0.84, - "learning_rate": 0.00017393786080300967, - "loss": 0.0177, + "epoch": 0.39, + "learning_rate": 0.00024116875450908373, + "loss": 0.0202, "step": 77740 }, { - "epoch": 0.84, - "learning_rate": 0.00017392164493740673, - "loss": 0.0167, + "epoch": 0.39, + "learning_rate": 0.0002411611868160697, + "loss": 0.0165, "step": 77750 }, { - "epoch": 0.84, - "learning_rate": 0.00017390542907180383, - "loss": 0.0143, + "epoch": 0.39, + "learning_rate": 0.00024115361912305572, + "loss": 0.0176, "step": 77760 }, { - "epoch": 0.84, - "learning_rate": 0.00017388921320620095, - "loss": 0.0167, + "epoch": 0.39, + "learning_rate": 0.0002411460514300417, + "loss": 0.0178, "step": 77770 }, { - "epoch": 0.84, - "learning_rate": 0.00017387299734059804, - "loss": 0.0106, + "epoch": 0.39, + "learning_rate": 0.00024113848373702768, + "loss": 0.0193, "step": 77780 }, { - "epoch": 0.84, - "learning_rate": 0.0001738567814749951, - "loss": 0.0167, + "epoch": 0.39, + "learning_rate": 0.00024113091604401366, + "loss": 0.0189, "step": 77790 }, { - "epoch": 0.84, - "learning_rate": 0.00017384056560939222, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024112334835099967, + "loss": 0.0208, "step": 77800 }, { - "epoch": 0.84, - "learning_rate": 0.00017382434974378932, - "loss": 0.0165, + "epoch": 0.39, + "learning_rate": 0.00024111578065798565, + "loss": 0.0158, "step": 77810 }, { - "epoch": 0.84, - "learning_rate": 0.0001738081338781864, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024110821296497164, + "loss": 0.0181, "step": 77820 }, { - "epoch": 0.84, - "learning_rate": 0.00017379191801258348, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.00024110064527195764, + "loss": 0.0172, "step": 77830 }, { - "epoch": 0.84, - "learning_rate": 0.0001737757021469806, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.00024109307757894363, + "loss": 0.0158, "step": 77840 }, { - "epoch": 0.84, - "learning_rate": 0.0001737594862813777, - "loss": 0.0176, + "epoch": 0.39, + "learning_rate": 0.0002410855098859296, + "loss": 0.0172, "step": 77850 }, { - "epoch": 0.84, - "learning_rate": 0.00017374327041577478, - "loss": 0.0175, + "epoch": 0.39, + "learning_rate": 0.00024107794219291562, + "loss": 0.0149, "step": 77860 }, { - "epoch": 0.84, - "learning_rate": 0.00017372705455017187, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.0002410703744999016, + "loss": 0.0178, "step": 77870 }, { - "epoch": 0.84, - "learning_rate": 0.00017371083868456897, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.00024106280680688758, + "loss": 0.0178, "step": 77880 }, { - "epoch": 0.84, - "learning_rate": 0.00017369462281896606, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.0002410552391138736, + "loss": 0.0159, "step": 77890 }, { - "epoch": 0.84, - "learning_rate": 0.00017367840695336318, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.00024104767142085957, + "loss": 0.0159, "step": 77900 }, { - "epoch": 0.84, - "learning_rate": 0.00017366219108776024, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024104010372784555, + "loss": 0.0179, "step": 77910 }, { - "epoch": 0.84, - "learning_rate": 0.00017364597522215734, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024103253603483156, + "loss": 0.0185, "step": 77920 }, { - "epoch": 0.84, - "learning_rate": 0.00017362975935655443, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.00024102496834181754, + "loss": 0.017, "step": 77930 }, { - "epoch": 0.84, - "learning_rate": 0.00017361354349095155, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.00024101740064880352, + "loss": 0.0189, "step": 77940 }, { - "epoch": 0.84, - "learning_rate": 0.00017359732762534862, - "loss": 0.0137, + "epoch": 0.39, + "learning_rate": 0.00024100983295578953, + "loss": 0.015, "step": 77950 }, { - "epoch": 0.84, - "learning_rate": 0.0001735811117597457, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.0002410022652627755, + "loss": 0.0157, "step": 77960 }, { - "epoch": 0.84, - "learning_rate": 0.00017356489589414283, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.0002409946975697615, + "loss": 0.0185, "step": 77970 }, { - "epoch": 0.84, - "learning_rate": 0.00017354868002853992, - "loss": 0.0155, + "epoch": 0.39, + "learning_rate": 0.00024098712987674747, + "loss": 0.0163, "step": 77980 }, { - "epoch": 0.84, - "learning_rate": 0.00017353246416293699, - "loss": 0.0156, + "epoch": 0.39, + "learning_rate": 0.00024097956218373348, + "loss": 0.0163, "step": 77990 }, { - "epoch": 0.84, - "learning_rate": 0.0001735162482973341, - "loss": 0.0169, + "epoch": 0.39, + "learning_rate": 0.00024097199449071946, + "loss": 0.0178, "step": 78000 }, { - "epoch": 0.84, - "eval_cer": 0.9215347519356817, - "eval_loss": 0.00994004588574171, - "eval_runtime": 121.1288, - "eval_samples_per_second": 16.511, - "eval_steps_per_second": 4.128, + "epoch": 0.39, + "eval_cer": 0.9145148941249307, + "eval_loss": 0.012463193386793137, + "eval_runtime": 116.5238, + "eval_samples_per_second": 17.164, + "eval_steps_per_second": 4.291, "step": 78000 }, { - "epoch": 0.84, - "learning_rate": 0.0001735000324317312, - "loss": 0.0134, + "epoch": 0.39, + "learning_rate": 0.00024096442679770545, + "loss": 0.0181, "step": 78010 }, { - "epoch": 0.84, - "learning_rate": 0.0001734838165661283, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.00024095685910469145, + "loss": 0.016, "step": 78020 }, { - "epoch": 0.84, - "learning_rate": 0.00017346760070052536, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024094929141167744, + "loss": 0.019, "step": 78030 }, { - "epoch": 0.84, - "learning_rate": 0.00017345138483492248, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.00024094172371866342, + "loss": 0.0137, "step": 78040 }, { - "epoch": 0.84, - "learning_rate": 0.00017343516896931957, - "loss": 0.0143, + "epoch": 0.39, + "learning_rate": 0.00024093415602564943, + "loss": 0.0163, "step": 78050 }, { - "epoch": 0.84, - "learning_rate": 0.00017341895310371666, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.0002409265883326354, + "loss": 0.0176, "step": 78060 }, { - "epoch": 0.84, - "learning_rate": 0.00017340273723811376, - "loss": 0.0135, + "epoch": 0.39, + "learning_rate": 0.0002409190206396214, + "loss": 0.0183, "step": 78070 }, { - "epoch": 0.84, - "learning_rate": 0.00017338652137251085, - "loss": 0.0119, + "epoch": 0.39, + "learning_rate": 0.0002409114529466074, + "loss": 0.0196, "step": 78080 }, { - "epoch": 0.84, - "learning_rate": 0.00017337030550690794, - "loss": 0.0163, + "epoch": 0.39, + "learning_rate": 0.00024090388525359338, + "loss": 0.0175, "step": 78090 }, { - "epoch": 0.84, - "learning_rate": 0.00017335408964130506, - "loss": 0.0153, + "epoch": 0.39, + "learning_rate": 0.00024089631756057936, + "loss": 0.0183, "step": 78100 }, { - "epoch": 0.84, - "learning_rate": 0.00017333787377570213, - "loss": 0.0164, + "epoch": 0.39, + "learning_rate": 0.00024088874986756537, + "loss": 0.0202, "step": 78110 }, { - "epoch": 0.84, - "learning_rate": 0.00017332165791009922, - "loss": 0.0155, + "epoch": 0.39, + "learning_rate": 0.00024088118217455135, + "loss": 0.0204, "step": 78120 }, { - "epoch": 0.84, - "learning_rate": 0.0001733054420444963, - "loss": 0.0121, + "epoch": 0.39, + "learning_rate": 0.00024087361448153733, + "loss": 0.0167, "step": 78130 }, { - "epoch": 0.84, - "learning_rate": 0.00017328922617889343, - "loss": 0.0121, + "epoch": 0.39, + "learning_rate": 0.0002408660467885233, + "loss": 0.0173, "step": 78140 }, { - "epoch": 0.84, - "learning_rate": 0.0001732730103132905, - "loss": 0.0183, + "epoch": 0.39, + "learning_rate": 0.00024085847909550932, + "loss": 0.0217, "step": 78150 }, { - "epoch": 0.84, - "learning_rate": 0.0001732567944476876, + "epoch": 0.39, + "learning_rate": 0.0002408509114024953, "loss": 0.0189, "step": 78160 }, { - "epoch": 0.85, - "learning_rate": 0.0001732405785820847, - "loss": 0.0168, + "epoch": 0.39, + "learning_rate": 0.00024084334370948128, + "loss": 0.0177, "step": 78170 }, { - "epoch": 0.85, - "learning_rate": 0.0001732243627164818, - "loss": 0.0151, + "epoch": 0.39, + "learning_rate": 0.0002408357760164673, + "loss": 0.0162, "step": 78180 }, { - "epoch": 0.85, - "learning_rate": 0.00017320814685087887, - "loss": 0.0166, + "epoch": 0.39, + "learning_rate": 0.00024082820832345327, + "loss": 0.0171, "step": 78190 }, { - "epoch": 0.85, - "learning_rate": 0.00017319193098527596, - "loss": 0.0145, + "epoch": 0.39, + "learning_rate": 0.00024082064063043926, + "loss": 0.0177, "step": 78200 }, { - "epoch": 0.85, - "learning_rate": 0.00017317571511967308, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024081307293742526, + "loss": 0.018, "step": 78210 }, { - "epoch": 0.85, - "learning_rate": 0.00017315949925407017, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024080550524441125, + "loss": 0.0202, "step": 78220 }, { - "epoch": 0.85, - "learning_rate": 0.00017314328338846724, - "loss": 0.0152, + "epoch": 0.39, + "learning_rate": 0.00024079793755139723, + "loss": 0.015, "step": 78230 }, { - "epoch": 0.85, - "learning_rate": 0.00017312706752286436, - "loss": 0.0146, + "epoch": 0.39, + "learning_rate": 0.00024079036985838324, + "loss": 0.0211, "step": 78240 }, { - "epoch": 0.85, - "learning_rate": 0.00017311085165726145, - "loss": 0.0147, + "epoch": 0.39, + "learning_rate": 0.00024078280216536922, + "loss": 0.0216, "step": 78250 }, { - "epoch": 0.85, - "learning_rate": 0.00017309463579165854, - "loss": 0.0105, + "epoch": 0.39, + "learning_rate": 0.0002407752344723552, + "loss": 0.015, "step": 78260 }, { - "epoch": 0.85, - "learning_rate": 0.0001730784199260556, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.0002407676667793412, + "loss": 0.017, "step": 78270 }, { - "epoch": 0.85, - "learning_rate": 0.00017306220406045273, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.0002407600990863272, + "loss": 0.0243, "step": 78280 }, { - "epoch": 0.85, - "learning_rate": 0.00017304598819484982, - "loss": 0.0181, + "epoch": 0.39, + "learning_rate": 0.00024075253139331317, + "loss": 0.0165, "step": 78290 }, { - "epoch": 0.85, - "learning_rate": 0.00017302977232924694, - "loss": 0.0102, + "epoch": 0.4, + "learning_rate": 0.00024074496370029915, + "loss": 0.0172, "step": 78300 }, { - "epoch": 0.85, - "learning_rate": 0.000173013556463644, - "loss": 0.0165, + "epoch": 0.4, + "learning_rate": 0.00024073739600728516, + "loss": 0.0185, "step": 78310 }, { - "epoch": 0.85, - "learning_rate": 0.0001729973405980411, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00024072982831427114, + "loss": 0.0184, "step": 78320 }, { - "epoch": 0.85, - "learning_rate": 0.0001729811247324382, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.00024072226062125712, + "loss": 0.019, "step": 78330 }, { - "epoch": 0.85, - "learning_rate": 0.00017296490886683531, - "loss": 0.0156, + "epoch": 0.4, + "learning_rate": 0.00024071469292824313, + "loss": 0.0224, "step": 78340 }, { - "epoch": 0.85, - "learning_rate": 0.00017294869300123238, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.0002407071252352291, + "loss": 0.0212, "step": 78350 }, { - "epoch": 0.85, - "learning_rate": 0.00017293247713562947, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.0002406995575422151, + "loss": 0.0187, "step": 78360 }, { - "epoch": 0.85, - "learning_rate": 0.0001729162612700266, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.0002406919898492011, + "loss": 0.0203, "step": 78370 }, { - "epoch": 0.85, - "learning_rate": 0.00017290004540442368, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.00024068442215618708, + "loss": 0.0144, "step": 78380 }, { - "epoch": 0.85, - "learning_rate": 0.00017288382953882075, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00024067685446317307, + "loss": 0.016, "step": 78390 }, { - "epoch": 0.85, - "learning_rate": 0.00017286761367321784, - "loss": 0.0158, + "epoch": 0.4, + "learning_rate": 0.00024066928677015907, + "loss": 0.0171, "step": 78400 }, { - "epoch": 0.85, - "learning_rate": 0.00017285139780761496, - "loss": 0.011, + "epoch": 0.4, + "learning_rate": 0.00024066171907714506, + "loss": 0.0171, "step": 78410 }, { - "epoch": 0.85, - "learning_rate": 0.00017283518194201206, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.00024065415138413104, + "loss": 0.0146, "step": 78420 }, { - "epoch": 0.85, - "learning_rate": 0.00017281896607640915, - "loss": 0.0147, + "epoch": 0.4, + "learning_rate": 0.00024064658369111705, + "loss": 0.0157, "step": 78430 }, { - "epoch": 0.85, - "learning_rate": 0.00017280275021080624, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.00024063901599810303, + "loss": 0.0161, "step": 78440 }, { - "epoch": 0.85, - "learning_rate": 0.00017278653434520333, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.000240631448305089, + "loss": 0.0175, "step": 78450 }, { - "epoch": 0.85, - "learning_rate": 0.00017277031847960043, - "loss": 0.0161, + "epoch": 0.4, + "learning_rate": 0.00024062388061207502, + "loss": 0.0152, "step": 78460 }, { - "epoch": 0.85, - "learning_rate": 0.00017275410261399755, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.000240616312919061, + "loss": 0.0184, "step": 78470 }, { - "epoch": 0.85, - "learning_rate": 0.0001727378867483946, - "loss": 0.0105, + "epoch": 0.4, + "learning_rate": 0.00024060874522604698, + "loss": 0.0223, "step": 78480 }, { - "epoch": 0.85, - "learning_rate": 0.0001727216708827917, - "loss": 0.0136, + "epoch": 0.4, + "learning_rate": 0.00024060117753303296, + "loss": 0.027, "step": 78490 }, { - "epoch": 0.85, - "learning_rate": 0.0001727054550171888, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.00024059360984001897, + "loss": 0.0212, "step": 78500 }, { - "epoch": 0.85, - "learning_rate": 0.00017268923915158592, - "loss": 0.0118, + "epoch": 0.4, + "learning_rate": 0.00024058604214700495, + "loss": 0.0158, "step": 78510 }, { - "epoch": 0.85, - "learning_rate": 0.00017267302328598298, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.00024057847445399093, + "loss": 0.0192, "step": 78520 }, { - "epoch": 0.85, - "learning_rate": 0.00017265680742038008, - "loss": 0.015, + "epoch": 0.4, + "learning_rate": 0.00024057090676097694, + "loss": 0.0138, "step": 78530 }, { - "epoch": 0.85, - "learning_rate": 0.0001726405915547772, - "loss": 0.0159, + "epoch": 0.4, + "learning_rate": 0.00024056333906796292, + "loss": 0.0198, "step": 78540 }, { - "epoch": 0.85, - "learning_rate": 0.0001726243756891743, - "loss": 0.0165, + "epoch": 0.4, + "learning_rate": 0.0002405557713749489, + "loss": 0.0174, "step": 78550 }, { - "epoch": 0.85, - "learning_rate": 0.00017260815982357135, - "loss": 0.0151, + "epoch": 0.4, + "learning_rate": 0.00024054820368193486, + "loss": 0.019, "step": 78560 }, { - "epoch": 0.85, - "learning_rate": 0.00017259194395796845, - "loss": 0.0167, + "epoch": 0.4, + "learning_rate": 0.00024054063598892087, + "loss": 0.0217, "step": 78570 }, { - "epoch": 0.85, - "learning_rate": 0.00017257572809236557, - "loss": 0.0117, + "epoch": 0.4, + "learning_rate": 0.00024053306829590685, + "loss": 0.0209, "step": 78580 }, { - "epoch": 0.85, - "learning_rate": 0.00017255951222676266, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.00024052550060289283, + "loss": 0.0179, "step": 78590 }, { - "epoch": 0.85, - "learning_rate": 0.00017254329636115973, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00024051793290987884, + "loss": 0.0198, "step": 78600 }, { - "epoch": 0.85, - "learning_rate": 0.00017252708049555684, - "loss": 0.016, + "epoch": 0.4, + "learning_rate": 0.00024051036521686482, + "loss": 0.0189, "step": 78610 }, { - "epoch": 0.85, - "learning_rate": 0.00017251086462995394, - "loss": 0.0151, + "epoch": 0.4, + "learning_rate": 0.0002405027975238508, + "loss": 0.0174, "step": 78620 }, { - "epoch": 0.85, - "learning_rate": 0.00017249464876435103, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.0002404952298308368, + "loss": 0.0171, "step": 78630 }, { - "epoch": 0.85, - "learning_rate": 0.0001724784328987481, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.0002404876621378228, + "loss": 0.0176, "step": 78640 }, { - "epoch": 0.85, - "learning_rate": 0.00017246221703314522, - "loss": 0.0142, + "epoch": 0.4, + "learning_rate": 0.00024048009444480877, + "loss": 0.0177, "step": 78650 }, { - "epoch": 0.85, - "learning_rate": 0.0001724460011675423, - "loss": 0.0123, + "epoch": 0.4, + "learning_rate": 0.00024047252675179478, + "loss": 0.0181, "step": 78660 }, { - "epoch": 0.85, - "learning_rate": 0.00017242978530193943, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00024046495905878076, + "loss": 0.0197, "step": 78670 }, { - "epoch": 0.85, - "learning_rate": 0.0001724135694363365, - "loss": 0.0108, + "epoch": 0.4, + "learning_rate": 0.00024045739136576674, + "loss": 0.0211, "step": 78680 }, { - "epoch": 0.85, - "learning_rate": 0.0001723973535707336, - "loss": 0.0115, + "epoch": 0.4, + "learning_rate": 0.00024044982367275273, + "loss": 0.0175, "step": 78690 }, { - "epoch": 0.85, - "learning_rate": 0.00017238113770513068, - "loss": 0.0113, + "epoch": 0.4, + "learning_rate": 0.00024044225597973873, + "loss": 0.0195, "step": 78700 }, { - "epoch": 0.85, - "learning_rate": 0.0001723649218395278, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.00024043468828672472, + "loss": 0.0188, "step": 78710 }, { - "epoch": 0.85, - "learning_rate": 0.00017234870597392487, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.0002404271205937107, + "loss": 0.0165, "step": 78720 }, { - "epoch": 0.85, - "learning_rate": 0.00017233249010832196, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.0002404195529006967, + "loss": 0.0172, "step": 78730 }, { - "epoch": 0.85, - "learning_rate": 0.00017231627424271908, - "loss": 0.0162, + "epoch": 0.4, + "learning_rate": 0.0002404119852076827, + "loss": 0.019, "step": 78740 }, { - "epoch": 0.85, - "learning_rate": 0.00017230005837711617, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00024040441751466867, + "loss": 0.0166, "step": 78750 }, { - "epoch": 0.85, - "learning_rate": 0.00017228384251151324, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00024039684982165468, + "loss": 0.0156, "step": 78760 }, { - "epoch": 0.85, - "learning_rate": 0.00017226762664591033, - "loss": 0.0142, + "epoch": 0.4, + "learning_rate": 0.00024038928212864066, + "loss": 0.0173, "step": 78770 }, { - "epoch": 0.85, - "learning_rate": 0.00017225141078030745, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00024038171443562664, + "loss": 0.0184, "step": 78780 }, { - "epoch": 0.85, - "learning_rate": 0.00017223519491470454, - "loss": 0.0121, + "epoch": 0.4, + "learning_rate": 0.00024037414674261265, + "loss": 0.0189, "step": 78790 }, { - "epoch": 0.85, - "learning_rate": 0.0001722189790491016, - "loss": 0.0146, + "epoch": 0.4, + "learning_rate": 0.00024036657904959863, + "loss": 0.0171, "step": 78800 }, { - "epoch": 0.85, - "learning_rate": 0.00017220276318349873, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.0002403590113565846, + "loss": 0.0196, "step": 78810 }, { - "epoch": 0.85, - "learning_rate": 0.00017218654731789582, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.00024035144366357062, + "loss": 0.0153, "step": 78820 }, { - "epoch": 0.85, - "learning_rate": 0.0001721703314522929, - "loss": 0.0154, + "epoch": 0.4, + "learning_rate": 0.0002403438759705566, + "loss": 0.0188, "step": 78830 }, { - "epoch": 0.85, - "learning_rate": 0.00017215411558668998, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.00024033630827754258, + "loss": 0.0178, "step": 78840 }, { - "epoch": 0.85, - "learning_rate": 0.0001721378997210871, - "loss": 0.0148, + "epoch": 0.4, + "learning_rate": 0.0002403287405845286, + "loss": 0.0221, "step": 78850 }, { - "epoch": 0.85, - "learning_rate": 0.0001721216838554842, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00024032117289151457, + "loss": 0.0166, "step": 78860 }, { - "epoch": 0.85, - "learning_rate": 0.00017210546798988128, - "loss": 0.0144, + "epoch": 0.4, + "learning_rate": 0.00024031360519850055, + "loss": 0.0216, "step": 78870 }, { - "epoch": 0.85, - "learning_rate": 0.00017208925212427838, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.00024030603750548654, + "loss": 0.0176, "step": 78880 }, { - "epoch": 0.85, - "learning_rate": 0.00017207303625867547, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00024029846981247254, + "loss": 0.0192, "step": 78890 }, { - "epoch": 0.85, - "learning_rate": 0.00017205682039307256, - "loss": 0.011, + "epoch": 0.4, + "learning_rate": 0.00024029090211945853, + "loss": 0.0182, "step": 78900 }, { - "epoch": 0.85, - "learning_rate": 0.00017204060452746968, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.0002402833344264445, + "loss": 0.0208, "step": 78910 }, { - "epoch": 0.85, - "learning_rate": 0.00017202438866186675, - "loss": 0.0218, + "epoch": 0.4, + "learning_rate": 0.00024027576673343052, + "loss": 0.0182, "step": 78920 }, { - "epoch": 0.85, - "learning_rate": 0.00017200817279626384, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.0002402681990404165, + "loss": 0.0192, "step": 78930 }, { - "epoch": 0.85, - "learning_rate": 0.00017199195693066093, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00024026063134740248, + "loss": 0.0141, "step": 78940 }, { - "epoch": 0.85, - "learning_rate": 0.00017197574106505805, - "loss": 0.0154, + "epoch": 0.4, + "learning_rate": 0.0002402530636543885, + "loss": 0.0166, "step": 78950 }, { - "epoch": 0.85, - "learning_rate": 0.00017195952519945512, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.00024024549596137447, + "loss": 0.0179, "step": 78960 }, { - "epoch": 0.85, - "learning_rate": 0.0001719433093338522, - "loss": 0.011, + "epoch": 0.4, + "learning_rate": 0.00024023792826836045, + "loss": 0.0154, "step": 78970 }, { - "epoch": 0.85, - "learning_rate": 0.00017192709346824933, - "loss": 0.0168, + "epoch": 0.4, + "learning_rate": 0.00024023036057534646, + "loss": 0.0157, "step": 78980 }, { - "epoch": 0.85, - "learning_rate": 0.00017191087760264642, - "loss": 0.0151, + "epoch": 0.4, + "learning_rate": 0.00024022279288233244, + "loss": 0.0167, "step": 78990 }, { - "epoch": 0.85, - "learning_rate": 0.0001718946617370435, - "loss": 0.0118, + "epoch": 0.4, + "learning_rate": 0.00024021522518931842, + "loss": 0.0181, "step": 79000 }, { - "epoch": 0.85, - "eval_cer": 0.9215269345090743, - "eval_loss": 0.010222644545137882, - "eval_runtime": 121.2156, - "eval_samples_per_second": 16.5, - "eval_steps_per_second": 4.125, + "epoch": 0.4, + "eval_cer": 0.914508101352053, + "eval_loss": 0.012615088373422623, + "eval_runtime": 116.5859, + "eval_samples_per_second": 17.155, + "eval_steps_per_second": 4.289, "step": 79000 }, { - "epoch": 0.85, - "learning_rate": 0.0001718784458714406, - "loss": 0.0163, + "epoch": 0.4, + "learning_rate": 0.00024020765749630443, + "loss": 0.0181, "step": 79010 }, { - "epoch": 0.85, - "learning_rate": 0.0001718622300058377, - "loss": 0.0147, + "epoch": 0.4, + "learning_rate": 0.0002402000898032904, + "loss": 0.0182, "step": 79020 }, { - "epoch": 0.85, - "learning_rate": 0.0001718460141402348, - "loss": 0.0117, + "epoch": 0.4, + "learning_rate": 0.0002401925221102764, + "loss": 0.0178, "step": 79030 }, { - "epoch": 0.85, - "learning_rate": 0.00017182979827463186, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00024018495441726237, + "loss": 0.019, "step": 79040 }, { - "epoch": 0.85, - "learning_rate": 0.00017181358240902898, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.00024017738672424838, + "loss": 0.0146, "step": 79050 }, { - "epoch": 0.85, - "learning_rate": 0.00017179736654342607, - "loss": 0.0142, + "epoch": 0.4, + "learning_rate": 0.00024016981903123436, + "loss": 0.0158, "step": 79060 }, { - "epoch": 0.85, - "learning_rate": 0.00017178115067782317, - "loss": 0.0142, + "epoch": 0.4, + "learning_rate": 0.00024016225133822035, + "loss": 0.018, "step": 79070 }, { - "epoch": 0.85, - "learning_rate": 0.00017176493481222026, - "loss": 0.0154, + "epoch": 0.4, + "learning_rate": 0.00024015468364520635, + "loss": 0.0188, "step": 79080 }, { - "epoch": 0.86, - "learning_rate": 0.00017174871894661735, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00024014711595219234, + "loss": 0.0198, "step": 79090 }, { - "epoch": 0.86, - "learning_rate": 0.00017173250308101444, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.00024013954825917832, + "loss": 0.02, "step": 79100 }, { - "epoch": 0.86, - "learning_rate": 0.00017171628721541156, - "loss": 0.016, + "epoch": 0.4, + "learning_rate": 0.00024013198056616433, + "loss": 0.0146, "step": 79110 }, { - "epoch": 0.86, - "learning_rate": 0.00017170007134980863, - "loss": 0.0166, + "epoch": 0.4, + "learning_rate": 0.0002401244128731503, + "loss": 0.0169, "step": 79120 }, { - "epoch": 0.86, - "learning_rate": 0.00017168385548420572, - "loss": 0.0118, + "epoch": 0.4, + "learning_rate": 0.0002401168451801363, + "loss": 0.0132, "step": 79130 }, { - "epoch": 0.86, - "learning_rate": 0.00017166763961860281, - "loss": 0.019, + "epoch": 0.4, + "learning_rate": 0.0002401092774871223, + "loss": 0.0181, "step": 79140 }, { - "epoch": 0.86, - "learning_rate": 0.00017165142375299993, - "loss": 0.0133, + "epoch": 0.4, + "learning_rate": 0.00024010170979410828, + "loss": 0.019, "step": 79150 }, { - "epoch": 0.86, - "learning_rate": 0.00017163520788739703, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.00024009414210109426, + "loss": 0.022, "step": 79160 }, { - "epoch": 0.86, - "learning_rate": 0.0001716189920217941, - "loss": 0.0187, + "epoch": 0.4, + "learning_rate": 0.00024008657440808027, + "loss": 0.02, "step": 79170 }, { - "epoch": 0.86, - "learning_rate": 0.0001716027761561912, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.00024007900671506625, + "loss": 0.0159, "step": 79180 }, { - "epoch": 0.86, - "learning_rate": 0.0001715865602905883, - "loss": 0.0122, + "epoch": 0.4, + "learning_rate": 0.00024007143902205223, + "loss": 0.0208, "step": 79190 }, { - "epoch": 0.86, - "learning_rate": 0.0001715703444249854, - "loss": 0.0137, + "epoch": 0.4, + "learning_rate": 0.0002400638713290382, + "loss": 0.0177, "step": 79200 }, { - "epoch": 0.86, - "learning_rate": 0.00017155412855938246, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.00024005630363602422, + "loss": 0.0155, "step": 79210 }, { - "epoch": 0.86, - "learning_rate": 0.00017153791269377958, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.0002400487359430102, + "loss": 0.0171, "step": 79220 }, { - "epoch": 0.86, - "learning_rate": 0.00017152169682817668, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00024004116824999618, + "loss": 0.0201, "step": 79230 }, { - "epoch": 0.86, - "learning_rate": 0.00017150548096257377, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.0002400336005569822, + "loss": 0.0184, "step": 79240 }, { - "epoch": 0.86, - "learning_rate": 0.00017148926509697086, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00024002603286396817, + "loss": 0.021, "step": 79250 }, { - "epoch": 0.86, - "learning_rate": 0.00017147304923136795, - "loss": 0.0123, + "epoch": 0.4, + "learning_rate": 0.00024001846517095416, + "loss": 0.0165, "step": 79260 }, { - "epoch": 0.86, - "learning_rate": 0.00017145683336576505, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.00024001089747794016, + "loss": 0.0173, "step": 79270 }, { - "epoch": 0.86, - "learning_rate": 0.00017144061750016217, - "loss": 0.0105, + "epoch": 0.4, + "learning_rate": 0.00024000332978492615, + "loss": 0.0199, "step": 79280 }, { - "epoch": 0.86, - "learning_rate": 0.00017142440163455923, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.00023999576209191213, + "loss": 0.019, "step": 79290 }, { - "epoch": 0.86, - "learning_rate": 0.00017140818576895633, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00023998819439889814, + "loss": 0.018, "step": 79300 }, { - "epoch": 0.86, - "learning_rate": 0.00017139196990335345, - "loss": 0.015, + "epoch": 0.4, + "learning_rate": 0.00023998062670588412, + "loss": 0.0199, "step": 79310 }, { - "epoch": 0.86, - "learning_rate": 0.00017137575403775054, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.0002399730590128701, + "loss": 0.017, "step": 79320 }, { - "epoch": 0.86, - "learning_rate": 0.0001713595381721476, - "loss": 0.0149, + "epoch": 0.4, + "learning_rate": 0.0002399654913198561, + "loss": 0.0181, "step": 79330 }, { - "epoch": 0.86, - "learning_rate": 0.0001713433223065447, - "loss": 0.0136, + "epoch": 0.4, + "learning_rate": 0.0002399579236268421, + "loss": 0.0147, "step": 79340 }, { - "epoch": 0.86, - "learning_rate": 0.00017132710644094182, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.00023995035593382807, + "loss": 0.0157, "step": 79350 }, { - "epoch": 0.86, - "learning_rate": 0.0001713108905753389, - "loss": 0.0164, + "epoch": 0.4, + "learning_rate": 0.00023994278824081408, + "loss": 0.0157, "step": 79360 }, { - "epoch": 0.86, - "learning_rate": 0.00017129467470973597, - "loss": 0.0175, + "epoch": 0.4, + "learning_rate": 0.00023993522054780006, + "loss": 0.0178, "step": 79370 }, { - "epoch": 0.86, - "learning_rate": 0.0001712784588441331, - "loss": 0.0123, + "epoch": 0.4, + "learning_rate": 0.00023992765285478604, + "loss": 0.0152, "step": 79380 }, { - "epoch": 0.86, - "learning_rate": 0.0001712622429785302, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00023992008516177202, + "loss": 0.0155, "step": 79390 }, { - "epoch": 0.86, - "learning_rate": 0.00017124602711292728, - "loss": 0.0144, + "epoch": 0.4, + "learning_rate": 0.00023991251746875803, + "loss": 0.017, "step": 79400 }, { - "epoch": 0.86, - "learning_rate": 0.00017122981124732435, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.000239904949775744, + "loss": 0.0179, "step": 79410 }, { - "epoch": 0.86, - "learning_rate": 0.00017121359538172147, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.00023989738208273, + "loss": 0.0212, "step": 79420 }, { - "epoch": 0.86, - "learning_rate": 0.00017119737951611856, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.000239889814389716, + "loss": 0.0262, "step": 79430 }, { - "epoch": 0.86, - "learning_rate": 0.00017118116365051565, - "loss": 0.0142, + "epoch": 0.4, + "learning_rate": 0.00023988224669670198, + "loss": 0.0186, "step": 79440 }, { - "epoch": 0.86, - "learning_rate": 0.00017116494778491274, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00023987467900368797, + "loss": 0.0187, "step": 79450 }, { - "epoch": 0.86, - "learning_rate": 0.00017114873191930984, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00023986711131067397, + "loss": 0.0218, "step": 79460 }, { - "epoch": 0.86, - "learning_rate": 0.00017113251605370693, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00023985954361765996, + "loss": 0.0167, "step": 79470 }, { - "epoch": 0.86, - "learning_rate": 0.00017111630018810405, - "loss": 0.0148, + "epoch": 0.4, + "learning_rate": 0.00023985197592464594, + "loss": 0.02, "step": 79480 }, { - "epoch": 0.86, - "learning_rate": 0.00017110008432250111, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.00023984440823163195, + "loss": 0.0144, "step": 79490 }, { - "epoch": 0.86, - "learning_rate": 0.0001710838684568982, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.00023983684053861793, + "loss": 0.0187, "step": 79500 }, { - "epoch": 0.86, - "learning_rate": 0.0001710676525912953, - "loss": 0.0152, + "epoch": 0.4, + "learning_rate": 0.0002398292728456039, + "loss": 0.0156, "step": 79510 }, { - "epoch": 0.86, - "learning_rate": 0.00017105143672569242, - "loss": 0.0117, + "epoch": 0.4, + "learning_rate": 0.00023982170515258992, + "loss": 0.0184, "step": 79520 }, { - "epoch": 0.86, - "learning_rate": 0.00017103522086008949, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.0002398141374595759, + "loss": 0.0161, "step": 79530 }, { - "epoch": 0.86, - "learning_rate": 0.00017101900499448658, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.00023980656976656188, + "loss": 0.0204, "step": 79540 }, { - "epoch": 0.86, - "learning_rate": 0.0001710027891288837, - "loss": 0.0163, + "epoch": 0.4, + "learning_rate": 0.00023979900207354786, + "loss": 0.0165, "step": 79550 }, { - "epoch": 0.86, - "learning_rate": 0.0001709865732632808, - "loss": 0.0131, + "epoch": 0.4, + "learning_rate": 0.00023979143438053387, + "loss": 0.0173, "step": 79560 }, { - "epoch": 0.86, - "learning_rate": 0.00017097035739767786, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.00023978386668751985, + "loss": 0.0168, "step": 79570 }, { - "epoch": 0.86, - "learning_rate": 0.00017095414153207495, - "loss": 0.0141, + "epoch": 0.4, + "learning_rate": 0.00023977629899450583, + "loss": 0.0165, "step": 79580 }, { - "epoch": 0.86, - "learning_rate": 0.00017093792566647207, - "loss": 0.0153, + "epoch": 0.4, + "learning_rate": 0.00023976873130149184, + "loss": 0.0189, "step": 79590 }, { - "epoch": 0.86, - "learning_rate": 0.00017092170980086916, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.00023976116360847782, + "loss": 0.0212, "step": 79600 }, { - "epoch": 0.86, - "learning_rate": 0.00017090549393526623, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.0002397535959154638, + "loss": 0.0217, "step": 79610 }, { - "epoch": 0.86, - "learning_rate": 0.00017088927806966335, - "loss": 0.0146, + "epoch": 0.4, + "learning_rate": 0.0002397460282224498, + "loss": 0.02, "step": 79620 }, { - "epoch": 0.86, - "learning_rate": 0.00017087306220406044, - "loss": 0.0122, + "epoch": 0.4, + "learning_rate": 0.0002397384605294358, + "loss": 0.0183, "step": 79630 }, { - "epoch": 0.86, - "learning_rate": 0.00017085684633845753, - "loss": 0.0161, + "epoch": 0.4, + "learning_rate": 0.00023973089283642178, + "loss": 0.0191, "step": 79640 }, { - "epoch": 0.86, - "learning_rate": 0.0001708406304728546, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.00023972332514340778, + "loss": 0.0192, "step": 79650 }, { - "epoch": 0.86, - "learning_rate": 0.00017082441460725172, - "loss": 0.015, + "epoch": 0.4, + "learning_rate": 0.00023971575745039377, + "loss": 0.021, "step": 79660 }, { - "epoch": 0.86, - "learning_rate": 0.0001708081987416488, - "loss": 0.0102, + "epoch": 0.4, + "learning_rate": 0.00023970818975737975, + "loss": 0.0147, "step": 79670 }, { - "epoch": 0.86, - "learning_rate": 0.00017079198287604593, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00023970062206436576, + "loss": 0.0186, "step": 79680 }, { - "epoch": 0.86, - "learning_rate": 0.000170775767010443, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.00023969305437135174, + "loss": 0.0195, "step": 79690 }, { - "epoch": 0.86, - "learning_rate": 0.0001707595511448401, - "loss": 0.0136, + "epoch": 0.4, + "learning_rate": 0.00023968548667833772, + "loss": 0.0194, "step": 79700 }, { - "epoch": 0.86, - "learning_rate": 0.00017074333527923718, - "loss": 0.0145, + "epoch": 0.4, + "learning_rate": 0.0002396779189853237, + "loss": 0.0176, "step": 79710 }, { - "epoch": 0.86, - "learning_rate": 0.0001707271194136343, - "loss": 0.0163, + "epoch": 0.4, + "learning_rate": 0.0002396703512923097, + "loss": 0.0189, "step": 79720 }, { - "epoch": 0.86, - "learning_rate": 0.00017071090354803137, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.0002396627835992957, + "loss": 0.0164, "step": 79730 }, { - "epoch": 0.86, - "learning_rate": 0.00017069468768242846, - "loss": 0.0111, + "epoch": 0.4, + "learning_rate": 0.00023965521590628167, + "loss": 0.0141, "step": 79740 }, { - "epoch": 0.86, - "learning_rate": 0.00017067847181682558, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00023964764821326768, + "loss": 0.0162, "step": 79750 }, { - "epoch": 0.86, - "learning_rate": 0.00017066225595122267, - "loss": 0.0192, + "epoch": 0.4, + "learning_rate": 0.00023964008052025366, + "loss": 0.017, "step": 79760 }, { - "epoch": 0.86, - "learning_rate": 0.00017064604008561974, - "loss": 0.0165, + "epoch": 0.4, + "learning_rate": 0.00023963251282723964, + "loss": 0.0156, "step": 79770 }, { - "epoch": 0.86, - "learning_rate": 0.00017062982422001683, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00023962494513422565, + "loss": 0.0193, "step": 79780 }, { - "epoch": 0.86, - "learning_rate": 0.00017061360835441395, - "loss": 0.0154, + "epoch": 0.4, + "learning_rate": 0.00023961737744121163, + "loss": 0.0144, "step": 79790 }, { - "epoch": 0.86, - "learning_rate": 0.00017059739248881104, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00023960980974819761, + "loss": 0.0179, "step": 79800 }, { - "epoch": 0.86, - "learning_rate": 0.0001705811766232081, - "loss": 0.0167, + "epoch": 0.4, + "learning_rate": 0.00023960224205518362, + "loss": 0.0191, "step": 79810 }, { - "epoch": 0.86, - "learning_rate": 0.00017056496075760523, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00023959467436216958, + "loss": 0.019, "step": 79820 }, { - "epoch": 0.86, - "learning_rate": 0.00017054874489200232, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00023958710666915556, + "loss": 0.0188, "step": 79830 }, { - "epoch": 0.86, - "learning_rate": 0.00017053252902639941, - "loss": 0.0157, + "epoch": 0.4, + "learning_rate": 0.00023957953897614154, + "loss": 0.0194, "step": 79840 }, { - "epoch": 0.86, - "learning_rate": 0.00017051631316079653, - "loss": 0.0158, + "epoch": 0.4, + "learning_rate": 0.00023957197128312755, + "loss": 0.0162, "step": 79850 }, { - "epoch": 0.86, - "learning_rate": 0.0001705000972951936, - "loss": 0.0123, + "epoch": 0.4, + "learning_rate": 0.00023956440359011353, + "loss": 0.0175, "step": 79860 }, { - "epoch": 0.86, - "learning_rate": 0.0001704838814295907, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.0002395568358970995, + "loss": 0.0164, "step": 79870 }, { - "epoch": 0.86, - "learning_rate": 0.00017046766556398779, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00023954926820408552, + "loss": 0.0181, "step": 79880 }, { - "epoch": 0.86, - "learning_rate": 0.0001704514496983849, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.0002395417005110715, + "loss": 0.0226, "step": 79890 }, { - "epoch": 0.86, - "learning_rate": 0.00017043523383278197, - "loss": 0.0152, + "epoch": 0.4, + "learning_rate": 0.00023953413281805748, + "loss": 0.0207, "step": 79900 }, { - "epoch": 0.86, - "learning_rate": 0.00017041901796717906, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.0002395265651250435, + "loss": 0.018, "step": 79910 }, { - "epoch": 0.86, - "learning_rate": 0.00017040280210157618, - "loss": 0.0141, + "epoch": 0.4, + "learning_rate": 0.00023951899743202947, + "loss": 0.0194, "step": 79920 }, { - "epoch": 0.86, - "learning_rate": 0.00017038658623597328, - "loss": 0.0137, + "epoch": 0.4, + "learning_rate": 0.00023951142973901545, + "loss": 0.0228, "step": 79930 }, { - "epoch": 0.86, - "learning_rate": 0.00017037037037037034, - "loss": 0.0168, + "epoch": 0.4, + "learning_rate": 0.00023950386204600144, + "loss": 0.0186, "step": 79940 }, { - "epoch": 0.86, - "learning_rate": 0.00017035415450476744, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00023949629435298744, + "loss": 0.0176, "step": 79950 }, { - "epoch": 0.86, - "learning_rate": 0.00017033793863916455, - "loss": 0.0155, + "epoch": 0.4, + "learning_rate": 0.00023948872665997343, + "loss": 0.0185, "step": 79960 }, { - "epoch": 0.86, - "learning_rate": 0.00017032172277356165, - "loss": 0.0136, + "epoch": 0.4, + "learning_rate": 0.0002394811589669594, + "loss": 0.0174, "step": 79970 }, { - "epoch": 0.86, - "learning_rate": 0.0001703055069079587, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.00023947359127394542, + "loss": 0.0178, "step": 79980 }, { - "epoch": 0.86, - "learning_rate": 0.00017028929104235583, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.0002394660235809314, + "loss": 0.0189, "step": 79990 }, { - "epoch": 0.86, - "learning_rate": 0.00017027307517675293, - "loss": 0.0178, + "epoch": 0.4, + "learning_rate": 0.00023945845588791738, + "loss": 0.0193, "step": 80000 }, { - "epoch": 0.86, - "eval_cer": 0.9215417007593327, - "eval_loss": 0.009527038782835007, - "eval_runtime": 121.101, - "eval_samples_per_second": 16.515, - "eval_steps_per_second": 4.129, + "epoch": 0.4, + "eval_cer": 0.9145207165016832, + "eval_loss": 0.012683646753430367, + "eval_runtime": 116.5374, + "eval_samples_per_second": 17.162, + "eval_steps_per_second": 4.29, "step": 80000 }, { - "epoch": 0.86, - "learning_rate": 0.00017025685931115002, - "loss": 0.0148, + "epoch": 0.4, + "learning_rate": 0.0002394508881949034, + "loss": 0.021, "step": 80010 }, { - "epoch": 0.87, - "learning_rate": 0.0001702406434455471, - "loss": 0.0141, + "epoch": 0.4, + "learning_rate": 0.00023944332050188937, + "loss": 0.0137, "step": 80020 }, { - "epoch": 0.87, - "learning_rate": 0.0001702244275799442, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.00023943575280887535, + "loss": 0.0192, "step": 80030 }, { - "epoch": 0.87, - "learning_rate": 0.0001702082117143413, - "loss": 0.0109, + "epoch": 0.4, + "learning_rate": 0.00023942818511586136, + "loss": 0.0183, "step": 80040 }, { - "epoch": 0.87, - "learning_rate": 0.00017019199584873842, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00023942061742284734, + "loss": 0.0167, "step": 80050 }, { - "epoch": 0.87, - "learning_rate": 0.00017017577998313548, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.00023941304972983332, + "loss": 0.0149, "step": 80060 }, { - "epoch": 0.87, - "learning_rate": 0.00017015956411753258, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.00023940548203681933, + "loss": 0.0176, "step": 80070 }, { - "epoch": 0.87, - "learning_rate": 0.00017014334825192967, - "loss": 0.0113, + "epoch": 0.4, + "learning_rate": 0.0002393979143438053, + "loss": 0.0176, "step": 80080 }, { - "epoch": 0.87, - "learning_rate": 0.0001701271323863268, - "loss": 0.0108, + "epoch": 0.4, + "learning_rate": 0.0002393903466507913, + "loss": 0.0201, "step": 80090 }, { - "epoch": 0.87, - "learning_rate": 0.00017011091652072385, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.00023938277895777727, + "loss": 0.02, "step": 80100 }, { - "epoch": 0.87, - "learning_rate": 0.00017009470065512095, - "loss": 0.0155, + "epoch": 0.4, + "learning_rate": 0.00023937521126476328, + "loss": 0.0158, "step": 80110 }, { - "epoch": 0.87, - "learning_rate": 0.00017007848478951807, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.00023936764357174926, + "loss": 0.0187, "step": 80120 }, { - "epoch": 0.87, - "learning_rate": 0.00017006226892391516, - "loss": 0.0146, + "epoch": 0.4, + "learning_rate": 0.00023936007587873525, + "loss": 0.0198, "step": 80130 }, { - "epoch": 0.87, - "learning_rate": 0.00017004605305831222, - "loss": 0.0107, + "epoch": 0.4, + "learning_rate": 0.00023935250818572125, + "loss": 0.02, "step": 80140 }, { - "epoch": 0.87, - "learning_rate": 0.00017002983719270932, - "loss": 0.0114, + "epoch": 0.4, + "learning_rate": 0.00023934494049270724, + "loss": 0.0166, "step": 80150 }, { - "epoch": 0.87, - "learning_rate": 0.00017001362132710644, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.00023933737279969322, + "loss": 0.0193, "step": 80160 }, { - "epoch": 0.87, - "learning_rate": 0.00016999740546150353, - "loss": 0.0097, + "epoch": 0.4, + "learning_rate": 0.00023932980510667923, + "loss": 0.0182, "step": 80170 }, { - "epoch": 0.87, - "learning_rate": 0.0001699811895959006, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.0002393222374136652, + "loss": 0.0185, "step": 80180 }, { - "epoch": 0.87, - "learning_rate": 0.00016996497373029772, - "loss": 0.0104, + "epoch": 0.4, + "learning_rate": 0.0002393146697206512, + "loss": 0.0176, "step": 80190 }, { - "epoch": 0.87, - "learning_rate": 0.0001699487578646948, - "loss": 0.0146, + "epoch": 0.4, + "learning_rate": 0.0002393071020276372, + "loss": 0.0157, "step": 80200 }, { - "epoch": 0.87, - "learning_rate": 0.0001699325419990919, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.00023929953433462318, + "loss": 0.0172, "step": 80210 }, { - "epoch": 0.87, - "learning_rate": 0.00016991632613348897, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.00023929196664160916, + "loss": 0.0128, "step": 80220 }, { - "epoch": 0.87, - "learning_rate": 0.00016990011026788609, - "loss": 0.0145, + "epoch": 0.4, + "learning_rate": 0.00023928439894859517, + "loss": 0.0185, "step": 80230 }, { - "epoch": 0.87, - "learning_rate": 0.00016988389440228318, - "loss": 0.0102, + "epoch": 0.4, + "learning_rate": 0.00023927683125558115, + "loss": 0.0202, "step": 80240 }, { - "epoch": 0.87, - "learning_rate": 0.00016986767853668027, - "loss": 0.0148, + "epoch": 0.4, + "learning_rate": 0.00023926926356256713, + "loss": 0.0162, "step": 80250 }, { - "epoch": 0.87, - "learning_rate": 0.00016985146267107736, - "loss": 0.0156, + "epoch": 0.4, + "learning_rate": 0.00023926169586955314, + "loss": 0.0162, "step": 80260 }, { - "epoch": 0.87, - "learning_rate": 0.00016983524680547446, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.00023925412817653912, + "loss": 0.0159, "step": 80270 }, { - "epoch": 0.87, - "learning_rate": 0.00016981903093987155, - "loss": 0.0139, + "epoch": 0.41, + "learning_rate": 0.0002392465604835251, + "loss": 0.0347, "step": 80280 }, { - "epoch": 0.87, - "learning_rate": 0.00016980281507426867, - "loss": 0.0149, + "epoch": 0.41, + "learning_rate": 0.00023923899279051108, + "loss": 0.0174, "step": 80290 }, { - "epoch": 0.87, - "learning_rate": 0.00016978659920866574, - "loss": 0.0121, + "epoch": 0.41, + "learning_rate": 0.0002392314250974971, + "loss": 0.0184, "step": 80300 }, { - "epoch": 0.87, - "learning_rate": 0.00016977038334306283, - "loss": 0.015, + "epoch": 0.41, + "learning_rate": 0.00023922385740448307, + "loss": 0.0195, "step": 80310 }, { - "epoch": 0.87, - "learning_rate": 0.00016975416747745995, - "loss": 0.0144, + "epoch": 0.41, + "learning_rate": 0.00023921628971146906, + "loss": 0.0182, "step": 80320 }, { - "epoch": 0.87, - "learning_rate": 0.00016973795161185704, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.00023920872201845506, + "loss": 0.0161, "step": 80330 }, { - "epoch": 0.87, - "learning_rate": 0.0001697217357462541, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023920115432544105, + "loss": 0.0174, "step": 80340 }, { - "epoch": 0.87, - "learning_rate": 0.0001697055198806512, - "loss": 0.0142, + "epoch": 0.41, + "learning_rate": 0.00023919358663242703, + "loss": 0.0167, "step": 80350 }, { - "epoch": 0.87, - "learning_rate": 0.00016968930401504832, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.00023918601893941304, + "loss": 0.0167, "step": 80360 }, { - "epoch": 0.87, - "learning_rate": 0.0001696730881494454, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.00023917845124639902, + "loss": 0.0205, "step": 80370 }, { - "epoch": 0.87, - "learning_rate": 0.00016965687228384248, - "loss": 0.0144, + "epoch": 0.41, + "learning_rate": 0.000239170883553385, + "loss": 0.02, "step": 80380 }, { - "epoch": 0.87, - "learning_rate": 0.0001696406564182396, - "loss": 0.0154, + "epoch": 0.41, + "learning_rate": 0.000239163315860371, + "loss": 0.0207, "step": 80390 }, { - "epoch": 0.87, - "learning_rate": 0.0001696244405526367, - "loss": 0.0111, + "epoch": 0.41, + "learning_rate": 0.000239155748167357, + "loss": 0.019, "step": 80400 }, { - "epoch": 0.87, - "learning_rate": 0.00016960822468703378, - "loss": 0.0138, + "epoch": 0.41, + "learning_rate": 0.00023914818047434297, + "loss": 0.0211, "step": 80410 }, { - "epoch": 0.87, - "learning_rate": 0.00016959200882143085, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.00023914061278132898, + "loss": 0.0202, "step": 80420 }, { - "epoch": 0.87, - "learning_rate": 0.00016957579295582797, - "loss": 0.0161, + "epoch": 0.41, + "learning_rate": 0.00023913304508831496, + "loss": 0.0183, "step": 80430 }, { - "epoch": 0.87, - "learning_rate": 0.00016955957709022506, - "loss": 0.0144, + "epoch": 0.41, + "learning_rate": 0.00023912547739530094, + "loss": 0.018, "step": 80440 }, { - "epoch": 0.87, - "learning_rate": 0.00016954336122462215, - "loss": 0.0145, + "epoch": 0.41, + "learning_rate": 0.00023911790970228692, + "loss": 0.0182, "step": 80450 }, { - "epoch": 0.87, - "learning_rate": 0.00016952714535901925, - "loss": 0.0149, + "epoch": 0.41, + "learning_rate": 0.00023911034200927293, + "loss": 0.0173, "step": 80460 }, { - "epoch": 0.87, - "learning_rate": 0.00016951092949341634, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.0002391027743162589, + "loss": 0.0227, "step": 80470 }, { - "epoch": 0.87, - "learning_rate": 0.00016949471362781343, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.0002390952066232449, + "loss": 0.0166, "step": 80480 }, { - "epoch": 0.87, - "learning_rate": 0.00016947849776221055, - "loss": 0.0118, + "epoch": 0.41, + "learning_rate": 0.0002390876389302309, + "loss": 0.0164, "step": 80490 }, { - "epoch": 0.87, - "learning_rate": 0.00016946228189660762, - "loss": 0.0106, + "epoch": 0.41, + "learning_rate": 0.00023908007123721688, + "loss": 0.0159, "step": 80500 }, { - "epoch": 0.87, - "learning_rate": 0.0001694460660310047, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.00023907250354420287, + "loss": 0.0175, "step": 80510 }, { - "epoch": 0.87, - "learning_rate": 0.0001694298501654018, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.00023906493585118887, + "loss": 0.0194, "step": 80520 }, { - "epoch": 0.87, - "learning_rate": 0.00016941363429979892, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.00023905736815817486, + "loss": 0.0196, "step": 80530 }, { - "epoch": 0.87, - "learning_rate": 0.000169397418434196, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.00023904980046516084, + "loss": 0.019, "step": 80540 }, { - "epoch": 0.87, - "learning_rate": 0.00016938120256859308, - "loss": 0.0121, + "epoch": 0.41, + "learning_rate": 0.00023904223277214685, + "loss": 0.0174, "step": 80550 }, { - "epoch": 0.87, - "learning_rate": 0.0001693649867029902, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.00023903466507913283, + "loss": 0.0157, "step": 80560 }, { - "epoch": 0.87, - "learning_rate": 0.0001693487708373873, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.0002390270973861188, + "loss": 0.0161, "step": 80570 }, { - "epoch": 0.87, - "learning_rate": 0.00016933255497178439, - "loss": 0.0138, + "epoch": 0.41, + "learning_rate": 0.00023901952969310482, + "loss": 0.0181, "step": 80580 }, { - "epoch": 0.87, - "learning_rate": 0.00016931633910618145, - "loss": 0.0121, + "epoch": 0.41, + "learning_rate": 0.0002390119620000908, + "loss": 0.0172, "step": 80590 }, { - "epoch": 0.87, - "learning_rate": 0.00016930012324057857, - "loss": 0.0143, + "epoch": 0.41, + "learning_rate": 0.00023900439430707678, + "loss": 0.0153, "step": 80600 }, { - "epoch": 0.87, - "learning_rate": 0.00016928390737497566, - "loss": 0.0143, + "epoch": 0.41, + "learning_rate": 0.00023899682661406276, + "loss": 0.0189, "step": 80610 }, { - "epoch": 0.87, - "learning_rate": 0.00016926769150937278, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.00023898925892104877, + "loss": 0.0187, "step": 80620 }, { - "epoch": 0.87, - "learning_rate": 0.00016925147564376985, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.00023898169122803475, + "loss": 0.0185, "step": 80630 }, { - "epoch": 0.87, - "learning_rate": 0.00016923525977816694, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.00023897412353502073, + "loss": 0.015, "step": 80640 }, { - "epoch": 0.87, - "learning_rate": 0.00016921904391256404, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023896655584200674, + "loss": 0.0205, "step": 80650 }, { - "epoch": 0.87, - "learning_rate": 0.00016920282804696116, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.00023895898814899272, + "loss": 0.018, "step": 80660 }, { - "epoch": 0.87, - "learning_rate": 0.00016918661218135822, - "loss": 0.019, + "epoch": 0.41, + "learning_rate": 0.0002389514204559787, + "loss": 0.0161, "step": 80670 }, { - "epoch": 0.87, - "learning_rate": 0.00016917039631575531, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.0002389438527629647, + "loss": 0.0176, "step": 80680 }, { - "epoch": 0.87, - "learning_rate": 0.00016915418045015243, - "loss": 0.0105, + "epoch": 0.41, + "learning_rate": 0.0002389362850699507, + "loss": 0.0181, "step": 80690 }, { - "epoch": 0.87, - "learning_rate": 0.00016913796458454953, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.00023892871737693668, + "loss": 0.015, "step": 80700 }, { - "epoch": 0.87, - "learning_rate": 0.0001691217487189466, - "loss": 0.0146, + "epoch": 0.41, + "learning_rate": 0.00023892114968392268, + "loss": 0.0183, "step": 80710 }, { - "epoch": 0.87, - "learning_rate": 0.00016910553285334368, - "loss": 0.0143, + "epoch": 0.41, + "learning_rate": 0.00023891358199090867, + "loss": 0.0204, "step": 80720 }, { - "epoch": 0.87, - "learning_rate": 0.0001690893169877408, - "loss": 0.0119, + "epoch": 0.41, + "learning_rate": 0.00023890601429789465, + "loss": 0.019, "step": 80730 }, { - "epoch": 0.87, - "learning_rate": 0.0001690731011221379, - "loss": 0.0138, + "epoch": 0.41, + "learning_rate": 0.00023889844660488066, + "loss": 0.0166, "step": 80740 }, { - "epoch": 0.87, - "learning_rate": 0.00016905688525653496, - "loss": 0.0173, + "epoch": 0.41, + "learning_rate": 0.00023889087891186664, + "loss": 0.0178, "step": 80750 }, { - "epoch": 0.87, - "learning_rate": 0.00016904066939093208, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023888331121885262, + "loss": 0.0178, "step": 80760 }, { - "epoch": 0.87, - "learning_rate": 0.00016902445352532918, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023887574352583863, + "loss": 0.0189, "step": 80770 }, { - "epoch": 0.87, - "learning_rate": 0.00016900823765972627, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.0002388681758328246, + "loss": 0.016, "step": 80780 }, { - "epoch": 0.87, - "learning_rate": 0.00016899202179412333, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.0002388606081398106, + "loss": 0.0165, "step": 80790 }, { - "epoch": 0.87, - "learning_rate": 0.00016897580592852045, - "loss": 0.0148, + "epoch": 0.41, + "learning_rate": 0.00023885304044679657, + "loss": 0.0181, "step": 80800 }, { - "epoch": 0.87, - "learning_rate": 0.00016895959006291755, - "loss": 0.0145, + "epoch": 0.41, + "learning_rate": 0.00023884547275378258, + "loss": 0.0173, "step": 80810 }, { - "epoch": 0.87, - "learning_rate": 0.00016894337419731464, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023883790506076856, + "loss": 0.0173, "step": 80820 }, { - "epoch": 0.87, - "learning_rate": 0.00016892715833171173, - "loss": 0.0157, + "epoch": 0.41, + "learning_rate": 0.00023883033736775454, + "loss": 0.0159, "step": 80830 }, { - "epoch": 0.87, - "learning_rate": 0.00016891094246610882, - "loss": 0.0147, + "epoch": 0.41, + "learning_rate": 0.00023882276967474055, + "loss": 0.0154, "step": 80840 }, { - "epoch": 0.87, - "learning_rate": 0.00016889472660050592, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.00023881520198172653, + "loss": 0.0167, "step": 80850 }, { - "epoch": 0.87, - "learning_rate": 0.00016887851073490304, - "loss": 0.0148, + "epoch": 0.41, + "learning_rate": 0.00023880763428871252, + "loss": 0.0255, "step": 80860 }, { - "epoch": 0.87, - "learning_rate": 0.0001688622948693001, - "loss": 0.0134, + "epoch": 0.41, + "learning_rate": 0.00023880006659569852, + "loss": 0.0181, "step": 80870 }, { - "epoch": 0.87, - "learning_rate": 0.0001688460790036972, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.0002387924989026845, + "loss": 0.0139, "step": 80880 }, { - "epoch": 0.87, - "learning_rate": 0.0001688298631380943, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.0002387849312096705, + "loss": 0.0164, "step": 80890 }, { - "epoch": 0.87, - "learning_rate": 0.0001688136472724914, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.0002387773635166565, + "loss": 0.0188, "step": 80900 }, { - "epoch": 0.87, - "learning_rate": 0.00016879743140688847, - "loss": 0.0134, + "epoch": 0.41, + "learning_rate": 0.00023876979582364248, + "loss": 0.0154, "step": 80910 }, { - "epoch": 0.87, - "learning_rate": 0.00016878121554128557, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.00023876222813062846, + "loss": 0.0137, "step": 80920 }, { - "epoch": 0.87, - "learning_rate": 0.0001687649996756827, - "loss": 0.0156, + "epoch": 0.41, + "learning_rate": 0.00023875466043761447, + "loss": 0.0185, "step": 80930 }, { - "epoch": 0.88, - "learning_rate": 0.00016874878381007978, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.00023874709274460045, + "loss": 0.015, "step": 80940 }, { - "epoch": 0.88, - "learning_rate": 0.00016873256794447685, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.00023873952505158643, + "loss": 0.0162, "step": 80950 }, { - "epoch": 0.88, - "learning_rate": 0.00016871635207887394, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.0002387319573585724, + "loss": 0.0192, "step": 80960 }, { - "epoch": 0.88, - "learning_rate": 0.00016870013621327106, - "loss": 0.0134, + "epoch": 0.41, + "learning_rate": 0.00023872438966555842, + "loss": 0.0209, "step": 80970 }, { - "epoch": 0.88, - "learning_rate": 0.00016868392034766815, - "loss": 0.0192, + "epoch": 0.41, + "learning_rate": 0.0002387168219725444, + "loss": 0.0182, "step": 80980 }, { - "epoch": 0.88, - "learning_rate": 0.00016866770448206522, - "loss": 0.0149, + "epoch": 0.41, + "learning_rate": 0.00023870925427953038, + "loss": 0.0168, "step": 80990 }, { - "epoch": 0.88, - "learning_rate": 0.00016865148861646234, - "loss": 0.0145, + "epoch": 0.41, + "learning_rate": 0.0002387016865865164, + "loss": 0.016, "step": 81000 }, { - "epoch": 0.88, - "eval_cer": 0.9215668902450677, - "eval_loss": 0.009719022549688816, - "eval_runtime": 121.2086, - "eval_samples_per_second": 16.5, - "eval_steps_per_second": 4.125, + "epoch": 0.41, + "eval_cer": 0.9145090717481783, + "eval_loss": 0.012487111613154411, + "eval_runtime": 116.7617, + "eval_samples_per_second": 17.129, + "eval_steps_per_second": 4.282, "step": 81000 }, { - "epoch": 0.88, - "learning_rate": 0.00016863527275085943, - "loss": 0.0142, + "epoch": 0.41, + "learning_rate": 0.00023869411889350237, + "loss": 0.0197, "step": 81010 }, { - "epoch": 0.88, - "learning_rate": 0.00016861905688525652, - "loss": 0.0147, + "epoch": 0.41, + "learning_rate": 0.00023868655120048835, + "loss": 0.0159, "step": 81020 }, { - "epoch": 0.88, - "learning_rate": 0.00016860284101965361, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.00023867898350747436, + "loss": 0.0203, "step": 81030 }, { - "epoch": 0.88, - "learning_rate": 0.0001685866251540507, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.00023867141581446034, + "loss": 0.0169, "step": 81040 }, { - "epoch": 0.88, - "learning_rate": 0.0001685704092884478, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.00023866384812144633, + "loss": 0.0194, "step": 81050 }, { - "epoch": 0.88, - "learning_rate": 0.00016855419342284492, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023865628042843233, + "loss": 0.0174, "step": 81060 }, { - "epoch": 0.88, - "learning_rate": 0.00016853797755724199, - "loss": 0.0123, + "epoch": 0.41, + "learning_rate": 0.0002386487127354183, + "loss": 0.0177, "step": 81070 }, { - "epoch": 0.88, - "learning_rate": 0.00016852176169163908, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.00023864114504240427, + "loss": 0.0169, "step": 81080 }, { - "epoch": 0.88, - "learning_rate": 0.00016850554582603617, - "loss": 0.011, + "epoch": 0.41, + "learning_rate": 0.00023863357734939025, + "loss": 0.0198, "step": 81090 }, { - "epoch": 0.88, - "learning_rate": 0.0001684893299604333, - "loss": 0.0137, + "epoch": 0.41, + "learning_rate": 0.00023862600965637626, + "loss": 0.0161, "step": 81100 }, { - "epoch": 0.88, - "learning_rate": 0.00016847311409483036, - "loss": 0.0146, + "epoch": 0.41, + "learning_rate": 0.00023861844196336224, + "loss": 0.0203, "step": 81110 }, { - "epoch": 0.88, - "learning_rate": 0.00016845689822922745, - "loss": 0.0126, + "epoch": 0.41, + "learning_rate": 0.00023861087427034822, + "loss": 0.0186, "step": 81120 }, { - "epoch": 0.88, - "learning_rate": 0.00016844068236362457, - "loss": 0.0086, + "epoch": 0.41, + "learning_rate": 0.00023860330657733423, + "loss": 0.0194, "step": 81130 }, { - "epoch": 0.88, - "learning_rate": 0.00016842446649802166, - "loss": 0.0144, + "epoch": 0.41, + "learning_rate": 0.0002385957388843202, + "loss": 0.0222, "step": 81140 }, { - "epoch": 0.88, - "learning_rate": 0.00016840825063241873, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.0002385881711913062, + "loss": 0.0179, "step": 81150 }, { - "epoch": 0.88, - "learning_rate": 0.00016839203476681582, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.0002385806034982922, + "loss": 0.0176, "step": 81160 }, { - "epoch": 0.88, - "learning_rate": 0.00016837581890121294, - "loss": 0.0107, + "epoch": 0.41, + "learning_rate": 0.00023857303580527818, + "loss": 0.0206, "step": 81170 }, { - "epoch": 0.88, - "learning_rate": 0.00016835960303561003, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023856546811226417, + "loss": 0.0173, "step": 81180 }, { - "epoch": 0.88, - "learning_rate": 0.0001683433871700071, - "loss": 0.0186, + "epoch": 0.41, + "learning_rate": 0.00023855790041925015, + "loss": 0.0187, "step": 81190 }, { - "epoch": 0.88, - "learning_rate": 0.00016832717130440422, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.00023855033272623616, + "loss": 0.0167, "step": 81200 }, { - "epoch": 0.88, - "learning_rate": 0.0001683109554388013, - "loss": 0.0112, + "epoch": 0.41, + "learning_rate": 0.00023854276503322214, + "loss": 0.0172, "step": 81210 }, { - "epoch": 0.88, - "learning_rate": 0.0001682947395731984, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.00023853519734020812, + "loss": 0.0161, "step": 81220 }, { - "epoch": 0.88, - "learning_rate": 0.00016827852370759547, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.00023852762964719413, + "loss": 0.0163, "step": 81230 }, { - "epoch": 0.88, - "learning_rate": 0.0001682623078419926, - "loss": 0.0137, + "epoch": 0.41, + "learning_rate": 0.0002385200619541801, + "loss": 0.0138, "step": 81240 }, { - "epoch": 0.88, - "learning_rate": 0.00016824609197638968, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.0002385124942611661, + "loss": 0.0166, "step": 81250 }, { - "epoch": 0.88, - "learning_rate": 0.00016822987611078677, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.0002385049265681521, + "loss": 0.0182, "step": 81260 }, { - "epoch": 0.88, - "learning_rate": 0.00016821366024518387, - "loss": 0.0149, + "epoch": 0.41, + "learning_rate": 0.00023849735887513808, + "loss": 0.0202, "step": 81270 }, { - "epoch": 0.88, - "learning_rate": 0.00016819744437958096, - "loss": 0.0146, + "epoch": 0.41, + "learning_rate": 0.00023848979118212406, + "loss": 0.0228, "step": 81280 }, { - "epoch": 0.88, - "learning_rate": 0.00016818122851397805, - "loss": 0.0109, + "epoch": 0.41, + "learning_rate": 0.00023848222348911007, + "loss": 0.0169, "step": 81290 }, { - "epoch": 0.88, - "learning_rate": 0.00016816501264837517, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023847465579609605, + "loss": 0.016, "step": 81300 }, { - "epoch": 0.88, - "learning_rate": 0.00016814879678277227, - "loss": 0.0104, + "epoch": 0.41, + "learning_rate": 0.00023846708810308203, + "loss": 0.0159, "step": 81310 }, { - "epoch": 0.88, - "learning_rate": 0.00016813258091716933, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.00023845952041006804, + "loss": 0.0159, "step": 81320 }, { - "epoch": 0.88, - "learning_rate": 0.00016811636505156645, - "loss": 0.0152, + "epoch": 0.41, + "learning_rate": 0.00023845195271705402, + "loss": 0.0175, "step": 81330 }, { - "epoch": 0.88, - "learning_rate": 0.00016810014918596354, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.00023844438502404, + "loss": 0.0187, "step": 81340 }, { - "epoch": 0.88, - "learning_rate": 0.00016808393332036064, - "loss": 0.0137, + "epoch": 0.41, + "learning_rate": 0.00023843681733102599, + "loss": 0.0149, "step": 81350 }, { - "epoch": 0.88, - "learning_rate": 0.0001680677174547577, - "loss": 0.0146, + "epoch": 0.41, + "learning_rate": 0.000238429249638012, + "loss": 0.0195, "step": 81360 }, { - "epoch": 0.88, - "learning_rate": 0.00016805150158915482, - "loss": 0.0121, + "epoch": 0.41, + "learning_rate": 0.00023842168194499798, + "loss": 0.0214, "step": 81370 }, { - "epoch": 0.88, - "learning_rate": 0.00016803528572355191, - "loss": 0.0119, + "epoch": 0.41, + "learning_rate": 0.00023841411425198396, + "loss": 0.0185, "step": 81380 }, { - "epoch": 0.88, - "learning_rate": 0.000168019069857949, - "loss": 0.0137, + "epoch": 0.41, + "learning_rate": 0.00023840654655896997, + "loss": 0.0145, "step": 81390 }, { - "epoch": 0.88, - "learning_rate": 0.0001680028539923461, - "loss": 0.0108, + "epoch": 0.41, + "learning_rate": 0.00023839897886595595, + "loss": 0.0149, "step": 81400 }, { - "epoch": 0.88, - "learning_rate": 0.0001679866381267432, - "loss": 0.0107, + "epoch": 0.41, + "learning_rate": 0.00023839141117294193, + "loss": 0.0151, "step": 81410 }, { - "epoch": 0.88, - "learning_rate": 0.00016797042226114029, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.00023838384347992794, + "loss": 0.0137, "step": 81420 }, { - "epoch": 0.88, - "learning_rate": 0.0001679542063955374, - "loss": 0.0162, + "epoch": 0.41, + "learning_rate": 0.00023837627578691392, + "loss": 0.0121, "step": 81430 }, { - "epoch": 0.88, - "learning_rate": 0.00016793799052993447, - "loss": 0.0145, + "epoch": 0.41, + "learning_rate": 0.0002383687080938999, + "loss": 0.0143, "step": 81440 }, { - "epoch": 0.88, - "learning_rate": 0.00016792177466433156, - "loss": 0.0156, + "epoch": 0.41, + "learning_rate": 0.0002383611404008859, + "loss": 0.0172, "step": 81450 }, { - "epoch": 0.88, - "learning_rate": 0.00016790555879872866, - "loss": 0.0126, + "epoch": 0.41, + "learning_rate": 0.0002383535727078719, + "loss": 0.0164, "step": 81460 }, { - "epoch": 0.88, - "learning_rate": 0.00016788934293312578, - "loss": 0.0134, + "epoch": 0.41, + "learning_rate": 0.00023834600501485787, + "loss": 0.0186, "step": 81470 }, { - "epoch": 0.88, - "learning_rate": 0.00016787312706752284, - "loss": 0.0139, + "epoch": 0.41, + "learning_rate": 0.00023833843732184388, + "loss": 0.0154, "step": 81480 }, { - "epoch": 0.88, - "learning_rate": 0.00016785691120191993, - "loss": 0.0154, + "epoch": 0.41, + "learning_rate": 0.00023833086962882986, + "loss": 0.013, "step": 81490 }, { - "epoch": 0.88, - "learning_rate": 0.00016784069533631705, - "loss": 0.0113, + "epoch": 0.41, + "learning_rate": 0.00023832330193581584, + "loss": 0.0175, "step": 81500 }, { - "epoch": 0.88, - "learning_rate": 0.00016782447947071415, - "loss": 0.0113, + "epoch": 0.41, + "learning_rate": 0.00023831573424280182, + "loss": 0.0172, "step": 81510 }, { - "epoch": 0.88, - "learning_rate": 0.0001678082636051112, - "loss": 0.0158, + "epoch": 0.41, + "learning_rate": 0.00023830816654978783, + "loss": 0.0157, "step": 81520 }, { - "epoch": 0.88, - "learning_rate": 0.0001677920477395083, - "loss": 0.0143, + "epoch": 0.41, + "learning_rate": 0.00023830059885677381, + "loss": 0.0181, "step": 81530 }, { - "epoch": 0.88, - "learning_rate": 0.00016777583187390543, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.0002382930311637598, + "loss": 0.0198, "step": 81540 }, { - "epoch": 0.88, - "learning_rate": 0.00016775961600830252, - "loss": 0.0145, + "epoch": 0.41, + "learning_rate": 0.0002382854634707458, + "loss": 0.0143, "step": 81550 }, { - "epoch": 0.88, - "learning_rate": 0.00016774340014269958, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.00023827789577773179, + "loss": 0.0163, "step": 81560 }, { - "epoch": 0.88, - "learning_rate": 0.0001677271842770967, - "loss": 0.0107, + "epoch": 0.41, + "learning_rate": 0.00023827032808471777, + "loss": 0.0148, "step": 81570 }, { - "epoch": 0.88, - "learning_rate": 0.0001677109684114938, - "loss": 0.0176, + "epoch": 0.41, + "learning_rate": 0.00023826276039170378, + "loss": 0.0155, "step": 81580 }, { - "epoch": 0.88, - "learning_rate": 0.0001676947525458909, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.00023825519269868976, + "loss": 0.0201, "step": 81590 }, { - "epoch": 0.88, - "learning_rate": 0.00016767853668028795, - "loss": 0.0139, + "epoch": 0.41, + "learning_rate": 0.00023824762500567574, + "loss": 0.0193, "step": 81600 }, { - "epoch": 0.88, - "learning_rate": 0.00016766232081468507, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023824005731266175, + "loss": 0.0149, "step": 81610 }, { - "epoch": 0.88, - "learning_rate": 0.00016764610494908217, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.00023823248961964773, + "loss": 0.0212, "step": 81620 }, { - "epoch": 0.88, - "learning_rate": 0.0001676298890834793, - "loss": 0.0197, + "epoch": 0.41, + "learning_rate": 0.0002382249219266337, + "loss": 0.0181, "step": 81630 }, { - "epoch": 0.88, - "learning_rate": 0.00016761367321787635, - "loss": 0.015, + "epoch": 0.41, + "learning_rate": 0.00023821735423361972, + "loss": 0.0172, "step": 81640 }, { - "epoch": 0.88, - "learning_rate": 0.00016759745735227345, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.0002382097865406057, + "loss": 0.0236, "step": 81650 }, { - "epoch": 0.88, - "learning_rate": 0.00016758124148667054, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.00023820221884759168, + "loss": 0.0255, "step": 81660 }, { - "epoch": 0.88, - "learning_rate": 0.00016756502562106766, - "loss": 0.015, + "epoch": 0.41, + "learning_rate": 0.00023819465115457766, + "loss": 0.0179, "step": 81670 }, { - "epoch": 0.88, - "learning_rate": 0.00016754880975546472, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023818708346156367, + "loss": 0.0173, "step": 81680 }, { - "epoch": 0.88, - "learning_rate": 0.00016753259388986182, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023817951576854965, + "loss": 0.0176, "step": 81690 }, { - "epoch": 0.88, - "learning_rate": 0.00016751637802425894, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023817194807553563, + "loss": 0.0169, "step": 81700 }, { - "epoch": 0.88, - "learning_rate": 0.00016750016215865603, - "loss": 0.0137, + "epoch": 0.41, + "learning_rate": 0.00023816438038252164, + "loss": 0.0199, "step": 81710 }, { - "epoch": 0.88, - "learning_rate": 0.0001674839462930531, - "loss": 0.0146, + "epoch": 0.41, + "learning_rate": 0.00023815681268950762, + "loss": 0.016, "step": 81720 }, { - "epoch": 0.88, - "learning_rate": 0.0001674677304274502, - "loss": 0.0191, + "epoch": 0.41, + "learning_rate": 0.0002381492449964936, + "loss": 0.0171, "step": 81730 }, { - "epoch": 0.88, - "learning_rate": 0.0001674515145618473, - "loss": 0.0152, + "epoch": 0.41, + "learning_rate": 0.00023814167730347961, + "loss": 0.0189, "step": 81740 }, { - "epoch": 0.88, - "learning_rate": 0.0001674352986962444, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.0002381341096104656, + "loss": 0.018, "step": 81750 }, { - "epoch": 0.88, - "learning_rate": 0.00016741908283064147, - "loss": 0.0171, + "epoch": 0.41, + "learning_rate": 0.00023812654191745158, + "loss": 0.0158, "step": 81760 }, { - "epoch": 0.88, - "learning_rate": 0.00016740286696503859, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.00023811897422443759, + "loss": 0.0141, "step": 81770 }, { - "epoch": 0.88, - "learning_rate": 0.00016738665109943568, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.00023811140653142357, + "loss": 0.0172, "step": 81780 }, { - "epoch": 0.88, - "learning_rate": 0.00016737043523383277, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.00023810383883840955, + "loss": 0.0135, "step": 81790 }, { - "epoch": 0.88, - "learning_rate": 0.00016735421936822984, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023809627114539556, + "loss": 0.0158, "step": 81800 }, { - "epoch": 0.88, - "learning_rate": 0.00016733800350262696, - "loss": 0.0137, + "epoch": 0.41, + "learning_rate": 0.00023808870345238154, + "loss": 0.0172, "step": 81810 }, { - "epoch": 0.88, - "learning_rate": 0.00016732178763702405, - "loss": 0.0142, + "epoch": 0.41, + "learning_rate": 0.00023808113575936752, + "loss": 0.0173, "step": 81820 }, { - "epoch": 0.88, - "learning_rate": 0.00016730557177142114, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.00023807356806635353, + "loss": 0.0211, "step": 81830 }, { - "epoch": 0.88, - "learning_rate": 0.00016728935590581823, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.0002380660003733395, + "loss": 0.0167, "step": 81840 }, { - "epoch": 0.88, - "learning_rate": 0.00016727314004021533, - "loss": 0.0134, + "epoch": 0.41, + "learning_rate": 0.0002380584326803255, + "loss": 0.0176, "step": 81850 }, { - "epoch": 0.88, - "learning_rate": 0.00016725692417461242, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023805086498731147, + "loss": 0.0185, "step": 81860 }, { - "epoch": 0.89, - "learning_rate": 0.00016724070830900954, - "loss": 0.0139, + "epoch": 0.41, + "learning_rate": 0.00023804329729429748, + "loss": 0.0159, "step": 81870 }, { - "epoch": 0.89, - "learning_rate": 0.0001672244924434066, - "loss": 0.0106, + "epoch": 0.41, + "learning_rate": 0.00023803572960128346, + "loss": 0.0178, "step": 81880 }, { - "epoch": 0.89, - "learning_rate": 0.0001672082765778037, - "loss": 0.0172, + "epoch": 0.41, + "learning_rate": 0.00023802816190826944, + "loss": 0.0198, "step": 81890 }, { - "epoch": 0.89, - "learning_rate": 0.0001671920607122008, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.00023802059421525545, + "loss": 0.0191, "step": 81900 }, { - "epoch": 0.89, - "learning_rate": 0.0001671758448465979, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.00023801302652224143, + "loss": 0.0179, "step": 81910 }, { - "epoch": 0.89, - "learning_rate": 0.00016715962898099498, - "loss": 0.0154, + "epoch": 0.41, + "learning_rate": 0.00023800545882922742, + "loss": 0.0177, "step": 81920 }, { - "epoch": 0.89, - "learning_rate": 0.00016714341311539207, - "loss": 0.011, + "epoch": 0.41, + "learning_rate": 0.00023799789113621342, + "loss": 0.0173, "step": 81930 }, { - "epoch": 0.89, - "learning_rate": 0.0001671271972497892, - "loss": 0.011, + "epoch": 0.41, + "learning_rate": 0.0002379903234431994, + "loss": 0.0204, "step": 81940 }, { - "epoch": 0.89, - "learning_rate": 0.00016711098138418628, - "loss": 0.0153, + "epoch": 0.41, + "learning_rate": 0.0002379827557501854, + "loss": 0.0158, "step": 81950 }, { - "epoch": 0.89, - "learning_rate": 0.00016709476551858335, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.0002379751880571714, + "loss": 0.015, "step": 81960 }, { - "epoch": 0.89, - "learning_rate": 0.00016707854965298044, - "loss": 0.015, + "epoch": 0.41, + "learning_rate": 0.00023796762036415738, + "loss": 0.0147, "step": 81970 }, { - "epoch": 0.89, - "learning_rate": 0.00016706233378737756, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.00023796005267114336, + "loss": 0.0162, "step": 81980 }, { - "epoch": 0.89, - "learning_rate": 0.00016704611792177465, - "loss": 0.0192, + "epoch": 0.41, + "learning_rate": 0.00023795248497812937, + "loss": 0.016, "step": 81990 }, { - "epoch": 0.89, - "learning_rate": 0.00016702990205617172, - "loss": 0.0154, + "epoch": 0.41, + "learning_rate": 0.00023794491728511535, + "loss": 0.0146, "step": 82000 }, { - "epoch": 0.89, - "eval_cer": 0.9215382263475072, - "eval_loss": 0.009874101728200912, - "eval_runtime": 121.2944, - "eval_samples_per_second": 16.489, - "eval_steps_per_second": 4.122, + "epoch": 0.41, + "eval_cer": 0.9144935454101719, + "eval_loss": 0.012472189962863922, + "eval_runtime": 116.6656, + "eval_samples_per_second": 17.143, + "eval_steps_per_second": 4.286, "step": 82000 }, { - "epoch": 0.89, - "learning_rate": 0.00016701368619056884, - "loss": 0.0153, + "epoch": 0.41, + "learning_rate": 0.00023793734959210133, + "loss": 0.0162, "step": 82010 }, { - "epoch": 0.89, - "learning_rate": 0.00016699747032496593, - "loss": 0.0194, + "epoch": 0.41, + "learning_rate": 0.0002379297818990873, + "loss": 0.0168, "step": 82020 }, { - "epoch": 0.89, - "learning_rate": 0.00016698125445936302, - "loss": 0.0155, + "epoch": 0.41, + "learning_rate": 0.00023792221420607332, + "loss": 0.0198, "step": 82030 }, { - "epoch": 0.89, - "learning_rate": 0.00016696503859376014, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.0002379146465130593, + "loss": 0.0183, "step": 82040 }, { - "epoch": 0.89, - "learning_rate": 0.0001669488227281572, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.00023790707882004528, + "loss": 0.0302, "step": 82050 }, { - "epoch": 0.89, - "learning_rate": 0.0001669326068625543, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.0002378995111270313, + "loss": 0.0161, "step": 82060 }, { - "epoch": 0.89, - "learning_rate": 0.00016691639099695142, - "loss": 0.0139, + "epoch": 0.41, + "learning_rate": 0.00023789194343401727, + "loss": 0.018, "step": 82070 }, { - "epoch": 0.89, - "learning_rate": 0.00016690017513134851, - "loss": 0.0143, + "epoch": 0.41, + "learning_rate": 0.00023788437574100325, + "loss": 0.0202, "step": 82080 }, { - "epoch": 0.89, - "learning_rate": 0.00016688395926574558, - "loss": 0.0156, + "epoch": 0.41, + "learning_rate": 0.00023787680804798926, + "loss": 0.019, "step": 82090 }, { - "epoch": 0.89, - "learning_rate": 0.00016686774340014267, - "loss": 0.0113, + "epoch": 0.41, + "learning_rate": 0.00023786924035497524, + "loss": 0.023, "step": 82100 }, { - "epoch": 0.89, - "learning_rate": 0.0001668515275345398, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.00023786167266196123, + "loss": 0.0193, "step": 82110 }, { - "epoch": 0.89, - "learning_rate": 0.00016683531166893689, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023785410496894723, + "loss": 0.0151, "step": 82120 }, { - "epoch": 0.89, - "learning_rate": 0.00016681909580333395, - "loss": 0.0157, + "epoch": 0.41, + "learning_rate": 0.00023784653727593322, + "loss": 0.0216, "step": 82130 }, { - "epoch": 0.89, - "learning_rate": 0.00016680287993773107, - "loss": 0.0108, + "epoch": 0.41, + "learning_rate": 0.0002378389695829192, + "loss": 0.0253, "step": 82140 }, { - "epoch": 0.89, - "learning_rate": 0.00016678666407212816, - "loss": 0.0118, + "epoch": 0.41, + "learning_rate": 0.0002378314018899052, + "loss": 0.0196, "step": 82150 }, { - "epoch": 0.89, - "learning_rate": 0.00016677044820652526, - "loss": 0.0152, + "epoch": 0.41, + "learning_rate": 0.0002378238341968912, + "loss": 0.0166, "step": 82160 }, { - "epoch": 0.89, - "learning_rate": 0.00016675423234092232, - "loss": 0.0161, + "epoch": 0.41, + "learning_rate": 0.00023781626650387717, + "loss": 0.0154, "step": 82170 }, { - "epoch": 0.89, - "learning_rate": 0.00016673801647531944, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.00023780869881086315, + "loss": 0.0148, "step": 82180 }, { - "epoch": 0.89, - "learning_rate": 0.00016672180060971653, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023780113111784916, + "loss": 0.0206, "step": 82190 }, { - "epoch": 0.89, - "learning_rate": 0.00016670558474411363, - "loss": 0.0138, + "epoch": 0.41, + "learning_rate": 0.00023779356342483514, + "loss": 0.0171, "step": 82200 }, { - "epoch": 0.89, - "learning_rate": 0.00016668936887851072, - "loss": 0.0109, + "epoch": 0.41, + "learning_rate": 0.00023778599573182112, + "loss": 0.0161, "step": 82210 }, { - "epoch": 0.89, - "learning_rate": 0.0001666731530129078, - "loss": 0.0119, + "epoch": 0.41, + "learning_rate": 0.00023777842803880713, + "loss": 0.0177, "step": 82220 }, { - "epoch": 0.89, - "learning_rate": 0.0001666569371473049, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.0002377708603457931, + "loss": 0.0166, "step": 82230 }, { - "epoch": 0.89, - "learning_rate": 0.00016664072128170203, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.0002377632926527791, + "loss": 0.0183, "step": 82240 }, { - "epoch": 0.89, - "learning_rate": 0.0001666245054160991, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.0002377557249597651, + "loss": 0.0222, "step": 82250 }, { - "epoch": 0.89, - "learning_rate": 0.00016660828955049618, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.00023774815726675108, + "loss": 0.0154, "step": 82260 }, { - "epoch": 0.89, - "learning_rate": 0.00016659207368489328, - "loss": 0.012, + "epoch": 0.42, + "learning_rate": 0.00023774058957373706, + "loss": 0.0174, "step": 82270 }, { - "epoch": 0.89, - "learning_rate": 0.0001665758578192904, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.00023773302188072307, + "loss": 0.0222, "step": 82280 }, { - "epoch": 0.89, - "learning_rate": 0.00016655964195368746, - "loss": 0.0156, + "epoch": 0.42, + "learning_rate": 0.00023772545418770905, + "loss": 0.017, "step": 82290 }, { - "epoch": 0.89, - "learning_rate": 0.00016654342608808456, - "loss": 0.0141, + "epoch": 0.42, + "learning_rate": 0.00023771788649469504, + "loss": 0.0132, "step": 82300 }, { - "epoch": 0.89, - "learning_rate": 0.00016652721022248167, - "loss": 0.0141, + "epoch": 0.42, + "learning_rate": 0.00023771031880168104, + "loss": 0.0185, "step": 82310 }, { - "epoch": 0.89, - "learning_rate": 0.00016651099435687877, - "loss": 0.0138, + "epoch": 0.42, + "learning_rate": 0.00023770275110866703, + "loss": 0.0154, "step": 82320 }, { - "epoch": 0.89, - "learning_rate": 0.00016649477849127583, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.00023769518341565298, + "loss": 0.0219, "step": 82330 }, { - "epoch": 0.89, - "learning_rate": 0.00016647856262567295, - "loss": 0.0156, + "epoch": 0.42, + "learning_rate": 0.00023768761572263896, + "loss": 0.0168, "step": 82340 }, { - "epoch": 0.89, - "learning_rate": 0.00016646234676007005, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.00023768004802962497, + "loss": 0.0198, "step": 82350 }, { - "epoch": 0.89, - "learning_rate": 0.00016644613089446714, - "loss": 0.0145, + "epoch": 0.42, + "learning_rate": 0.00023767248033661095, + "loss": 0.0175, "step": 82360 }, { - "epoch": 0.89, - "learning_rate": 0.0001664299150288642, - "loss": 0.0155, + "epoch": 0.42, + "learning_rate": 0.00023766491264359693, + "loss": 0.0187, "step": 82370 }, { - "epoch": 0.89, - "learning_rate": 0.00016641369916326132, - "loss": 0.0158, + "epoch": 0.42, + "learning_rate": 0.00023765734495058294, + "loss": 0.0216, "step": 82380 }, { - "epoch": 0.89, - "learning_rate": 0.00016639748329765842, - "loss": 0.0153, + "epoch": 0.42, + "learning_rate": 0.00023764977725756892, + "loss": 0.0176, "step": 82390 }, { - "epoch": 0.89, - "learning_rate": 0.0001663812674320555, - "loss": 0.0144, + "epoch": 0.42, + "learning_rate": 0.0002376422095645549, + "loss": 0.0199, "step": 82400 }, { - "epoch": 0.89, - "learning_rate": 0.0001663650515664526, - "loss": 0.0172, + "epoch": 0.42, + "learning_rate": 0.00023763464187154089, + "loss": 0.0169, "step": 82410 }, { - "epoch": 0.89, - "learning_rate": 0.0001663488357008497, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.0002376270741785269, + "loss": 0.017, "step": 82420 }, { - "epoch": 0.89, - "learning_rate": 0.0001663326198352468, - "loss": 0.0123, + "epoch": 0.42, + "learning_rate": 0.00023761950648551288, + "loss": 0.0212, "step": 82430 }, { - "epoch": 0.89, - "learning_rate": 0.0001663164039696439, - "loss": 0.0122, + "epoch": 0.42, + "learning_rate": 0.00023761193879249886, + "loss": 0.017, "step": 82440 }, { - "epoch": 0.89, - "learning_rate": 0.00016630018810404097, - "loss": 0.0148, + "epoch": 0.42, + "learning_rate": 0.00023760437109948487, + "loss": 0.0159, "step": 82450 }, { - "epoch": 0.89, - "learning_rate": 0.00016628397223843807, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.00023759680340647085, + "loss": 0.0241, "step": 82460 }, { - "epoch": 0.89, - "learning_rate": 0.00016626775637283516, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.00023758923571345683, + "loss": 0.0181, "step": 82470 }, { - "epoch": 0.89, - "learning_rate": 0.00016625154050723228, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.00023758166802044284, + "loss": 0.0194, "step": 82480 }, { - "epoch": 0.89, - "learning_rate": 0.00016623532464162934, - "loss": 0.0112, + "epoch": 0.42, + "learning_rate": 0.00023757410032742882, + "loss": 0.0193, "step": 82490 }, { - "epoch": 0.89, - "learning_rate": 0.00016621910877602644, - "loss": 0.0132, + "epoch": 0.42, + "learning_rate": 0.0002375665326344148, + "loss": 0.0213, "step": 82500 }, { - "epoch": 0.89, - "learning_rate": 0.00016620289291042356, - "loss": 0.0122, + "epoch": 0.42, + "learning_rate": 0.0002375589649414008, + "loss": 0.02, "step": 82510 }, { - "epoch": 0.89, - "learning_rate": 0.00016618667704482065, - "loss": 0.0158, + "epoch": 0.42, + "learning_rate": 0.0002375513972483868, + "loss": 0.0183, "step": 82520 }, { - "epoch": 0.89, - "learning_rate": 0.00016617046117921772, - "loss": 0.0165, + "epoch": 0.42, + "learning_rate": 0.00023754382955537277, + "loss": 0.022, "step": 82530 }, { - "epoch": 0.89, - "learning_rate": 0.0001661542453136148, - "loss": 0.0122, + "epoch": 0.42, + "learning_rate": 0.00023753626186235878, + "loss": 0.0179, "step": 82540 }, { - "epoch": 0.89, - "learning_rate": 0.00016613802944801193, - "loss": 0.0115, + "epoch": 0.42, + "learning_rate": 0.00023752869416934476, + "loss": 0.0168, "step": 82550 }, { - "epoch": 0.89, - "learning_rate": 0.00016612181358240902, - "loss": 0.0146, + "epoch": 0.42, + "learning_rate": 0.00023752112647633074, + "loss": 0.0143, "step": 82560 }, { - "epoch": 0.89, - "learning_rate": 0.00016610559771680609, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023751355878331672, + "loss": 0.0146, "step": 82570 }, { - "epoch": 0.89, - "learning_rate": 0.0001660893818512032, - "loss": 0.0147, + "epoch": 0.42, + "learning_rate": 0.00023750599109030273, + "loss": 0.0178, "step": 82580 }, { - "epoch": 0.89, - "learning_rate": 0.0001660731659856003, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.00023749842339728871, + "loss": 0.0188, "step": 82590 }, { - "epoch": 0.89, - "learning_rate": 0.0001660569501199974, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.0002374908557042747, + "loss": 0.0206, "step": 82600 }, { - "epoch": 0.89, - "learning_rate": 0.00016604073425439446, - "loss": 0.0153, + "epoch": 0.42, + "learning_rate": 0.0002374832880112607, + "loss": 0.0159, "step": 82610 }, { - "epoch": 0.89, - "learning_rate": 0.00016602451838879158, - "loss": 0.0185, + "epoch": 0.42, + "learning_rate": 0.00023747572031824669, + "loss": 0.014, "step": 82620 }, { - "epoch": 0.89, - "learning_rate": 0.00016600830252318867, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.00023746815262523267, + "loss": 0.016, "step": 82630 }, { - "epoch": 0.89, - "learning_rate": 0.0001659920866575858, - "loss": 0.0135, + "epoch": 0.42, + "learning_rate": 0.00023746058493221868, + "loss": 0.0213, "step": 82640 }, { - "epoch": 0.89, - "learning_rate": 0.00016597587079198286, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.00023745301723920466, + "loss": 0.0156, "step": 82650 }, { - "epoch": 0.89, - "learning_rate": 0.00016595965492637995, - "loss": 0.0123, + "epoch": 0.42, + "learning_rate": 0.00023744544954619064, + "loss": 0.0224, "step": 82660 }, { - "epoch": 0.89, - "learning_rate": 0.00016594343906077704, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.00023743788185317665, + "loss": 0.0151, "step": 82670 }, { - "epoch": 0.89, - "learning_rate": 0.00016592722319517416, - "loss": 0.012, + "epoch": 0.42, + "learning_rate": 0.00023743031416016263, + "loss": 0.0174, "step": 82680 }, { - "epoch": 0.89, - "learning_rate": 0.00016591100732957123, - "loss": 0.0169, + "epoch": 0.42, + "learning_rate": 0.0002374227464671486, + "loss": 0.0157, "step": 82690 }, { - "epoch": 0.89, - "learning_rate": 0.00016589479146396832, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.00023741517877413462, + "loss": 0.0215, "step": 82700 }, { - "epoch": 0.89, - "learning_rate": 0.00016587857559836544, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.0002374076110811206, + "loss": 0.0198, "step": 82710 }, { - "epoch": 0.89, - "learning_rate": 0.00016586235973276253, - "loss": 0.0115, + "epoch": 0.42, + "learning_rate": 0.00023740004338810658, + "loss": 0.0164, "step": 82720 }, { - "epoch": 0.89, - "learning_rate": 0.00016584614386715962, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.0002373924756950926, + "loss": 0.0185, "step": 82730 }, { - "epoch": 0.89, - "learning_rate": 0.0001658299280015567, - "loss": 0.0105, + "epoch": 0.42, + "learning_rate": 0.00023738490800207857, + "loss": 0.0238, "step": 82740 }, { - "epoch": 0.89, - "learning_rate": 0.0001658137121359538, - "loss": 0.0115, + "epoch": 0.42, + "learning_rate": 0.00023737734030906455, + "loss": 0.018, "step": 82750 }, { - "epoch": 0.89, - "learning_rate": 0.0001657974962703509, - "loss": 0.0135, + "epoch": 0.42, + "learning_rate": 0.00023736977261605053, + "loss": 0.0216, "step": 82760 }, { - "epoch": 0.89, - "learning_rate": 0.000165781280404748, - "loss": 0.0135, + "epoch": 0.42, + "learning_rate": 0.00023736220492303654, + "loss": 0.0214, "step": 82770 }, { - "epoch": 0.89, - "learning_rate": 0.0001657650645391451, - "loss": 0.0147, + "epoch": 0.42, + "learning_rate": 0.00023735463723002252, + "loss": 0.0169, "step": 82780 }, { - "epoch": 0.9, - "learning_rate": 0.00016574884867354218, - "loss": 0.0161, + "epoch": 0.42, + "learning_rate": 0.0002373470695370085, + "loss": 0.0182, "step": 82790 }, { - "epoch": 0.9, - "learning_rate": 0.00016573263280793927, - "loss": 0.0132, + "epoch": 0.42, + "learning_rate": 0.00023733950184399451, + "loss": 0.017, "step": 82800 }, { - "epoch": 0.9, - "learning_rate": 0.0001657164169423364, - "loss": 0.0126, + "epoch": 0.42, + "learning_rate": 0.0002373319341509805, + "loss": 0.0162, "step": 82810 }, { - "epoch": 0.9, - "learning_rate": 0.00016570020107673346, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.00023732436645796648, + "loss": 0.0156, "step": 82820 }, { - "epoch": 0.9, - "learning_rate": 0.00016568398521113055, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.00023731679876495249, + "loss": 0.0242, "step": 82830 }, { - "epoch": 0.9, - "learning_rate": 0.00016566776934552764, - "loss": 0.0103, + "epoch": 0.42, + "learning_rate": 0.00023730923107193847, + "loss": 0.0193, "step": 82840 }, { - "epoch": 0.9, - "learning_rate": 0.00016565155347992476, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.00023730166337892445, + "loss": 0.0184, "step": 82850 }, { - "epoch": 0.9, - "learning_rate": 0.00016563533761432183, - "loss": 0.0154, + "epoch": 0.42, + "learning_rate": 0.00023729409568591046, + "loss": 0.019, "step": 82860 }, { - "epoch": 0.9, - "learning_rate": 0.00016561912174871892, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.00023728652799289644, + "loss": 0.018, "step": 82870 }, { - "epoch": 0.9, - "learning_rate": 0.00016560290588311604, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.00023727896029988242, + "loss": 0.0199, "step": 82880 }, { - "epoch": 0.9, - "learning_rate": 0.00016558669001751314, - "loss": 0.0145, + "epoch": 0.42, + "learning_rate": 0.00023727139260686843, + "loss": 0.0158, "step": 82890 }, { - "epoch": 0.9, - "learning_rate": 0.0001655704741519102, - "loss": 0.0138, + "epoch": 0.42, + "learning_rate": 0.0002372638249138544, + "loss": 0.0187, "step": 82900 }, { - "epoch": 0.9, - "learning_rate": 0.0001655542582863073, - "loss": 0.0159, + "epoch": 0.42, + "learning_rate": 0.0002372562572208404, + "loss": 0.0158, "step": 82910 }, { - "epoch": 0.9, - "learning_rate": 0.00016553804242070441, - "loss": 0.0153, + "epoch": 0.42, + "learning_rate": 0.00023724868952782637, + "loss": 0.0192, "step": 82920 }, { - "epoch": 0.9, - "learning_rate": 0.0001655218265551015, - "loss": 0.0162, + "epoch": 0.42, + "learning_rate": 0.00023724112183481238, + "loss": 0.0194, "step": 82930 }, { - "epoch": 0.9, - "learning_rate": 0.00016550561068949857, - "loss": 0.014, + "epoch": 0.42, + "learning_rate": 0.00023723355414179836, + "loss": 0.0164, "step": 82940 }, { - "epoch": 0.9, - "learning_rate": 0.0001654893948238957, - "loss": 0.0157, + "epoch": 0.42, + "learning_rate": 0.00023722598644878434, + "loss": 0.0245, "step": 82950 }, { - "epoch": 0.9, - "learning_rate": 0.00016547317895829278, - "loss": 0.0148, + "epoch": 0.42, + "learning_rate": 0.00023721841875577035, + "loss": 0.0205, "step": 82960 }, { - "epoch": 0.9, - "learning_rate": 0.00016545696309268988, - "loss": 0.0125, + "epoch": 0.42, + "learning_rate": 0.00023721085106275633, + "loss": 0.0172, "step": 82970 }, { - "epoch": 0.9, - "learning_rate": 0.00016544074722708694, - "loss": 0.0152, + "epoch": 0.42, + "learning_rate": 0.00023720328336974232, + "loss": 0.0163, "step": 82980 }, { - "epoch": 0.9, - "learning_rate": 0.00016542453136148406, - "loss": 0.0164, + "epoch": 0.42, + "learning_rate": 0.00023719571567672832, + "loss": 0.0156, "step": 82990 }, { - "epoch": 0.9, - "learning_rate": 0.00016540831549588116, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.0002371881479837143, + "loss": 0.0169, "step": 83000 }, { - "epoch": 0.9, - "eval_cer": 0.9215286717149871, - "eval_loss": 0.00943547859787941, - "eval_runtime": 121.1193, - "eval_samples_per_second": 16.513, - "eval_steps_per_second": 4.128, + "epoch": 0.42, + "eval_cer": 0.9144954862024227, + "eval_loss": 0.012444199062883854, + "eval_runtime": 116.798, + "eval_samples_per_second": 17.124, + "eval_steps_per_second": 4.281, "step": 83000 }, { - "epoch": 0.9, - "learning_rate": 0.00016539209963027828, - "loss": 0.0115, + "epoch": 0.42, + "learning_rate": 0.0002371805802907003, + "loss": 0.0181, "step": 83010 }, { - "epoch": 0.9, - "learning_rate": 0.00016537588376467534, - "loss": 0.0143, + "epoch": 0.42, + "learning_rate": 0.0002371730125976863, + "loss": 0.0159, "step": 83020 }, { - "epoch": 0.9, - "learning_rate": 0.00016535966789907243, - "loss": 0.0138, + "epoch": 0.42, + "learning_rate": 0.00023716544490467228, + "loss": 0.0158, "step": 83030 }, { - "epoch": 0.9, - "learning_rate": 0.00016534345203346953, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.00023715787721165826, + "loss": 0.0195, "step": 83040 }, { - "epoch": 0.9, - "learning_rate": 0.00016532723616786665, - "loss": 0.011, + "epoch": 0.42, + "learning_rate": 0.00023715030951864427, + "loss": 0.0186, "step": 83050 }, { - "epoch": 0.9, - "learning_rate": 0.0001653110203022637, - "loss": 0.0095, + "epoch": 0.42, + "learning_rate": 0.00023714274182563025, + "loss": 0.0142, "step": 83060 }, { - "epoch": 0.9, - "learning_rate": 0.0001652948044366608, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.00023713517413261623, + "loss": 0.0178, "step": 83070 }, { - "epoch": 0.9, - "learning_rate": 0.00016527858857105792, - "loss": 0.0138, + "epoch": 0.42, + "learning_rate": 0.0002371276064396022, + "loss": 0.0168, "step": 83080 }, { - "epoch": 0.9, - "learning_rate": 0.00016526237270545502, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.00023712003874658822, + "loss": 0.0164, "step": 83090 }, { - "epoch": 0.9, - "learning_rate": 0.00016524615683985208, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.0002371124710535742, + "loss": 0.017, "step": 83100 }, { - "epoch": 0.9, - "learning_rate": 0.00016522994097424918, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.00023710490336056018, + "loss": 0.0191, "step": 83110 }, { - "epoch": 0.9, - "learning_rate": 0.0001652137251086463, - "loss": 0.0101, + "epoch": 0.42, + "learning_rate": 0.0002370973356675462, + "loss": 0.02, "step": 83120 }, { - "epoch": 0.9, - "learning_rate": 0.0001651975092430434, - "loss": 0.0125, + "epoch": 0.42, + "learning_rate": 0.00023708976797453217, + "loss": 0.0158, "step": 83130 }, { - "epoch": 0.9, - "learning_rate": 0.00016518129337744045, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.00023708220028151815, + "loss": 0.0154, "step": 83140 }, { - "epoch": 0.9, - "learning_rate": 0.00016516507751183757, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.00023707463258850416, + "loss": 0.0183, "step": 83150 }, { - "epoch": 0.9, - "learning_rate": 0.00016514886164623467, - "loss": 0.0102, + "epoch": 0.42, + "learning_rate": 0.00023706706489549014, + "loss": 0.0162, "step": 83160 }, { - "epoch": 0.9, - "learning_rate": 0.00016513264578063176, - "loss": 0.0135, + "epoch": 0.42, + "learning_rate": 0.00023705949720247613, + "loss": 0.0193, "step": 83170 }, { - "epoch": 0.9, - "learning_rate": 0.00016511642991502882, - "loss": 0.0153, + "epoch": 0.42, + "learning_rate": 0.00023705192950946213, + "loss": 0.0179, "step": 83180 }, { - "epoch": 0.9, - "learning_rate": 0.00016510021404942594, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023704436181644812, + "loss": 0.0192, "step": 83190 }, { - "epoch": 0.9, - "learning_rate": 0.00016508399818382304, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.0002370367941234341, + "loss": 0.0184, "step": 83200 }, { - "epoch": 0.9, - "learning_rate": 0.00016506778231822013, - "loss": 0.0151, + "epoch": 0.42, + "learning_rate": 0.0002370292264304201, + "loss": 0.0184, "step": 83210 }, { - "epoch": 0.9, - "learning_rate": 0.00016505156645261722, - "loss": 0.0149, + "epoch": 0.42, + "learning_rate": 0.0002370216587374061, + "loss": 0.016, "step": 83220 }, { - "epoch": 0.9, - "learning_rate": 0.00016503535058701432, - "loss": 0.0107, + "epoch": 0.42, + "learning_rate": 0.00023701409104439207, + "loss": 0.0147, "step": 83230 }, { - "epoch": 0.9, - "learning_rate": 0.0001650191347214114, - "loss": 0.0115, + "epoch": 0.42, + "learning_rate": 0.00023700652335137808, + "loss": 0.0153, "step": 83240 }, { - "epoch": 0.9, - "learning_rate": 0.00016500291885580853, - "loss": 0.0135, + "epoch": 0.42, + "learning_rate": 0.00023699895565836406, + "loss": 0.016, "step": 83250 }, { - "epoch": 0.9, - "learning_rate": 0.0001649867029902056, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023699138796535004, + "loss": 0.0157, "step": 83260 }, { - "epoch": 0.9, - "learning_rate": 0.0001649704871246027, - "loss": 0.0128, + "epoch": 0.42, + "learning_rate": 0.00023698382027233602, + "loss": 0.0171, "step": 83270 }, { - "epoch": 0.9, - "learning_rate": 0.00016495427125899978, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.00023697625257932203, + "loss": 0.0229, "step": 83280 }, { - "epoch": 0.9, - "learning_rate": 0.0001649380553933969, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.000236968684886308, + "loss": 0.0139, "step": 83290 }, { - "epoch": 0.9, - "learning_rate": 0.00016492183952779396, - "loss": 0.015, + "epoch": 0.42, + "learning_rate": 0.000236961117193294, + "loss": 0.0156, "step": 83300 }, { - "epoch": 0.9, - "learning_rate": 0.00016490562366219106, - "loss": 0.0123, + "epoch": 0.42, + "learning_rate": 0.00023695354950028, + "loss": 0.0161, "step": 83310 }, { - "epoch": 0.9, - "learning_rate": 0.00016488940779658818, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.00023694598180726598, + "loss": 0.0163, "step": 83320 }, { - "epoch": 0.9, - "learning_rate": 0.00016487319193098527, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023693841411425196, + "loss": 0.016, "step": 83330 }, { - "epoch": 0.9, - "learning_rate": 0.00016485697606538234, - "loss": 0.0149, + "epoch": 0.42, + "learning_rate": 0.00023693084642123797, + "loss": 0.0206, "step": 83340 }, { - "epoch": 0.9, - "learning_rate": 0.00016484076019977946, - "loss": 0.0104, + "epoch": 0.42, + "learning_rate": 0.00023692327872822395, + "loss": 0.0136, "step": 83350 }, { - "epoch": 0.9, - "learning_rate": 0.00016482454433417655, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.00023691571103520994, + "loss": 0.0184, "step": 83360 }, { - "epoch": 0.9, - "learning_rate": 0.00016480832846857364, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.00023690814334219594, + "loss": 0.0152, "step": 83370 }, { - "epoch": 0.9, - "learning_rate": 0.0001647921126029707, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.00023690057564918193, + "loss": 0.0183, "step": 83380 }, { - "epoch": 0.9, - "learning_rate": 0.00016477589673736783, - "loss": 0.0156, + "epoch": 0.42, + "learning_rate": 0.0002368930079561679, + "loss": 0.0157, "step": 83390 }, { - "epoch": 0.9, - "learning_rate": 0.00016475968087176492, - "loss": 0.0135, + "epoch": 0.42, + "learning_rate": 0.00023688544026315392, + "loss": 0.0207, "step": 83400 }, { - "epoch": 0.9, - "learning_rate": 0.000164743465006162, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.0002368778725701399, + "loss": 0.0177, "step": 83410 }, { - "epoch": 0.9, - "learning_rate": 0.0001647272491405591, - "loss": 0.0099, + "epoch": 0.42, + "learning_rate": 0.00023687030487712588, + "loss": 0.019, "step": 83420 }, { - "epoch": 0.9, - "learning_rate": 0.0001647110332749562, - "loss": 0.0143, + "epoch": 0.42, + "learning_rate": 0.00023686273718411186, + "loss": 0.0185, "step": 83430 }, { - "epoch": 0.9, - "learning_rate": 0.0001646948174093533, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.00023685516949109787, + "loss": 0.0183, "step": 83440 }, { - "epoch": 0.9, - "learning_rate": 0.0001646786015437504, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.00023684760179808385, + "loss": 0.0154, "step": 83450 }, { - "epoch": 0.9, - "learning_rate": 0.0001646623856781475, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.00023684003410506983, + "loss": 0.0177, "step": 83460 }, { - "epoch": 0.9, - "learning_rate": 0.00016464616981254457, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.00023683246641205584, + "loss": 0.0152, "step": 83470 }, { - "epoch": 0.9, - "learning_rate": 0.00016462995394694166, - "loss": 0.0146, + "epoch": 0.42, + "learning_rate": 0.00023682489871904182, + "loss": 0.0165, "step": 83480 }, { - "epoch": 0.9, - "learning_rate": 0.00016461373808133878, - "loss": 0.0152, + "epoch": 0.42, + "learning_rate": 0.0002368173310260278, + "loss": 0.0183, "step": 83490 }, { - "epoch": 0.9, - "learning_rate": 0.00016459752221573587, - "loss": 0.0165, + "epoch": 0.42, + "learning_rate": 0.0002368097633330138, + "loss": 0.0172, "step": 83500 }, { - "epoch": 0.9, - "learning_rate": 0.00016458130635013294, - "loss": 0.0151, + "epoch": 0.42, + "learning_rate": 0.0002368021956399998, + "loss": 0.0186, "step": 83510 }, { - "epoch": 0.9, - "learning_rate": 0.00016456509048453006, - "loss": 0.0157, + "epoch": 0.42, + "learning_rate": 0.00023679462794698577, + "loss": 0.0145, "step": 83520 }, { - "epoch": 0.9, - "learning_rate": 0.00016454887461892715, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.00023678706025397178, + "loss": 0.0164, "step": 83530 }, { - "epoch": 0.9, - "learning_rate": 0.00016453265875332425, - "loss": 0.0122, + "epoch": 0.42, + "learning_rate": 0.00023677949256095776, + "loss": 0.0151, "step": 83540 }, { - "epoch": 0.9, - "learning_rate": 0.0001645164428877213, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.00023677192486794375, + "loss": 0.0167, "step": 83550 }, { - "epoch": 0.9, - "learning_rate": 0.00016450022702211843, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.00023676435717492975, + "loss": 0.0142, "step": 83560 }, { - "epoch": 0.9, - "learning_rate": 0.00016448401115651552, - "loss": 0.0138, + "epoch": 0.42, + "learning_rate": 0.00023675678948191574, + "loss": 0.0206, "step": 83570 }, { - "epoch": 0.9, - "learning_rate": 0.00016446779529091262, - "loss": 0.0126, + "epoch": 0.42, + "learning_rate": 0.00023674922178890172, + "loss": 0.022, "step": 83580 }, { - "epoch": 0.9, - "learning_rate": 0.0001644515794253097, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.00023674165409588767, + "loss": 0.0183, "step": 83590 }, { - "epoch": 0.9, - "learning_rate": 0.0001644353635597068, - "loss": 0.0121, + "epoch": 0.42, + "learning_rate": 0.00023673408640287368, + "loss": 0.035, "step": 83600 }, { - "epoch": 0.9, - "learning_rate": 0.0001644191476941039, - "loss": 0.0126, + "epoch": 0.42, + "learning_rate": 0.00023672651870985966, + "loss": 0.0205, "step": 83610 }, { - "epoch": 0.9, - "learning_rate": 0.00016440293182850101, - "loss": 0.014, + "epoch": 0.42, + "learning_rate": 0.00023671895101684564, + "loss": 0.0173, "step": 83620 }, { - "epoch": 0.9, - "learning_rate": 0.00016438671596289808, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.00023671138332383165, + "loss": 0.018, "step": 83630 }, { - "epoch": 0.9, - "learning_rate": 0.00016437050009729517, - "loss": 0.0177, + "epoch": 0.42, + "learning_rate": 0.00023670381563081763, + "loss": 0.016, "step": 83640 }, { - "epoch": 0.9, - "learning_rate": 0.0001643542842316923, - "loss": 0.0172, + "epoch": 0.42, + "learning_rate": 0.00023669624793780361, + "loss": 0.0148, "step": 83650 }, { - "epoch": 0.9, - "learning_rate": 0.00016433806836608939, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.0002366886802447896, + "loss": 0.0175, "step": 83660 }, { - "epoch": 0.9, - "learning_rate": 0.00016432185250048645, - "loss": 0.0115, + "epoch": 0.42, + "learning_rate": 0.0002366811125517756, + "loss": 0.0166, "step": 83670 }, { - "epoch": 0.9, - "learning_rate": 0.00016430563663488354, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.00023667354485876159, + "loss": 0.0138, "step": 83680 }, { - "epoch": 0.9, - "learning_rate": 0.00016428942076928066, - "loss": 0.0153, + "epoch": 0.42, + "learning_rate": 0.00023666597716574757, + "loss": 0.0194, "step": 83690 }, { - "epoch": 0.9, - "learning_rate": 0.00016427320490367776, - "loss": 0.0156, + "epoch": 0.42, + "learning_rate": 0.00023665840947273358, + "loss": 0.016, "step": 83700 }, { - "epoch": 0.9, - "learning_rate": 0.00016425698903807482, - "loss": 0.0117, + "epoch": 0.42, + "learning_rate": 0.00023665084177971956, + "loss": 0.0191, "step": 83710 }, { - "epoch": 0.91, - "learning_rate": 0.00016424077317247194, - "loss": 0.0128, + "epoch": 0.42, + "learning_rate": 0.00023664327408670554, + "loss": 0.0181, "step": 83720 }, { - "epoch": 0.91, - "learning_rate": 0.00016422455730686903, - "loss": 0.0163, + "epoch": 0.42, + "learning_rate": 0.00023663570639369155, + "loss": 0.0185, "step": 83730 }, { - "epoch": 0.91, - "learning_rate": 0.00016420834144126613, - "loss": 0.0128, + "epoch": 0.42, + "learning_rate": 0.00023662813870067753, + "loss": 0.0172, "step": 83740 }, { - "epoch": 0.91, - "learning_rate": 0.0001641921255756632, - "loss": 0.0117, + "epoch": 0.42, + "learning_rate": 0.0002366205710076635, + "loss": 0.0171, "step": 83750 }, { - "epoch": 0.91, - "learning_rate": 0.0001641759097100603, - "loss": 0.0128, + "epoch": 0.42, + "learning_rate": 0.00023661300331464952, + "loss": 0.0184, "step": 83760 }, { - "epoch": 0.91, - "learning_rate": 0.0001641596938444574, - "loss": 0.0121, + "epoch": 0.42, + "learning_rate": 0.0002366054356216355, + "loss": 0.0223, "step": 83770 }, { - "epoch": 0.91, - "learning_rate": 0.0001641434779788545, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.00023659786792862148, + "loss": 0.0146, "step": 83780 }, { - "epoch": 0.91, - "learning_rate": 0.0001641272621132516, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.0002365903002356075, + "loss": 0.018, "step": 83790 }, { - "epoch": 0.91, - "learning_rate": 0.00016411104624764868, - "loss": 0.0178, + "epoch": 0.42, + "learning_rate": 0.00023658273254259347, + "loss": 0.0158, "step": 83800 }, { - "epoch": 0.91, - "learning_rate": 0.00016409483038204578, - "loss": 0.0135, + "epoch": 0.42, + "learning_rate": 0.00023657516484957945, + "loss": 0.0166, "step": 83810 }, { - "epoch": 0.91, - "learning_rate": 0.0001640786145164429, - "loss": 0.0183, + "epoch": 0.42, + "learning_rate": 0.00023656759715656543, + "loss": 0.0176, "step": 83820 }, { - "epoch": 0.91, - "learning_rate": 0.00016406239865083996, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023656002946355144, + "loss": 0.0176, "step": 83830 }, { - "epoch": 0.91, - "learning_rate": 0.00016404618278523705, - "loss": 0.0123, + "epoch": 0.42, + "learning_rate": 0.00023655246177053742, + "loss": 0.0173, "step": 83840 }, { - "epoch": 0.91, - "learning_rate": 0.00016402996691963415, - "loss": 0.0147, + "epoch": 0.42, + "learning_rate": 0.0002365448940775234, + "loss": 0.0143, "step": 83850 }, { - "epoch": 0.91, - "learning_rate": 0.00016401375105403127, - "loss": 0.0147, + "epoch": 0.42, + "learning_rate": 0.00023653732638450941, + "loss": 0.0168, "step": 83860 }, { - "epoch": 0.91, - "learning_rate": 0.00016399753518842833, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.0002365297586914954, + "loss": 0.0139, "step": 83870 }, { - "epoch": 0.91, - "learning_rate": 0.00016398131932282543, - "loss": 0.0143, + "epoch": 0.42, + "learning_rate": 0.00023652219099848138, + "loss": 0.0139, "step": 83880 }, { - "epoch": 0.91, - "learning_rate": 0.00016396510345722255, - "loss": 0.0132, + "epoch": 0.42, + "learning_rate": 0.00023651462330546739, + "loss": 0.019, "step": 83890 }, { - "epoch": 0.91, - "learning_rate": 0.00016394888759161964, - "loss": 0.0125, + "epoch": 0.42, + "learning_rate": 0.00023650705561245337, + "loss": 0.0175, "step": 83900 }, { - "epoch": 0.91, - "learning_rate": 0.0001639326717260167, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.00023649948791943935, + "loss": 0.0185, "step": 83910 }, { - "epoch": 0.91, - "learning_rate": 0.0001639164558604138, - "loss": 0.0164, + "epoch": 0.42, + "learning_rate": 0.00023649192022642536, + "loss": 0.0187, "step": 83920 }, { - "epoch": 0.91, - "learning_rate": 0.00016390023999481092, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.00023648435253341134, + "loss": 0.0206, "step": 83930 }, { - "epoch": 0.91, - "learning_rate": 0.000163884024129208, - "loss": 0.0126, + "epoch": 0.42, + "learning_rate": 0.00023647678484039732, + "loss": 0.0166, "step": 83940 }, { - "epoch": 0.91, - "learning_rate": 0.00016386780826360507, - "loss": 0.0171, + "epoch": 0.42, + "learning_rate": 0.00023646921714738333, + "loss": 0.0219, "step": 83950 }, { - "epoch": 0.91, - "learning_rate": 0.0001638515923980022, - "loss": 0.0098, + "epoch": 0.42, + "learning_rate": 0.0002364616494543693, + "loss": 0.0189, "step": 83960 }, { - "epoch": 0.91, - "learning_rate": 0.0001638353765323993, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.0002364540817613553, + "loss": 0.02, "step": 83970 }, { - "epoch": 0.91, - "learning_rate": 0.00016381916066679638, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.00023644651406834127, + "loss": 0.02, "step": 83980 }, { - "epoch": 0.91, - "learning_rate": 0.00016380294480119345, - "loss": 0.0156, + "epoch": 0.42, + "learning_rate": 0.00023643894637532728, + "loss": 0.0191, "step": 83990 }, { - "epoch": 0.91, - "learning_rate": 0.00016378672893559057, - "loss": 0.0125, + "epoch": 0.42, + "learning_rate": 0.00023643137868231326, + "loss": 0.0162, "step": 84000 }, { - "epoch": 0.91, - "eval_cer": 0.9215373577445508, - "eval_loss": 0.009720318019390106, - "eval_runtime": 121.0619, - "eval_samples_per_second": 16.52, - "eval_steps_per_second": 4.13, + "epoch": 0.42, + "eval_cer": 0.9144935454101719, + "eval_loss": 0.012893411330878735, + "eval_runtime": 116.7828, + "eval_samples_per_second": 17.126, + "eval_steps_per_second": 4.281, "step": 84000 }, { - "epoch": 0.91, - "learning_rate": 0.00016377051306998766, - "loss": 0.0153, + "epoch": 0.42, + "learning_rate": 0.00023642381098929924, + "loss": 0.0194, "step": 84010 }, { - "epoch": 0.91, - "learning_rate": 0.00016375429720438478, - "loss": 0.0099, + "epoch": 0.42, + "learning_rate": 0.00023641624329628525, + "loss": 0.0205, "step": 84020 }, { - "epoch": 0.91, - "learning_rate": 0.00016373808133878184, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.00023640867560327123, + "loss": 0.0171, "step": 84030 }, { - "epoch": 0.91, - "learning_rate": 0.00016372186547317894, - "loss": 0.0132, + "epoch": 0.42, + "learning_rate": 0.00023640110791025722, + "loss": 0.0153, "step": 84040 }, { - "epoch": 0.91, - "learning_rate": 0.00016370564960757603, - "loss": 0.0151, + "epoch": 0.42, + "learning_rate": 0.00023639354021724322, + "loss": 0.0116, "step": 84050 }, { - "epoch": 0.91, - "learning_rate": 0.00016368943374197315, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.0002363859725242292, + "loss": 0.0176, "step": 84060 }, { - "epoch": 0.91, - "learning_rate": 0.00016367321787637021, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.0002363784048312152, + "loss": 0.0144, "step": 84070 }, { - "epoch": 0.91, - "learning_rate": 0.0001636570020107673, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.0002363708371382012, + "loss": 0.0176, "step": 84080 }, { - "epoch": 0.91, - "learning_rate": 0.00016364078614516443, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.00023636326944518718, + "loss": 0.0194, "step": 84090 }, { - "epoch": 0.91, - "learning_rate": 0.00016362457027956152, - "loss": 0.0146, + "epoch": 0.42, + "learning_rate": 0.00023635570175217316, + "loss": 0.0176, "step": 84100 }, { - "epoch": 0.91, - "learning_rate": 0.00016360835441395859, - "loss": 0.0146, + "epoch": 0.42, + "learning_rate": 0.00023634813405915917, + "loss": 0.0159, "step": 84110 }, { - "epoch": 0.91, - "learning_rate": 0.00016359213854835568, - "loss": 0.0148, + "epoch": 0.42, + "learning_rate": 0.00023634056636614515, + "loss": 0.0232, "step": 84120 }, { - "epoch": 0.91, - "learning_rate": 0.0001635759226827528, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.00023633299867313113, + "loss": 0.019, "step": 84130 }, { - "epoch": 0.91, - "learning_rate": 0.0001635597068171499, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.00023632543098011714, + "loss": 0.0165, "step": 84140 }, { - "epoch": 0.91, - "learning_rate": 0.00016354349095154696, - "loss": 0.0117, + "epoch": 0.42, + "learning_rate": 0.00023631786328710312, + "loss": 0.0165, "step": 84150 }, { - "epoch": 0.91, - "learning_rate": 0.00016352727508594408, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.0002363102955940891, + "loss": 0.0164, "step": 84160 }, { - "epoch": 0.91, - "learning_rate": 0.00016351105922034117, - "loss": 0.0125, + "epoch": 0.42, + "learning_rate": 0.00023630272790107508, + "loss": 0.0176, "step": 84170 }, { - "epoch": 0.91, - "learning_rate": 0.00016349484335473826, - "loss": 0.0141, + "epoch": 0.42, + "learning_rate": 0.0002362951602080611, + "loss": 0.0169, "step": 84180 }, { - "epoch": 0.91, - "learning_rate": 0.00016347862748913538, - "loss": 0.0155, + "epoch": 0.42, + "learning_rate": 0.00023628759251504707, + "loss": 0.015, "step": 84190 }, { - "epoch": 0.91, - "learning_rate": 0.00016346241162353245, - "loss": 0.0107, + "epoch": 0.42, + "learning_rate": 0.00023628002482203305, + "loss": 0.0201, "step": 84200 }, { - "epoch": 0.91, - "learning_rate": 0.00016344619575792954, - "loss": 0.015, + "epoch": 0.42, + "learning_rate": 0.00023627245712901906, + "loss": 0.0176, "step": 84210 }, { - "epoch": 0.91, - "learning_rate": 0.00016342997989232663, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023626488943600504, + "loss": 0.0152, "step": 84220 }, { - "epoch": 0.91, - "learning_rate": 0.00016341376402672375, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.00023625732174299103, + "loss": 0.0144, "step": 84230 }, { - "epoch": 0.91, - "learning_rate": 0.00016339754816112082, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.00023624975404997703, + "loss": 0.0189, "step": 84240 }, { - "epoch": 0.91, - "learning_rate": 0.0001633813322955179, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.00023624218635696302, + "loss": 0.0212, "step": 84250 }, { - "epoch": 0.91, - "learning_rate": 0.00016336511642991503, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.000236234618663949, + "loss": 0.0167, "step": 84260 }, { - "epoch": 0.91, - "learning_rate": 0.00016334890056431212, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.000236227050970935, + "loss": 0.0186, "step": 84270 }, { - "epoch": 0.91, - "learning_rate": 0.0001633326846987092, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.000236219483277921, + "loss": 0.016, "step": 84280 }, { - "epoch": 0.91, - "learning_rate": 0.00016331646883310628, - "loss": 0.0102, + "epoch": 0.43, + "learning_rate": 0.00023621191558490697, + "loss": 0.0168, "step": 84290 }, { - "epoch": 0.91, - "learning_rate": 0.0001633002529675034, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023620434789189298, + "loss": 0.0152, "step": 84300 }, { - "epoch": 0.91, - "learning_rate": 0.0001632840371019005, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023619678019887896, + "loss": 0.0189, "step": 84310 }, { - "epoch": 0.91, - "learning_rate": 0.00016326782123629756, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023618921250586494, + "loss": 0.0158, "step": 84320 }, { - "epoch": 0.91, - "learning_rate": 0.00016325160537069468, - "loss": 0.0126, + "epoch": 0.43, + "learning_rate": 0.00023618164481285092, + "loss": 0.0188, "step": 84330 }, { - "epoch": 0.91, - "learning_rate": 0.00016323538950509177, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023617407711983693, + "loss": 0.0146, "step": 84340 }, { - "epoch": 0.91, - "learning_rate": 0.00016321917363948887, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.0002361665094268229, + "loss": 0.0139, "step": 84350 }, { - "epoch": 0.91, - "learning_rate": 0.00016320295777388596, - "loss": 0.0101, + "epoch": 0.43, + "learning_rate": 0.0002361589417338089, + "loss": 0.0151, "step": 84360 }, { - "epoch": 0.91, - "learning_rate": 0.00016318674190828305, - "loss": 0.0134, + "epoch": 0.43, + "learning_rate": 0.0002361513740407949, + "loss": 0.0148, "step": 84370 }, { - "epoch": 0.91, - "learning_rate": 0.00016317052604268014, - "loss": 0.0099, + "epoch": 0.43, + "learning_rate": 0.00023614380634778088, + "loss": 0.0184, "step": 84380 }, { - "epoch": 0.91, - "learning_rate": 0.00016315431017707726, - "loss": 0.0137, + "epoch": 0.43, + "learning_rate": 0.00023613623865476686, + "loss": 0.0186, "step": 84390 }, { - "epoch": 0.91, - "learning_rate": 0.00016313809431147433, - "loss": 0.0144, + "epoch": 0.43, + "learning_rate": 0.00023612867096175287, + "loss": 0.017, "step": 84400 }, { - "epoch": 0.91, - "learning_rate": 0.00016312187844587142, - "loss": 0.0135, + "epoch": 0.43, + "learning_rate": 0.00023612110326873885, + "loss": 0.0207, "step": 84410 }, { - "epoch": 0.91, - "learning_rate": 0.00016310566258026851, - "loss": 0.0108, + "epoch": 0.43, + "learning_rate": 0.00023611353557572484, + "loss": 0.018, "step": 84420 }, { - "epoch": 0.91, - "learning_rate": 0.00016308944671466563, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.00023610596788271084, + "loss": 0.0179, "step": 84430 }, { - "epoch": 0.91, - "learning_rate": 0.0001630732308490627, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023609840018969683, + "loss": 0.0189, "step": 84440 }, { - "epoch": 0.91, - "learning_rate": 0.0001630570149834598, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.0002360908324966828, + "loss": 0.0164, "step": 84450 }, { - "epoch": 0.91, - "learning_rate": 0.0001630407991178569, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.00023608326480366882, + "loss": 0.021, "step": 84460 }, { - "epoch": 0.91, - "learning_rate": 0.000163024583252254, - "loss": 0.0117, + "epoch": 0.43, + "learning_rate": 0.0002360756971106548, + "loss": 0.0167, "step": 84470 }, { - "epoch": 0.91, - "learning_rate": 0.00016300836738665107, - "loss": 0.0146, + "epoch": 0.43, + "learning_rate": 0.00023606812941764078, + "loss": 0.0172, "step": 84480 }, { - "epoch": 0.91, - "learning_rate": 0.00016299215152104816, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.00023606056172462676, + "loss": 0.0172, "step": 84490 }, { - "epoch": 0.91, - "learning_rate": 0.00016297593565544528, - "loss": 0.0125, + "epoch": 0.43, + "learning_rate": 0.00023605299403161277, + "loss": 0.0175, "step": 84500 }, { - "epoch": 0.91, - "learning_rate": 0.00016295971978984238, - "loss": 0.0126, + "epoch": 0.43, + "learning_rate": 0.00023604542633859875, + "loss": 0.0187, "step": 84510 }, { - "epoch": 0.91, - "learning_rate": 0.00016294350392423944, - "loss": 0.0132, + "epoch": 0.43, + "learning_rate": 0.00023603785864558473, + "loss": 0.015, "step": 84520 }, { - "epoch": 0.91, - "learning_rate": 0.00016292728805863656, - "loss": 0.0111, + "epoch": 0.43, + "learning_rate": 0.00023603029095257074, + "loss": 0.0154, "step": 84530 }, { - "epoch": 0.91, - "learning_rate": 0.00016291107219303365, - "loss": 0.0151, + "epoch": 0.43, + "learning_rate": 0.00023602272325955672, + "loss": 0.0154, "step": 84540 }, { - "epoch": 0.91, - "learning_rate": 0.00016289485632743075, - "loss": 0.0128, + "epoch": 0.43, + "learning_rate": 0.0002360151555665427, + "loss": 0.0156, "step": 84550 }, { - "epoch": 0.91, - "learning_rate": 0.0001628786404618278, - "loss": 0.0141, + "epoch": 0.43, + "learning_rate": 0.0002360075878735287, + "loss": 0.0186, "step": 84560 }, { - "epoch": 0.91, - "learning_rate": 0.00016286242459622493, - "loss": 0.0117, + "epoch": 0.43, + "learning_rate": 0.0002360000201805147, + "loss": 0.0154, "step": 84570 }, { - "epoch": 0.91, - "learning_rate": 0.00016284620873062203, - "loss": 0.0183, + "epoch": 0.43, + "learning_rate": 0.00023599245248750067, + "loss": 0.0162, "step": 84580 }, { - "epoch": 0.91, - "learning_rate": 0.00016282999286501912, - "loss": 0.0167, + "epoch": 0.43, + "learning_rate": 0.00023598488479448668, + "loss": 0.0142, "step": 84590 }, { - "epoch": 0.91, - "learning_rate": 0.0001628137769994162, - "loss": 0.0134, + "epoch": 0.43, + "learning_rate": 0.00023597731710147266, + "loss": 0.0206, "step": 84600 }, { - "epoch": 0.91, - "learning_rate": 0.0001627975611338133, - "loss": 0.0132, + "epoch": 0.43, + "learning_rate": 0.00023596974940845865, + "loss": 0.0174, "step": 84610 }, { - "epoch": 0.91, - "learning_rate": 0.0001627813452682104, - "loss": 0.0127, + "epoch": 0.43, + "learning_rate": 0.00023596218171544465, + "loss": 0.0177, "step": 84620 }, { - "epoch": 0.91, - "learning_rate": 0.00016276512940260752, - "loss": 0.0134, + "epoch": 0.43, + "learning_rate": 0.00023595461402243064, + "loss": 0.0167, "step": 84630 }, { - "epoch": 0.92, - "learning_rate": 0.00016274891353700458, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.00023594704632941662, + "loss": 0.017, "step": 84640 }, { - "epoch": 0.92, - "learning_rate": 0.00016273269767140168, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.00023593947863640263, + "loss": 0.0201, "step": 84650 }, { - "epoch": 0.92, - "learning_rate": 0.0001627164818057988, - "loss": 0.0142, + "epoch": 0.43, + "learning_rate": 0.0002359319109433886, + "loss": 0.0167, "step": 84660 }, { - "epoch": 0.92, - "learning_rate": 0.0001627002659401959, - "loss": 0.0099, + "epoch": 0.43, + "learning_rate": 0.0002359243432503746, + "loss": 0.018, "step": 84670 }, { - "epoch": 0.92, - "learning_rate": 0.00016268405007459295, - "loss": 0.0153, + "epoch": 0.43, + "learning_rate": 0.00023591677555736057, + "loss": 0.0173, "step": 84680 }, { - "epoch": 0.92, - "learning_rate": 0.00016266783420899005, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023590920786434658, + "loss": 0.0158, "step": 84690 }, { - "epoch": 0.92, - "learning_rate": 0.00016265161834338717, - "loss": 0.0126, + "epoch": 0.43, + "learning_rate": 0.00023590164017133256, + "loss": 0.0185, "step": 84700 }, { - "epoch": 0.92, - "learning_rate": 0.00016263540247778426, - "loss": 0.015, + "epoch": 0.43, + "learning_rate": 0.00023589407247831854, + "loss": 0.0172, "step": 84710 }, { - "epoch": 0.92, - "learning_rate": 0.00016261918661218132, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.00023588650478530455, + "loss": 0.0194, "step": 84720 }, { - "epoch": 0.92, - "learning_rate": 0.00016260297074657844, - "loss": 0.0143, + "epoch": 0.43, + "learning_rate": 0.00023587893709229053, + "loss": 0.0151, "step": 84730 }, { - "epoch": 0.92, - "learning_rate": 0.00016258675488097554, - "loss": 0.014, + "epoch": 0.43, + "learning_rate": 0.0002358713693992765, + "loss": 0.0136, "step": 84740 }, { - "epoch": 0.92, - "learning_rate": 0.00016257053901537263, - "loss": 0.011, + "epoch": 0.43, + "learning_rate": 0.00023586380170626252, + "loss": 0.015, "step": 84750 }, { - "epoch": 0.92, - "learning_rate": 0.0001625543231497697, - "loss": 0.0159, + "epoch": 0.43, + "learning_rate": 0.0002358562340132485, + "loss": 0.0193, "step": 84760 }, { - "epoch": 0.92, - "learning_rate": 0.00016253810728416682, - "loss": 0.0104, + "epoch": 0.43, + "learning_rate": 0.00023584866632023448, + "loss": 0.0174, "step": 84770 }, { - "epoch": 0.92, - "learning_rate": 0.0001625218914185639, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.0002358410986272205, + "loss": 0.0197, "step": 84780 }, { - "epoch": 0.92, - "learning_rate": 0.000162505675552961, - "loss": 0.0111, + "epoch": 0.43, + "learning_rate": 0.00023583353093420647, + "loss": 0.0195, "step": 84790 }, { - "epoch": 0.92, - "learning_rate": 0.0001624894596873581, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023582596324119246, + "loss": 0.0194, "step": 84800 }, { - "epoch": 0.92, - "learning_rate": 0.00016247324382175519, - "loss": 0.0124, + "epoch": 0.43, + "learning_rate": 0.00023581839554817846, + "loss": 0.0161, "step": 84810 }, { - "epoch": 0.92, - "learning_rate": 0.00016245702795615228, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023581082785516445, + "loss": 0.0177, "step": 84820 }, { - "epoch": 0.92, - "learning_rate": 0.0001624408120905494, - "loss": 0.0109, + "epoch": 0.43, + "learning_rate": 0.00023580326016215043, + "loss": 0.0206, "step": 84830 }, { - "epoch": 0.92, - "learning_rate": 0.00016242459622494646, - "loss": 0.011, + "epoch": 0.43, + "learning_rate": 0.00023579569246913638, + "loss": 0.0149, "step": 84840 }, { - "epoch": 0.92, - "learning_rate": 0.00016240838035934356, - "loss": 0.0155, + "epoch": 0.43, + "learning_rate": 0.0002357881247761224, + "loss": 0.0203, "step": 84850 }, { - "epoch": 0.92, - "learning_rate": 0.00016239216449374065, - "loss": 0.0159, + "epoch": 0.43, + "learning_rate": 0.00023578055708310837, + "loss": 0.018, "step": 84860 }, { - "epoch": 0.92, - "learning_rate": 0.00016237594862813777, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023577298939009435, + "loss": 0.0154, "step": 84870 }, { - "epoch": 0.92, - "learning_rate": 0.00016235973276253486, - "loss": 0.0111, + "epoch": 0.43, + "learning_rate": 0.00023576542169708033, + "loss": 0.0179, "step": 84880 }, { - "epoch": 0.92, - "learning_rate": 0.00016234351689693193, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023575785400406634, + "loss": 0.0173, "step": 84890 }, { - "epoch": 0.92, - "learning_rate": 0.00016232730103132905, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.00023575028631105232, + "loss": 0.0165, "step": 84900 }, { - "epoch": 0.92, - "learning_rate": 0.00016231108516572614, - "loss": 0.0139, + "epoch": 0.43, + "learning_rate": 0.0002357427186180383, + "loss": 0.0219, "step": 84910 }, { - "epoch": 0.92, - "learning_rate": 0.00016229486930012323, - "loss": 0.0136, + "epoch": 0.43, + "learning_rate": 0.00023573515092502431, + "loss": 0.0202, "step": 84920 }, { - "epoch": 0.92, - "learning_rate": 0.0001622786534345203, - "loss": 0.0127, + "epoch": 0.43, + "learning_rate": 0.0002357275832320103, + "loss": 0.0185, "step": 84930 }, { - "epoch": 0.92, - "learning_rate": 0.00016226243756891742, - "loss": 0.015, + "epoch": 0.43, + "learning_rate": 0.00023572001553899628, + "loss": 0.0187, "step": 84940 }, { - "epoch": 0.92, - "learning_rate": 0.0001622462217033145, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.00023571244784598229, + "loss": 0.0163, "step": 84950 }, { - "epoch": 0.92, - "learning_rate": 0.00016223000583771163, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.00023570488015296827, + "loss": 0.0191, "step": 84960 }, { - "epoch": 0.92, - "learning_rate": 0.0001622137899721087, - "loss": 0.017, + "epoch": 0.43, + "learning_rate": 0.00023569731245995425, + "loss": 0.0154, "step": 84970 }, { - "epoch": 0.92, - "learning_rate": 0.0001621975741065058, - "loss": 0.0132, + "epoch": 0.43, + "learning_rate": 0.00023568974476694026, + "loss": 0.0209, "step": 84980 }, { - "epoch": 0.92, - "learning_rate": 0.00016218135824090288, - "loss": 0.014, + "epoch": 0.43, + "learning_rate": 0.00023568217707392624, + "loss": 0.0169, "step": 84990 }, { - "epoch": 0.92, - "learning_rate": 0.0001621651423753, - "loss": 0.0147, + "epoch": 0.43, + "learning_rate": 0.00023567460938091222, + "loss": 0.014, "step": 85000 }, { - "epoch": 0.92, - "eval_cer": 0.9215269345090743, - "eval_loss": 0.00925032515078783, - "eval_runtime": 121.1422, - "eval_samples_per_second": 16.51, - "eval_steps_per_second": 4.127, + "epoch": 0.43, + "eval_cer": 0.9145236276900593, + "eval_loss": 0.01236006710678339, + "eval_runtime": 116.6924, + "eval_samples_per_second": 17.139, + "eval_steps_per_second": 4.285, "step": 85000 }, { - "epoch": 0.92, - "learning_rate": 0.00016214892650969707, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023566704168789823, + "loss": 0.0166, "step": 85010 }, { - "epoch": 0.92, - "learning_rate": 0.00016213271064409416, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.0002356594739948842, + "loss": 0.0159, "step": 85020 }, { - "epoch": 0.92, - "learning_rate": 0.00016211649477849128, - "loss": 0.0136, + "epoch": 0.43, + "learning_rate": 0.0002356519063018702, + "loss": 0.0167, "step": 85030 }, { - "epoch": 0.92, - "learning_rate": 0.00016210027891288837, - "loss": 0.0139, + "epoch": 0.43, + "learning_rate": 0.0002356443386088562, + "loss": 0.0184, "step": 85040 }, { - "epoch": 0.92, - "learning_rate": 0.00016208406304728544, - "loss": 0.0082, + "epoch": 0.43, + "learning_rate": 0.00023563677091584218, + "loss": 0.0172, "step": 85050 }, { - "epoch": 0.92, - "learning_rate": 0.00016206784718168253, - "loss": 0.0157, + "epoch": 0.43, + "learning_rate": 0.00023562920322282816, + "loss": 0.0181, "step": 85060 }, { - "epoch": 0.92, - "learning_rate": 0.00016205163131607965, - "loss": 0.0154, + "epoch": 0.43, + "learning_rate": 0.00023562163552981414, + "loss": 0.0162, "step": 85070 }, { - "epoch": 0.92, - "learning_rate": 0.00016203541545047674, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.00023561406783680015, + "loss": 0.0224, "step": 85080 }, { - "epoch": 0.92, - "learning_rate": 0.0001620191995848738, - "loss": 0.0144, + "epoch": 0.43, + "learning_rate": 0.00023560650014378613, + "loss": 0.0173, "step": 85090 }, { - "epoch": 0.92, - "learning_rate": 0.00016200298371927093, - "loss": 0.0145, + "epoch": 0.43, + "learning_rate": 0.00023559893245077212, + "loss": 0.0159, "step": 85100 }, { - "epoch": 0.92, - "learning_rate": 0.00016198676785366802, - "loss": 0.0139, + "epoch": 0.43, + "learning_rate": 0.00023559136475775812, + "loss": 0.017, "step": 85110 }, { - "epoch": 0.92, - "learning_rate": 0.00016197055198806512, - "loss": 0.0146, + "epoch": 0.43, + "learning_rate": 0.0002355837970647441, + "loss": 0.0232, "step": 85120 }, { - "epoch": 0.92, - "learning_rate": 0.00016195433612246218, - "loss": 0.0137, + "epoch": 0.43, + "learning_rate": 0.0002355762293717301, + "loss": 0.0168, "step": 85130 }, { - "epoch": 0.92, - "learning_rate": 0.0001619381202568593, - "loss": 0.0125, + "epoch": 0.43, + "learning_rate": 0.0002355686616787161, + "loss": 0.0187, "step": 85140 }, { - "epoch": 0.92, - "learning_rate": 0.0001619219043912564, - "loss": 0.0102, + "epoch": 0.43, + "learning_rate": 0.00023556109398570208, + "loss": 0.0213, "step": 85150 }, { - "epoch": 0.92, - "learning_rate": 0.00016190568852565349, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023555352629268806, + "loss": 0.0174, "step": 85160 }, { - "epoch": 0.92, - "learning_rate": 0.00016188947266005058, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023554595859967407, + "loss": 0.0183, "step": 85170 }, { - "epoch": 0.92, - "learning_rate": 0.00016187325679444767, - "loss": 0.0133, + "epoch": 0.43, + "learning_rate": 0.00023553839090666005, + "loss": 0.0219, "step": 85180 }, { - "epoch": 0.92, - "learning_rate": 0.00016185704092884476, - "loss": 0.0154, + "epoch": 0.43, + "learning_rate": 0.00023553082321364603, + "loss": 0.0171, "step": 85190 }, { - "epoch": 0.92, - "learning_rate": 0.00016184082506324188, - "loss": 0.0229, + "epoch": 0.43, + "learning_rate": 0.00023552325552063204, + "loss": 0.0119, "step": 85200 }, { - "epoch": 0.92, - "learning_rate": 0.00016182460919763895, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023551568782761802, + "loss": 0.0162, "step": 85210 }, { - "epoch": 0.92, - "learning_rate": 0.00016180839333203604, - "loss": 0.0111, + "epoch": 0.43, + "learning_rate": 0.000235508120134604, + "loss": 0.0229, "step": 85220 }, { - "epoch": 0.92, - "learning_rate": 0.00016179217746643314, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023550055244158998, + "loss": 0.0165, "step": 85230 }, { - "epoch": 0.92, - "learning_rate": 0.00016177596160083026, - "loss": 0.0127, + "epoch": 0.43, + "learning_rate": 0.000235492984748576, + "loss": 0.0147, "step": 85240 }, { - "epoch": 0.92, - "learning_rate": 0.00016175974573522732, - "loss": 0.0139, + "epoch": 0.43, + "learning_rate": 0.00023548541705556197, + "loss": 0.0177, "step": 85250 }, { - "epoch": 0.92, - "learning_rate": 0.00016174352986962441, - "loss": 0.0109, + "epoch": 0.43, + "learning_rate": 0.00023547784936254795, + "loss": 0.0179, "step": 85260 }, { - "epoch": 0.92, - "learning_rate": 0.00016172731400402153, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023547028166953396, + "loss": 0.0185, "step": 85270 }, { - "epoch": 0.92, - "learning_rate": 0.00016171109813841863, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023546271397651994, + "loss": 0.0192, "step": 85280 }, { - "epoch": 0.92, - "learning_rate": 0.0001616948822728157, - "loss": 0.0141, + "epoch": 0.43, + "learning_rate": 0.00023545514628350593, + "loss": 0.0205, "step": 85290 }, { - "epoch": 0.92, - "learning_rate": 0.00016167866640721278, - "loss": 0.0098, + "epoch": 0.43, + "learning_rate": 0.00023544757859049193, + "loss": 0.0212, "step": 85300 }, { - "epoch": 0.92, - "learning_rate": 0.0001616624505416099, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023544001089747792, + "loss": 0.0166, "step": 85310 }, { - "epoch": 0.92, - "learning_rate": 0.000161646234676007, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.0002354324432044639, + "loss": 0.016, "step": 85320 }, { - "epoch": 0.92, - "learning_rate": 0.00016163001881040406, - "loss": 0.0102, + "epoch": 0.43, + "learning_rate": 0.0002354248755114499, + "loss": 0.0301, "step": 85330 }, { - "epoch": 0.92, - "learning_rate": 0.00016161380294480118, - "loss": 0.0145, + "epoch": 0.43, + "learning_rate": 0.0002354173078184359, + "loss": 0.0199, "step": 85340 }, { - "epoch": 0.92, - "learning_rate": 0.00016159758707919828, - "loss": 0.0132, + "epoch": 0.43, + "learning_rate": 0.00023540974012542187, + "loss": 0.0149, "step": 85350 }, { - "epoch": 0.92, - "learning_rate": 0.00016158137121359537, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.00023540217243240788, + "loss": 0.0169, "step": 85360 }, { - "epoch": 0.92, - "learning_rate": 0.00016156515534799246, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023539460473939386, + "loss": 0.0229, "step": 85370 }, { - "epoch": 0.92, - "learning_rate": 0.00016154893948238955, - "loss": 0.0133, + "epoch": 0.43, + "learning_rate": 0.00023538703704637984, + "loss": 0.0135, "step": 85380 }, { - "epoch": 0.92, - "learning_rate": 0.00016153272361678665, - "loss": 0.0156, + "epoch": 0.43, + "learning_rate": 0.00023537946935336582, + "loss": 0.0181, "step": 85390 }, { - "epoch": 0.92, - "learning_rate": 0.00016151650775118377, - "loss": 0.0149, + "epoch": 0.43, + "learning_rate": 0.00023537190166035183, + "loss": 0.0173, "step": 85400 }, { - "epoch": 0.92, - "learning_rate": 0.00016150029188558083, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.0002353643339673378, + "loss": 0.0154, "step": 85410 }, { - "epoch": 0.92, - "learning_rate": 0.00016148407601997792, - "loss": 0.0106, + "epoch": 0.43, + "learning_rate": 0.0002353567662743238, + "loss": 0.0192, "step": 85420 }, { - "epoch": 0.92, - "learning_rate": 0.00016146786015437502, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.0002353491985813098, + "loss": 0.0172, "step": 85430 }, { - "epoch": 0.92, - "learning_rate": 0.00016145164428877214, - "loss": 0.0105, + "epoch": 0.43, + "learning_rate": 0.00023534163088829578, + "loss": 0.0134, "step": 85440 }, { - "epoch": 0.92, - "learning_rate": 0.0001614354284231692, - "loss": 0.0092, + "epoch": 0.43, + "learning_rate": 0.00023533406319528176, + "loss": 0.0162, "step": 85450 }, { - "epoch": 0.92, - "learning_rate": 0.0001614192125575663, - "loss": 0.0137, + "epoch": 0.43, + "learning_rate": 0.00023532649550226777, + "loss": 0.0139, "step": 85460 }, { - "epoch": 0.92, - "learning_rate": 0.00016140299669196342, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023531892780925375, + "loss": 0.0175, "step": 85470 }, { - "epoch": 0.92, - "learning_rate": 0.0001613867808263605, - "loss": 0.0103, + "epoch": 0.43, + "learning_rate": 0.00023531136011623974, + "loss": 0.0146, "step": 85480 }, { - "epoch": 0.92, - "learning_rate": 0.00016137056496075757, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.00023530379242322574, + "loss": 0.0171, "step": 85490 }, { - "epoch": 0.92, - "learning_rate": 0.00016135434909515467, - "loss": 0.0127, + "epoch": 0.43, + "learning_rate": 0.00023529622473021173, + "loss": 0.0172, "step": 85500 }, { - "epoch": 0.92, - "learning_rate": 0.0001613381332295518, - "loss": 0.0167, + "epoch": 0.43, + "learning_rate": 0.0002352886570371977, + "loss": 0.0191, "step": 85510 }, { - "epoch": 0.92, - "learning_rate": 0.00016132191736394888, - "loss": 0.0144, + "epoch": 0.43, + "learning_rate": 0.00023528108934418372, + "loss": 0.0164, "step": 85520 }, { - "epoch": 0.92, - "learning_rate": 0.00016130570149834594, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.0002352735216511697, + "loss": 0.0168, "step": 85530 }, { - "epoch": 0.92, - "learning_rate": 0.00016128948563274306, - "loss": 0.0135, + "epoch": 0.43, + "learning_rate": 0.00023526595395815568, + "loss": 0.0165, "step": 85540 }, { - "epoch": 0.92, - "learning_rate": 0.00016127326976714016, - "loss": 0.0138, + "epoch": 0.43, + "learning_rate": 0.00023525838626514166, + "loss": 0.0168, "step": 85550 }, { - "epoch": 0.92, - "learning_rate": 0.00016125705390153725, - "loss": 0.0145, + "epoch": 0.43, + "learning_rate": 0.00023525081857212767, + "loss": 0.0123, "step": 85560 }, { - "epoch": 0.93, - "learning_rate": 0.00016124083803593432, - "loss": 0.0104, + "epoch": 0.43, + "learning_rate": 0.00023524325087911365, + "loss": 0.0198, "step": 85570 }, { - "epoch": 0.93, - "learning_rate": 0.00016122462217033144, - "loss": 0.0135, + "epoch": 0.43, + "learning_rate": 0.00023523568318609963, + "loss": 0.0272, "step": 85580 }, { - "epoch": 0.93, - "learning_rate": 0.00016120840630472853, - "loss": 0.0179, + "epoch": 0.43, + "learning_rate": 0.00023522811549308564, + "loss": 0.0184, "step": 85590 }, { - "epoch": 0.93, - "learning_rate": 0.00016119219043912562, - "loss": 0.0124, + "epoch": 0.43, + "learning_rate": 0.00023522054780007162, + "loss": 0.0179, "step": 85600 }, { - "epoch": 0.93, - "learning_rate": 0.00016117597457352274, - "loss": 0.0147, + "epoch": 0.43, + "learning_rate": 0.0002352129801070576, + "loss": 0.0159, "step": 85610 }, { - "epoch": 0.93, - "learning_rate": 0.0001611597587079198, - "loss": 0.0158, + "epoch": 0.43, + "learning_rate": 0.0002352054124140436, + "loss": 0.0219, "step": 85620 }, { - "epoch": 0.93, - "learning_rate": 0.0001611435428423169, - "loss": 0.0141, + "epoch": 0.43, + "learning_rate": 0.0002351978447210296, + "loss": 0.0174, "step": 85630 }, { - "epoch": 0.93, - "learning_rate": 0.00016112732697671402, - "loss": 0.014, + "epoch": 0.43, + "learning_rate": 0.00023519027702801557, + "loss": 0.0162, "step": 85640 }, { - "epoch": 0.93, - "learning_rate": 0.0001611111111111111, - "loss": 0.0131, + "epoch": 0.43, + "learning_rate": 0.00023518270933500158, + "loss": 0.0184, "step": 85650 }, { - "epoch": 0.93, - "learning_rate": 0.00016109489524550818, - "loss": 0.0139, + "epoch": 0.43, + "learning_rate": 0.00023517514164198756, + "loss": 0.0149, "step": 85660 }, { - "epoch": 0.93, - "learning_rate": 0.0001610786793799053, - "loss": 0.015, + "epoch": 0.43, + "learning_rate": 0.00023516757394897355, + "loss": 0.0168, "step": 85670 }, { - "epoch": 0.93, - "learning_rate": 0.0001610624635143024, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023516000625595955, + "loss": 0.0165, "step": 85680 }, { - "epoch": 0.93, - "learning_rate": 0.00016104624764869948, - "loss": 0.0137, + "epoch": 0.43, + "learning_rate": 0.00023515243856294554, + "loss": 0.0194, "step": 85690 }, { - "epoch": 0.93, - "learning_rate": 0.00016103003178309655, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023514487086993152, + "loss": 0.0115, "step": 85700 }, { - "epoch": 0.93, - "learning_rate": 0.00016101381591749367, - "loss": 0.0177, + "epoch": 0.43, + "learning_rate": 0.00023513730317691753, + "loss": 0.0178, "step": 85710 }, { - "epoch": 0.93, - "learning_rate": 0.00016099760005189076, - "loss": 0.0153, + "epoch": 0.43, + "learning_rate": 0.0002351297354839035, + "loss": 0.0152, "step": 85720 }, { - "epoch": 0.93, - "learning_rate": 0.00016098138418628785, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.0002351221677908895, + "loss": 0.016, "step": 85730 }, { - "epoch": 0.93, - "learning_rate": 0.00016096516832068495, - "loss": 0.0136, + "epoch": 0.43, + "learning_rate": 0.00023511460009787547, + "loss": 0.0182, "step": 85740 }, { - "epoch": 0.93, - "learning_rate": 0.00016094895245508204, - "loss": 0.014, + "epoch": 0.43, + "learning_rate": 0.00023510703240486148, + "loss": 0.0233, "step": 85750 }, { - "epoch": 0.93, - "learning_rate": 0.00016093273658947913, - "loss": 0.0145, + "epoch": 0.43, + "learning_rate": 0.00023509946471184746, + "loss": 0.0231, "step": 85760 }, { - "epoch": 0.93, - "learning_rate": 0.00016091652072387625, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.00023509189701883344, + "loss": 0.0201, "step": 85770 }, { - "epoch": 0.93, - "learning_rate": 0.00016090030485827332, - "loss": 0.0133, + "epoch": 0.43, + "learning_rate": 0.00023508432932581945, + "loss": 0.0201, "step": 85780 }, { - "epoch": 0.93, - "learning_rate": 0.0001608840889926704, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.00023507676163280543, + "loss": 0.023, "step": 85790 }, { - "epoch": 0.93, - "learning_rate": 0.0001608678731270675, - "loss": 0.0105, + "epoch": 0.43, + "learning_rate": 0.0002350691939397914, + "loss": 0.0151, "step": 85800 }, { - "epoch": 0.93, - "learning_rate": 0.00016085165726146462, - "loss": 0.0152, + "epoch": 0.43, + "learning_rate": 0.00023506162624677742, + "loss": 0.023, "step": 85810 }, { - "epoch": 0.93, - "learning_rate": 0.0001608354413958617, - "loss": 0.0132, + "epoch": 0.43, + "learning_rate": 0.0002350540585537634, + "loss": 0.0161, "step": 85820 }, { - "epoch": 0.93, - "learning_rate": 0.00016081922553025878, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.00023504649086074938, + "loss": 0.0202, "step": 85830 }, { - "epoch": 0.93, - "learning_rate": 0.0001608030096646559, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.0002350389231677354, + "loss": 0.0151, "step": 85840 }, { - "epoch": 0.93, - "learning_rate": 0.000160786793799053, - "loss": 0.0138, + "epoch": 0.43, + "learning_rate": 0.00023503135547472137, + "loss": 0.0163, "step": 85850 }, { - "epoch": 0.93, - "learning_rate": 0.00016077057793345006, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.00023502378778170736, + "loss": 0.0139, "step": 85860 }, { - "epoch": 0.93, - "learning_rate": 0.00016075436206784715, - "loss": 0.0111, + "epoch": 0.43, + "learning_rate": 0.00023501622008869336, + "loss": 0.0157, "step": 85870 }, { - "epoch": 0.93, - "learning_rate": 0.00016073814620224427, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.00023500865239567935, + "loss": 0.0173, "step": 85880 }, { - "epoch": 0.93, - "learning_rate": 0.00016072193033664137, - "loss": 0.0108, + "epoch": 0.43, + "learning_rate": 0.00023500108470266533, + "loss": 0.0174, "step": 85890 }, { - "epoch": 0.93, - "learning_rate": 0.00016070571447103843, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.0002349935170096513, + "loss": 0.0166, "step": 85900 }, { - "epoch": 0.93, - "learning_rate": 0.00016068949860543555, - "loss": 0.0125, + "epoch": 0.43, + "learning_rate": 0.00023498594931663732, + "loss": 0.0237, "step": 85910 }, { - "epoch": 0.93, - "learning_rate": 0.00016067328273983264, - "loss": 0.0159, + "epoch": 0.43, + "learning_rate": 0.0002349783816236233, + "loss": 0.0184, "step": 85920 }, { - "epoch": 0.93, - "learning_rate": 0.00016065706687422974, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.00023497081393060928, + "loss": 0.0186, "step": 85930 }, { - "epoch": 0.93, - "learning_rate": 0.0001606408510086268, - "loss": 0.0158, + "epoch": 0.43, + "learning_rate": 0.0002349632462375953, + "loss": 0.0175, "step": 85940 }, { - "epoch": 0.93, - "learning_rate": 0.00016062463514302392, - "loss": 0.0139, + "epoch": 0.43, + "learning_rate": 0.00023495567854458127, + "loss": 0.0183, "step": 85950 }, { - "epoch": 0.93, - "learning_rate": 0.00016060841927742101, - "loss": 0.0168, + "epoch": 0.43, + "learning_rate": 0.00023494811085156725, + "loss": 0.0169, "step": 85960 }, { - "epoch": 0.93, - "learning_rate": 0.00016059220341181813, - "loss": 0.016, + "epoch": 0.43, + "learning_rate": 0.00023494054315855326, + "loss": 0.0143, "step": 85970 }, { - "epoch": 0.93, - "learning_rate": 0.0001605759875462152, - "loss": 0.014, + "epoch": 0.43, + "learning_rate": 0.00023493297546553924, + "loss": 0.0171, "step": 85980 }, { - "epoch": 0.93, - "learning_rate": 0.0001605597716806123, - "loss": 0.0142, + "epoch": 0.43, + "learning_rate": 0.00023492540777252522, + "loss": 0.0171, "step": 85990 }, { - "epoch": 0.93, - "learning_rate": 0.00016054355581500939, - "loss": 0.0145, + "epoch": 0.43, + "learning_rate": 0.00023491784007951123, + "loss": 0.0186, "step": 86000 }, { - "epoch": 0.93, - "eval_cer": 0.9215278031120306, - "eval_loss": 0.009139015339314938, - "eval_runtime": 121.317, - "eval_samples_per_second": 16.486, - "eval_steps_per_second": 4.121, + "epoch": 0.43, + "eval_cer": 0.9144702559031622, + "eval_loss": 0.012443006969988346, + "eval_runtime": 116.6618, + "eval_samples_per_second": 17.144, + "eval_steps_per_second": 4.286, "step": 86000 }, { - "epoch": 0.93, - "learning_rate": 0.0001605273399494065, - "loss": 0.0127, + "epoch": 0.43, + "learning_rate": 0.0002349102723864972, + "loss": 0.016, "step": 86010 }, { - "epoch": 0.93, - "learning_rate": 0.00016051112408380357, - "loss": 0.0104, + "epoch": 0.43, + "learning_rate": 0.0002349027046934832, + "loss": 0.0165, "step": 86020 }, { - "epoch": 0.93, - "learning_rate": 0.00016049490821820066, - "loss": 0.0139, + "epoch": 0.43, + "learning_rate": 0.0002348951370004692, + "loss": 0.0162, "step": 86030 }, { - "epoch": 0.93, - "learning_rate": 0.00016047869235259778, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.00023488756930745518, + "loss": 0.0176, "step": 86040 }, { - "epoch": 0.93, - "learning_rate": 0.00016046247648699488, - "loss": 0.0143, + "epoch": 0.43, + "learning_rate": 0.00023488000161444117, + "loss": 0.017, "step": 86050 }, { - "epoch": 0.93, - "learning_rate": 0.00016044626062139194, - "loss": 0.0142, + "epoch": 0.43, + "learning_rate": 0.00023487243392142715, + "loss": 0.0163, "step": 86060 }, { - "epoch": 0.93, - "learning_rate": 0.00016043004475578903, - "loss": 0.0127, + "epoch": 0.43, + "learning_rate": 0.00023486486622841316, + "loss": 0.0178, "step": 86070 }, { - "epoch": 0.93, - "learning_rate": 0.00016041382889018615, - "loss": 0.0143, + "epoch": 0.43, + "learning_rate": 0.00023485729853539914, + "loss": 0.0188, "step": 86080 }, { - "epoch": 0.93, - "learning_rate": 0.00016039761302458325, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023484973084238512, + "loss": 0.0184, "step": 86090 }, { - "epoch": 0.93, - "learning_rate": 0.0001603813971589803, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.0002348421631493711, + "loss": 0.017, "step": 86100 }, { - "epoch": 0.93, - "learning_rate": 0.00016036518129337743, - "loss": 0.014, + "epoch": 0.43, + "learning_rate": 0.00023483459545635708, + "loss": 0.0166, "step": 86110 }, { - "epoch": 0.93, - "learning_rate": 0.00016034896542777453, - "loss": 0.0136, + "epoch": 0.43, + "learning_rate": 0.00023482702776334306, + "loss": 0.0151, "step": 86120 }, { - "epoch": 0.93, - "learning_rate": 0.00016033274956217162, - "loss": 0.0111, + "epoch": 0.43, + "learning_rate": 0.00023481946007032904, + "loss": 0.0159, "step": 86130 }, { - "epoch": 0.93, - "learning_rate": 0.00016031653369656868, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023481189237731505, + "loss": 0.0159, "step": 86140 }, { - "epoch": 0.93, - "learning_rate": 0.0001603003178309658, - "loss": 0.0103, + "epoch": 0.43, + "learning_rate": 0.00023480432468430103, + "loss": 0.021, "step": 86150 }, { - "epoch": 0.93, - "learning_rate": 0.0001602841019653629, - "loss": 0.0142, + "epoch": 0.43, + "learning_rate": 0.00023479675699128702, + "loss": 0.0153, "step": 86160 }, { - "epoch": 0.93, - "learning_rate": 0.00016026788609976, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023478918929827302, + "loss": 0.0155, "step": 86170 }, { - "epoch": 0.93, - "learning_rate": 0.00016025167023415708, - "loss": 0.011, + "epoch": 0.43, + "learning_rate": 0.000234781621605259, + "loss": 0.016, "step": 86180 }, { - "epoch": 0.93, - "learning_rate": 0.00016023545436855417, - "loss": 0.0145, + "epoch": 0.43, + "learning_rate": 0.000234774053912245, + "loss": 0.0188, "step": 86190 }, { - "epoch": 0.93, - "learning_rate": 0.00016021923850295127, - "loss": 0.0161, + "epoch": 0.43, + "learning_rate": 0.000234766486219231, + "loss": 0.0251, "step": 86200 }, { - "epoch": 0.93, - "learning_rate": 0.0001602030226373484, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023475891852621698, + "loss": 0.0162, "step": 86210 }, { - "epoch": 0.93, - "learning_rate": 0.00016018680677174545, - "loss": 0.0096, + "epoch": 0.43, + "learning_rate": 0.00023475135083320296, + "loss": 0.0194, "step": 86220 }, { - "epoch": 0.93, - "learning_rate": 0.00016017059090614255, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.00023474378314018897, + "loss": 0.0236, "step": 86230 }, { - "epoch": 0.93, - "learning_rate": 0.00016015437504053964, - "loss": 0.0136, + "epoch": 0.44, + "learning_rate": 0.00023473621544717495, + "loss": 0.0163, "step": 86240 }, { - "epoch": 0.93, - "learning_rate": 0.00016013815917493676, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023472864775416093, + "loss": 0.0151, "step": 86250 }, { - "epoch": 0.93, - "learning_rate": 0.00016012194330933382, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023472108006114694, + "loss": 0.0137, "step": 86260 }, { - "epoch": 0.93, - "learning_rate": 0.00016010572744373092, - "loss": 0.0133, + "epoch": 0.44, + "learning_rate": 0.00023471351236813292, + "loss": 0.0157, "step": 86270 }, { - "epoch": 0.93, - "learning_rate": 0.00016008951157812804, - "loss": 0.0126, + "epoch": 0.44, + "learning_rate": 0.0002347059446751189, + "loss": 0.0172, "step": 86280 }, { - "epoch": 0.93, - "learning_rate": 0.00016007329571252513, - "loss": 0.0109, + "epoch": 0.44, + "learning_rate": 0.00023469837698210488, + "loss": 0.0181, "step": 86290 }, { - "epoch": 0.93, - "learning_rate": 0.0001600570798469222, - "loss": 0.0139, + "epoch": 0.44, + "learning_rate": 0.0002346908092890909, + "loss": 0.0163, "step": 86300 }, { - "epoch": 0.93, - "learning_rate": 0.0001600408639813193, - "loss": 0.0106, + "epoch": 0.44, + "learning_rate": 0.00023468324159607687, + "loss": 0.0136, "step": 86310 }, { - "epoch": 0.93, - "learning_rate": 0.0001600246481157164, - "loss": 0.0172, + "epoch": 0.44, + "learning_rate": 0.00023467567390306285, + "loss": 0.016, "step": 86320 }, { - "epoch": 0.93, - "learning_rate": 0.0001600084322501135, - "loss": 0.013, + "epoch": 0.44, + "learning_rate": 0.00023466810621004886, + "loss": 0.0142, "step": 86330 }, { - "epoch": 0.93, - "learning_rate": 0.00015999221638451062, - "loss": 0.0139, + "epoch": 0.44, + "learning_rate": 0.00023466053851703484, + "loss": 0.0193, "step": 86340 }, { - "epoch": 0.93, - "learning_rate": 0.00015997600051890769, - "loss": 0.0144, + "epoch": 0.44, + "learning_rate": 0.00023465297082402083, + "loss": 0.0159, "step": 86350 }, { - "epoch": 0.93, - "learning_rate": 0.00015995978465330478, - "loss": 0.0162, + "epoch": 0.44, + "learning_rate": 0.00023464540313100683, + "loss": 0.0158, "step": 86360 }, { - "epoch": 0.93, - "learning_rate": 0.00015994356878770187, - "loss": 0.0126, + "epoch": 0.44, + "learning_rate": 0.00023463783543799282, + "loss": 0.0161, "step": 86370 }, { - "epoch": 0.93, - "learning_rate": 0.000159927352922099, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.0002346302677449788, + "loss": 0.014, "step": 86380 }, { - "epoch": 0.93, - "learning_rate": 0.00015991113705649606, - "loss": 0.0162, + "epoch": 0.44, + "learning_rate": 0.0002346227000519648, + "loss": 0.019, "step": 86390 }, { - "epoch": 0.93, - "learning_rate": 0.00015989492119089315, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.0002346151323589508, + "loss": 0.019, "step": 86400 }, { - "epoch": 0.93, - "learning_rate": 0.00015987870532529027, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.00023460756466593677, + "loss": 0.0165, "step": 86410 }, { - "epoch": 0.93, - "learning_rate": 0.00015986248945968736, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.00023459999697292278, + "loss": 0.0169, "step": 86420 }, { - "epoch": 0.93, - "learning_rate": 0.00015984627359408443, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.00023459242927990876, + "loss": 0.0149, "step": 86430 }, { - "epoch": 0.93, - "learning_rate": 0.00015983005772848152, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023458486158689474, + "loss": 0.0163, "step": 86440 }, { - "epoch": 0.93, - "learning_rate": 0.00015981384186287864, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023457729389388072, + "loss": 0.0152, "step": 86450 }, { - "epoch": 0.93, - "learning_rate": 0.00015979762599727573, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.00023456972620086673, + "loss": 0.0161, "step": 86460 }, { - "epoch": 0.93, - "learning_rate": 0.0001597814101316728, - "loss": 0.011, + "epoch": 0.44, + "learning_rate": 0.0002345621585078527, + "loss": 0.0149, "step": 86470 }, { - "epoch": 0.93, - "learning_rate": 0.00015976519426606992, - "loss": 0.0136, + "epoch": 0.44, + "learning_rate": 0.0002345545908148387, + "loss": 0.0228, "step": 86480 }, { - "epoch": 0.93, - "learning_rate": 0.000159748978400467, - "loss": 0.0139, + "epoch": 0.44, + "learning_rate": 0.0002345470231218247, + "loss": 0.0214, "step": 86490 }, { - "epoch": 0.94, - "learning_rate": 0.0001597327625348641, - "loss": 0.016, + "epoch": 0.44, + "learning_rate": 0.00023453945542881068, + "loss": 0.0142, "step": 86500 }, { - "epoch": 0.94, - "learning_rate": 0.00015971654666926117, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.00023453188773579667, + "loss": 0.0158, "step": 86510 }, { - "epoch": 0.94, - "learning_rate": 0.0001597003308036583, - "loss": 0.0141, + "epoch": 0.44, + "learning_rate": 0.00023452432004278267, + "loss": 0.0293, "step": 86520 }, { - "epoch": 0.94, - "learning_rate": 0.00015968411493805538, + "epoch": 0.44, + "learning_rate": 0.00023451675234976865, "loss": 0.0173, "step": 86530 }, { - "epoch": 0.94, - "learning_rate": 0.00015966789907245247, - "loss": 0.0145, + "epoch": 0.44, + "learning_rate": 0.00023450918465675464, + "loss": 0.0191, "step": 86540 }, { - "epoch": 0.94, - "learning_rate": 0.00015965168320684957, - "loss": 0.0106, + "epoch": 0.44, + "learning_rate": 0.00023450161696374064, + "loss": 0.015, "step": 86550 }, { - "epoch": 0.94, - "learning_rate": 0.00015963546734124666, - "loss": 0.0153, + "epoch": 0.44, + "learning_rate": 0.00023449404927072663, + "loss": 0.02, "step": 86560 }, { - "epoch": 0.94, - "learning_rate": 0.00015961925147564375, - "loss": 0.0134, + "epoch": 0.44, + "learning_rate": 0.0002344864815777126, + "loss": 0.0195, "step": 86570 }, { - "epoch": 0.94, - "learning_rate": 0.00015960303561004087, - "loss": 0.0147, + "epoch": 0.44, + "learning_rate": 0.00023447891388469862, + "loss": 0.0164, "step": 86580 }, { - "epoch": 0.94, - "learning_rate": 0.00015958681974443794, - "loss": 0.0136, + "epoch": 0.44, + "learning_rate": 0.0002344713461916846, + "loss": 0.0173, "step": 86590 }, { - "epoch": 0.94, - "learning_rate": 0.00015957060387883503, - "loss": 0.0114, + "epoch": 0.44, + "learning_rate": 0.00023446377849867058, + "loss": 0.0151, "step": 86600 }, { - "epoch": 0.94, - "learning_rate": 0.00015955438801323212, - "loss": 0.0103, + "epoch": 0.44, + "learning_rate": 0.0002344562108056566, + "loss": 0.0161, "step": 86610 }, { - "epoch": 0.94, - "learning_rate": 0.00015953817214762924, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023444864311264257, + "loss": 0.0179, "step": 86620 }, { - "epoch": 0.94, - "learning_rate": 0.0001595219562820263, - "loss": 0.0105, + "epoch": 0.44, + "learning_rate": 0.00023444107541962855, + "loss": 0.0188, "step": 86630 }, { - "epoch": 0.94, - "learning_rate": 0.0001595057404164234, - "loss": 0.0139, + "epoch": 0.44, + "learning_rate": 0.00023443350772661453, + "loss": 0.0166, "step": 86640 }, { - "epoch": 0.94, - "learning_rate": 0.00015948952455082052, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.00023442594003360054, + "loss": 0.0145, "step": 86650 }, { - "epoch": 0.94, - "learning_rate": 0.00015947330868521761, - "loss": 0.0107, + "epoch": 0.44, + "learning_rate": 0.00023441837234058652, + "loss": 0.0177, "step": 86660 }, { - "epoch": 0.94, - "learning_rate": 0.00015945709281961468, - "loss": 0.0145, + "epoch": 0.44, + "learning_rate": 0.0002344108046475725, + "loss": 0.0158, "step": 86670 }, { - "epoch": 0.94, - "learning_rate": 0.0001594408769540118, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.0002344032369545585, + "loss": 0.0177, "step": 86680 }, { - "epoch": 0.94, - "learning_rate": 0.0001594246610884089, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.0002343956692615445, + "loss": 0.0147, "step": 86690 }, { - "epoch": 0.94, - "learning_rate": 0.00015940844522280599, - "loss": 0.014, + "epoch": 0.44, + "learning_rate": 0.00023438810156853048, + "loss": 0.0143, "step": 86700 }, { - "epoch": 0.94, - "learning_rate": 0.00015939222935720305, - "loss": 0.0132, + "epoch": 0.44, + "learning_rate": 0.00023438053387551648, + "loss": 0.0138, "step": 86710 }, { - "epoch": 0.94, - "learning_rate": 0.00015937601349160017, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023437296618250247, + "loss": 0.0211, "step": 86720 }, { - "epoch": 0.94, - "learning_rate": 0.00015935979762599726, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.00023436539848948845, + "loss": 0.0192, "step": 86730 }, { - "epoch": 0.94, - "learning_rate": 0.00015934358176039436, - "loss": 0.0096, + "epoch": 0.44, + "learning_rate": 0.00023435783079647446, + "loss": 0.0151, "step": 86740 }, { - "epoch": 0.94, - "learning_rate": 0.00015932736589479145, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.00023435026310346044, + "loss": 0.0171, "step": 86750 }, { - "epoch": 0.94, - "learning_rate": 0.00015931115002918854, - "loss": 0.013, + "epoch": 0.44, + "learning_rate": 0.00023434269541044642, + "loss": 0.0155, "step": 86760 }, { - "epoch": 0.94, - "learning_rate": 0.00015929493416358563, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023433512771743243, + "loss": 0.0193, "step": 86770 }, { - "epoch": 0.94, - "learning_rate": 0.00015927871829798275, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.0002343275600244184, + "loss": 0.0165, "step": 86780 }, { - "epoch": 0.94, - "learning_rate": 0.00015926250243237982, - "loss": 0.0106, + "epoch": 0.44, + "learning_rate": 0.0002343199923314044, + "loss": 0.0176, "step": 86790 }, { - "epoch": 0.94, - "learning_rate": 0.0001592462865667769, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.00023431242463839037, + "loss": 0.0166, "step": 86800 }, { - "epoch": 0.94, - "learning_rate": 0.000159230070701174, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.00023430485694537638, + "loss": 0.0178, "step": 86810 }, { - "epoch": 0.94, - "learning_rate": 0.00015921385483557113, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.00023429728925236236, + "loss": 0.0171, "step": 86820 }, { - "epoch": 0.94, - "learning_rate": 0.0001591976389699682, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023428972155934834, + "loss": 0.0147, "step": 86830 }, { - "epoch": 0.94, - "learning_rate": 0.00015918142310436528, - "loss": 0.0141, + "epoch": 0.44, + "learning_rate": 0.00023428215386633435, + "loss": 0.0191, "step": 86840 }, { - "epoch": 0.94, - "learning_rate": 0.0001591652072387624, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023427458617332033, + "loss": 0.0196, "step": 86850 }, { - "epoch": 0.94, - "learning_rate": 0.0001591489913731595, - "loss": 0.0094, + "epoch": 0.44, + "learning_rate": 0.00023426701848030631, + "loss": 0.0203, "step": 86860 }, { - "epoch": 0.94, - "learning_rate": 0.00015913277550755656, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023425945078729232, + "loss": 0.016, "step": 86870 }, { - "epoch": 0.94, - "learning_rate": 0.00015911655964195366, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.0002342518830942783, + "loss": 0.015, "step": 86880 }, { - "epoch": 0.94, - "learning_rate": 0.00015910034377635077, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.00023424431540126429, + "loss": 0.0169, "step": 86890 }, { - "epoch": 0.94, - "learning_rate": 0.00015908412791074787, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.0002342367477082503, + "loss": 0.0175, "step": 86900 }, { - "epoch": 0.94, - "learning_rate": 0.00015906791204514493, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.00023422918001523628, + "loss": 0.0187, "step": 86910 }, { - "epoch": 0.94, - "learning_rate": 0.00015905169617954205, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.00023422161232222226, + "loss": 0.0185, "step": 86920 }, { - "epoch": 0.94, - "learning_rate": 0.00015903548031393915, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.00023421404462920827, + "loss": 0.0194, "step": 86930 }, { - "epoch": 0.94, - "learning_rate": 0.00015901926444833624, - "loss": 0.0138, + "epoch": 0.44, + "learning_rate": 0.00023420647693619425, + "loss": 0.0167, "step": 86940 }, { - "epoch": 0.94, - "learning_rate": 0.0001590030485827333, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.00023419890924318023, + "loss": 0.0196, "step": 86950 }, { - "epoch": 0.94, - "learning_rate": 0.00015898683271713042, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.0002341913415501662, + "loss": 0.0191, "step": 86960 }, { - "epoch": 0.94, - "learning_rate": 0.00015897061685152752, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.00023418377385715222, + "loss": 0.0243, "step": 86970 }, { - "epoch": 0.94, - "learning_rate": 0.00015895440098592464, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.0002341762061641382, + "loss": 0.0139, "step": 86980 }, { - "epoch": 0.94, - "learning_rate": 0.0001589381851203217, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.00023416863847112418, + "loss": 0.0147, "step": 86990 }, { - "epoch": 0.94, - "learning_rate": 0.0001589219692547188, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.0002341610707781102, + "loss": 0.0172, "step": 87000 }, { - "epoch": 0.94, - "eval_cer": 0.921526065906118, - "eval_loss": 0.008875695057213306, - "eval_runtime": 121.5017, - "eval_samples_per_second": 16.461, - "eval_steps_per_second": 4.115, + "epoch": 0.44, + "eval_cer": 0.9144848118450433, + "eval_loss": 0.012073654681444168, + "eval_runtime": 116.8061, + "eval_samples_per_second": 17.122, + "eval_steps_per_second": 4.281, "step": 87000 }, { - "epoch": 0.94, - "learning_rate": 0.0001589057533891159, - "loss": 0.0142, + "epoch": 0.44, + "learning_rate": 0.00023415350308509617, + "loss": 0.0192, "step": 87010 }, { - "epoch": 0.94, - "learning_rate": 0.000158889537523513, - "loss": 0.0114, + "epoch": 0.44, + "learning_rate": 0.00023414593539208215, + "loss": 0.022, "step": 87020 }, { - "epoch": 0.94, - "learning_rate": 0.00015887332165791007, - "loss": 0.011, + "epoch": 0.44, + "learning_rate": 0.00023413836769906816, + "loss": 0.0149, "step": 87030 }, { - "epoch": 0.94, - "learning_rate": 0.00015885710579230717, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.00023413080000605414, + "loss": 0.0178, "step": 87040 }, { - "epoch": 0.94, - "learning_rate": 0.00015884088992670429, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.00023412323231304012, + "loss": 0.0156, "step": 87050 }, { - "epoch": 0.94, - "learning_rate": 0.00015882467406110138, - "loss": 0.0141, + "epoch": 0.44, + "learning_rate": 0.00023411566462002613, + "loss": 0.0165, "step": 87060 }, { - "epoch": 0.94, - "learning_rate": 0.00015880845819549847, - "loss": 0.0163, + "epoch": 0.44, + "learning_rate": 0.00023410809692701211, + "loss": 0.0154, "step": 87070 }, { - "epoch": 0.94, - "learning_rate": 0.00015879224232989554, - "loss": 0.0156, + "epoch": 0.44, + "learning_rate": 0.0002341005292339981, + "loss": 0.0174, "step": 87080 }, { - "epoch": 0.94, - "learning_rate": 0.00015877602646429266, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.0002340929615409841, + "loss": 0.0164, "step": 87090 }, { - "epoch": 0.94, - "learning_rate": 0.00015875981059868975, - "loss": 0.0145, + "epoch": 0.44, + "learning_rate": 0.00023408539384797009, + "loss": 0.024, "step": 87100 }, { - "epoch": 0.94, - "learning_rate": 0.00015874359473308684, - "loss": 0.0134, + "epoch": 0.44, + "learning_rate": 0.00023407782615495607, + "loss": 0.0189, "step": 87110 }, { - "epoch": 0.94, - "learning_rate": 0.00015872737886748394, - "loss": 0.0134, + "epoch": 0.44, + "learning_rate": 0.00023407025846194208, + "loss": 0.0173, "step": 87120 }, { - "epoch": 0.94, - "learning_rate": 0.00015871116300188103, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.00023406269076892806, + "loss": 0.012, "step": 87130 }, { - "epoch": 0.94, - "learning_rate": 0.00015869494713627812, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023405512307591404, + "loss": 0.0167, "step": 87140 }, { - "epoch": 0.94, - "learning_rate": 0.00015867873127067524, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.00023404755538290002, + "loss": 0.0172, "step": 87150 }, { - "epoch": 0.94, - "learning_rate": 0.0001586625154050723, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.00023403998768988603, + "loss": 0.0223, "step": 87160 }, { - "epoch": 0.94, - "learning_rate": 0.0001586462995394694, - "loss": 0.0103, + "epoch": 0.44, + "learning_rate": 0.000234032419996872, + "loss": 0.0191, "step": 87170 }, { - "epoch": 0.94, - "learning_rate": 0.0001586300836738665, - "loss": 0.0133, + "epoch": 0.44, + "learning_rate": 0.000234024852303858, + "loss": 0.0192, "step": 87180 }, { - "epoch": 0.94, - "learning_rate": 0.0001586138678082636, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.000234017284610844, + "loss": 0.019, "step": 87190 }, { - "epoch": 0.94, - "learning_rate": 0.00015859765194266068, - "loss": 0.0156, + "epoch": 0.44, + "learning_rate": 0.00023400971691782998, + "loss": 0.0179, "step": 87200 }, { - "epoch": 0.94, - "learning_rate": 0.00015858143607705777, - "loss": 0.0147, + "epoch": 0.44, + "learning_rate": 0.00023400214922481596, + "loss": 0.0153, "step": 87210 }, { - "epoch": 0.94, - "learning_rate": 0.0001585652202114549, - "loss": 0.0151, + "epoch": 0.44, + "learning_rate": 0.00023399458153180197, + "loss": 0.02, "step": 87220 }, { - "epoch": 0.94, - "learning_rate": 0.00015854900434585198, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023398701383878795, + "loss": 0.0151, "step": 87230 }, { - "epoch": 0.94, - "learning_rate": 0.00015853278848024905, - "loss": 0.0134, + "epoch": 0.44, + "learning_rate": 0.00023397944614577393, + "loss": 0.0207, "step": 87240 }, { - "epoch": 0.94, - "learning_rate": 0.00015851657261464614, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.00023397187845275994, + "loss": 0.0176, "step": 87250 }, { - "epoch": 0.94, - "learning_rate": 0.00015850035674904326, - "loss": 0.0143, + "epoch": 0.44, + "learning_rate": 0.00023396431075974592, + "loss": 0.0173, "step": 87260 }, { - "epoch": 0.94, - "learning_rate": 0.00015848414088344035, - "loss": 0.0131, + "epoch": 0.44, + "learning_rate": 0.0002339567430667319, + "loss": 0.021, "step": 87270 }, { - "epoch": 0.94, - "learning_rate": 0.00015846792501783742, - "loss": 0.0144, + "epoch": 0.44, + "learning_rate": 0.00023394917537371791, + "loss": 0.0132, "step": 87280 }, { - "epoch": 0.94, - "learning_rate": 0.00015845170915223454, - "loss": 0.013, + "epoch": 0.44, + "learning_rate": 0.0002339416076807039, + "loss": 0.0142, "step": 87290 }, { - "epoch": 0.94, - "learning_rate": 0.00015843549328663163, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023393403998768988, + "loss": 0.015, "step": 87300 }, { - "epoch": 0.94, - "learning_rate": 0.00015841927742102872, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.00023392647229467586, + "loss": 0.0171, "step": 87310 }, { - "epoch": 0.94, - "learning_rate": 0.0001584030615554258, - "loss": 0.0154, + "epoch": 0.44, + "learning_rate": 0.00023391890460166187, + "loss": 0.0159, "step": 87320 }, { - "epoch": 0.94, - "learning_rate": 0.0001583868456898229, - "loss": 0.0137, + "epoch": 0.44, + "learning_rate": 0.00023391133690864785, + "loss": 0.0182, "step": 87330 }, { - "epoch": 0.94, - "learning_rate": 0.00015837062982422, - "loss": 0.0112, + "epoch": 0.44, + "learning_rate": 0.00023390376921563383, + "loss": 0.0198, "step": 87340 }, { - "epoch": 0.94, - "learning_rate": 0.00015835441395861712, - "loss": 0.0167, + "epoch": 0.44, + "learning_rate": 0.00023389620152261984, + "loss": 0.0191, "step": 87350 }, { - "epoch": 0.94, - "learning_rate": 0.0001583381980930142, - "loss": 0.0163, + "epoch": 0.44, + "learning_rate": 0.0002338886338296058, + "loss": 0.0222, "step": 87360 }, { - "epoch": 0.94, - "learning_rate": 0.00015832198222741128, - "loss": 0.0134, + "epoch": 0.44, + "learning_rate": 0.00023388106613659177, + "loss": 0.016, "step": 87370 }, { - "epoch": 0.94, - "learning_rate": 0.00015830576636180837, - "loss": 0.0131, + "epoch": 0.44, + "learning_rate": 0.00023387349844357776, + "loss": 0.0142, "step": 87380 }, { - "epoch": 0.94, - "learning_rate": 0.0001582895504962055, - "loss": 0.0107, + "epoch": 0.44, + "learning_rate": 0.00023386593075056376, + "loss": 0.0169, "step": 87390 }, { - "epoch": 0.94, - "learning_rate": 0.00015827333463060256, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.00023385836305754975, + "loss": 0.0189, "step": 87400 }, { - "epoch": 0.94, - "learning_rate": 0.00015825711876499965, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023385079536453573, + "loss": 0.016, "step": 87410 }, { - "epoch": 0.95, - "learning_rate": 0.00015824090289939677, - "loss": 0.0141, + "epoch": 0.44, + "learning_rate": 0.00023384322767152174, + "loss": 0.0152, "step": 87420 }, { - "epoch": 0.95, - "learning_rate": 0.00015822468703379386, - "loss": 0.0126, + "epoch": 0.44, + "learning_rate": 0.00023383565997850772, + "loss": 0.0168, "step": 87430 }, { - "epoch": 0.95, - "learning_rate": 0.00015820847116819093, - "loss": 0.0157, + "epoch": 0.44, + "learning_rate": 0.0002338280922854937, + "loss": 0.0142, "step": 87440 }, { - "epoch": 0.95, - "learning_rate": 0.00015819225530258802, - "loss": 0.0149, + "epoch": 0.44, + "learning_rate": 0.0002338205245924797, + "loss": 0.0186, "step": 87450 }, { - "epoch": 0.95, - "learning_rate": 0.00015817603943698514, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.0002338129568994657, + "loss": 0.0179, "step": 87460 }, { - "epoch": 0.95, - "learning_rate": 0.00015815982357138224, - "loss": 0.016, + "epoch": 0.44, + "learning_rate": 0.00023380538920645167, + "loss": 0.0174, "step": 87470 }, { - "epoch": 0.95, - "learning_rate": 0.0001581436077057793, - "loss": 0.016, + "epoch": 0.44, + "learning_rate": 0.00023379782151343768, + "loss": 0.0149, "step": 87480 }, { - "epoch": 0.95, - "learning_rate": 0.00015812739184017642, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.00023379025382042366, + "loss": 0.0194, "step": 87490 }, { - "epoch": 0.95, - "learning_rate": 0.0001581111759745735, - "loss": 0.0138, + "epoch": 0.44, + "learning_rate": 0.00023378268612740964, + "loss": 0.0167, "step": 87500 }, { - "epoch": 0.95, - "learning_rate": 0.0001580949601089706, - "loss": 0.0105, + "epoch": 0.44, + "learning_rate": 0.00023377511843439565, + "loss": 0.0138, "step": 87510 }, { - "epoch": 0.95, - "learning_rate": 0.00015807874424336767, - "loss": 0.013, + "epoch": 0.44, + "learning_rate": 0.00023376755074138163, + "loss": 0.0171, "step": 87520 }, { - "epoch": 0.95, - "learning_rate": 0.0001580625283777648, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.0002337599830483676, + "loss": 0.0178, "step": 87530 }, { - "epoch": 0.95, - "learning_rate": 0.00015804631251216188, - "loss": 0.0152, + "epoch": 0.44, + "learning_rate": 0.0002337524153553536, + "loss": 0.0156, "step": 87540 }, { - "epoch": 0.95, - "learning_rate": 0.00015803009664655898, - "loss": 0.0153, + "epoch": 0.44, + "learning_rate": 0.0002337448476623396, + "loss": 0.0217, "step": 87550 }, { - "epoch": 0.95, - "learning_rate": 0.00015801388078095607, - "loss": 0.0141, + "epoch": 0.44, + "learning_rate": 0.00023373727996932558, + "loss": 0.0163, "step": 87560 }, { - "epoch": 0.95, - "learning_rate": 0.00015799766491535316, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023372971227631157, + "loss": 0.0169, "step": 87570 }, { - "epoch": 0.95, - "learning_rate": 0.00015798144904975026, - "loss": 0.0144, + "epoch": 0.44, + "learning_rate": 0.00023372214458329757, + "loss": 0.02, "step": 87580 }, { - "epoch": 0.95, - "learning_rate": 0.00015796523318414738, - "loss": 0.0148, + "epoch": 0.44, + "learning_rate": 0.00023371457689028356, + "loss": 0.0147, "step": 87590 }, { - "epoch": 0.95, - "learning_rate": 0.00015794901731854444, - "loss": 0.0154, + "epoch": 0.44, + "learning_rate": 0.00023370700919726954, + "loss": 0.0192, "step": 87600 }, { - "epoch": 0.95, - "learning_rate": 0.00015793280145294153, - "loss": 0.0152, + "epoch": 0.44, + "learning_rate": 0.00023369944150425555, + "loss": 0.0147, "step": 87610 }, { - "epoch": 0.95, - "learning_rate": 0.00015791658558733863, - "loss": 0.0103, + "epoch": 0.44, + "learning_rate": 0.00023369187381124153, + "loss": 0.0226, "step": 87620 }, { - "epoch": 0.95, - "learning_rate": 0.00015790036972173575, - "loss": 0.016, + "epoch": 0.44, + "learning_rate": 0.0002336843061182275, + "loss": 0.0209, "step": 87630 }, { - "epoch": 0.95, - "learning_rate": 0.0001578841538561328, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023367673842521352, + "loss": 0.0165, "step": 87640 }, { - "epoch": 0.95, - "learning_rate": 0.0001578679379905299, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.0002336691707321995, + "loss": 0.0218, "step": 87650 }, { - "epoch": 0.95, - "learning_rate": 0.00015785172212492702, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.00023366160303918548, + "loss": 0.0169, "step": 87660 }, { - "epoch": 0.95, - "learning_rate": 0.00015783550625932412, - "loss": 0.0133, + "epoch": 0.44, + "learning_rate": 0.0002336540353461715, + "loss": 0.0139, "step": 87670 }, { - "epoch": 0.95, - "learning_rate": 0.00015781929039372118, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.00023364646765315747, + "loss": 0.0148, "step": 87680 }, { - "epoch": 0.95, - "learning_rate": 0.0001578030745281183, - "loss": 0.0134, + "epoch": 0.44, + "learning_rate": 0.00023363889996014345, + "loss": 0.0142, "step": 87690 }, { - "epoch": 0.95, - "learning_rate": 0.0001577868586625154, - "loss": 0.011, + "epoch": 0.44, + "learning_rate": 0.00023363133226712943, + "loss": 0.0135, "step": 87700 }, { - "epoch": 0.95, - "learning_rate": 0.0001577706427969125, - "loss": 0.0164, + "epoch": 0.44, + "learning_rate": 0.00023362376457411544, + "loss": 0.0161, "step": 87710 }, { - "epoch": 0.95, - "learning_rate": 0.00015775442693130955, - "loss": 0.0104, + "epoch": 0.44, + "learning_rate": 0.00023361619688110142, + "loss": 0.0164, "step": 87720 }, { - "epoch": 0.95, - "learning_rate": 0.00015773821106570667, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.0002336086291880874, + "loss": 0.0183, "step": 87730 }, { - "epoch": 0.95, - "learning_rate": 0.00015772199520010377, - "loss": 0.0146, + "epoch": 0.44, + "learning_rate": 0.0002336010614950734, + "loss": 0.0213, "step": 87740 }, { - "epoch": 0.95, - "learning_rate": 0.00015770577933450086, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.0002335934938020594, + "loss": 0.0156, "step": 87750 }, { - "epoch": 0.95, - "learning_rate": 0.00015768956346889798, - "loss": 0.0146, + "epoch": 0.44, + "learning_rate": 0.00023358592610904538, + "loss": 0.0202, "step": 87760 }, { - "epoch": 0.95, - "learning_rate": 0.00015767334760329504, - "loss": 0.013, + "epoch": 0.44, + "learning_rate": 0.00023357835841603138, + "loss": 0.0174, "step": 87770 }, { - "epoch": 0.95, - "learning_rate": 0.00015765713173769214, - "loss": 0.0153, + "epoch": 0.44, + "learning_rate": 0.00023357079072301737, + "loss": 0.0167, "step": 87780 }, { - "epoch": 0.95, - "learning_rate": 0.00015764091587208926, - "loss": 0.0138, + "epoch": 0.44, + "learning_rate": 0.00023356322303000335, + "loss": 0.0173, "step": 87790 }, { - "epoch": 0.95, - "learning_rate": 0.00015762470000648635, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.00023355565533698936, + "loss": 0.0182, "step": 87800 }, { - "epoch": 0.95, - "learning_rate": 0.00015760848414088342, - "loss": 0.0152, + "epoch": 0.44, + "learning_rate": 0.00023354808764397534, + "loss": 0.0163, "step": 87810 }, { - "epoch": 0.95, - "learning_rate": 0.0001575922682752805, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023354051995096132, + "loss": 0.017, "step": 87820 }, { - "epoch": 0.95, - "learning_rate": 0.00015757605240967763, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.00023353295225794733, + "loss": 0.0153, "step": 87830 }, { - "epoch": 0.95, - "learning_rate": 0.00015755983654407472, - "loss": 0.01, + "epoch": 0.44, + "learning_rate": 0.0002335253845649333, + "loss": 0.0165, "step": 87840 }, { - "epoch": 0.95, - "learning_rate": 0.0001575436206784718, - "loss": 0.0133, + "epoch": 0.44, + "learning_rate": 0.0002335178168719193, + "loss": 0.0151, "step": 87850 }, { - "epoch": 0.95, - "learning_rate": 0.0001575274048128689, - "loss": 0.0104, + "epoch": 0.44, + "learning_rate": 0.00023351024917890527, + "loss": 0.0186, "step": 87860 }, { - "epoch": 0.95, - "learning_rate": 0.000157511188947266, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.00023350268148589128, + "loss": 0.016, "step": 87870 }, { - "epoch": 0.95, - "learning_rate": 0.0001574949730816631, - "loss": 0.0136, + "epoch": 0.44, + "learning_rate": 0.00023349511379287726, + "loss": 0.016, "step": 87880 }, { - "epoch": 0.95, - "learning_rate": 0.00015747875721606016, - "loss": 0.0108, + "epoch": 0.44, + "learning_rate": 0.00023348754609986324, + "loss": 0.0159, "step": 87890 }, { - "epoch": 0.95, - "learning_rate": 0.00015746254135045728, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023347997840684925, + "loss": 0.0171, "step": 87900 }, { - "epoch": 0.95, - "learning_rate": 0.00015744632548485437, - "loss": 0.014, + "epoch": 0.44, + "learning_rate": 0.00023347241071383523, + "loss": 0.0177, "step": 87910 }, { - "epoch": 0.95, - "learning_rate": 0.0001574301096192515, - "loss": 0.0156, + "epoch": 0.44, + "learning_rate": 0.00023346484302082121, + "loss": 0.0154, "step": 87920 }, { - "epoch": 0.95, - "learning_rate": 0.00015741389375364856, - "loss": 0.0144, + "epoch": 0.44, + "learning_rate": 0.00023345727532780722, + "loss": 0.0172, "step": 87930 }, { - "epoch": 0.95, - "learning_rate": 0.00015739767788804565, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.0002334497076347932, + "loss": 0.0172, "step": 87940 }, { - "epoch": 0.95, - "learning_rate": 0.00015738146202244274, - "loss": 0.0135, + "epoch": 0.44, + "learning_rate": 0.00023344213994177919, + "loss": 0.0157, "step": 87950 }, { - "epoch": 0.95, - "learning_rate": 0.00015736524615683986, - "loss": 0.0136, + "epoch": 0.44, + "learning_rate": 0.0002334345722487652, + "loss": 0.0148, "step": 87960 }, { - "epoch": 0.95, - "learning_rate": 0.00015734903029123693, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.00023342700455575118, + "loss": 0.0168, "step": 87970 }, { - "epoch": 0.95, - "learning_rate": 0.00015733281442563402, - "loss": 0.0136, + "epoch": 0.44, + "learning_rate": 0.00023341943686273716, + "loss": 0.0173, "step": 87980 }, { - "epoch": 0.95, - "learning_rate": 0.00015731659856003114, - "loss": 0.0106, + "epoch": 0.44, + "learning_rate": 0.00023341186916972317, + "loss": 0.0205, "step": 87990 }, { - "epoch": 0.95, - "learning_rate": 0.00015730038269442823, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.00023340430147670915, + "loss": 0.019, "step": 88000 }, { - "epoch": 0.95, - "eval_cer": 0.9215382263475072, - "eval_loss": 0.009381990879774094, - "eval_runtime": 121.3259, - "eval_samples_per_second": 16.485, - "eval_steps_per_second": 4.121, + "epoch": 0.44, + "eval_cer": 0.9145042197675514, + "eval_loss": 0.011925076134502888, + "eval_runtime": 116.6489, + "eval_samples_per_second": 17.145, + "eval_steps_per_second": 4.286, "step": 88000 }, { - "epoch": 0.95, - "learning_rate": 0.0001572841668288253, - "loss": 0.0133, + "epoch": 0.44, + "learning_rate": 0.00023339673378369513, + "loss": 0.0132, "step": 88010 }, { - "epoch": 0.95, - "learning_rate": 0.0001572679509632224, - "loss": 0.0147, + "epoch": 0.44, + "learning_rate": 0.00023338916609068114, + "loss": 0.0178, "step": 88020 }, { - "epoch": 0.95, - "learning_rate": 0.0001572517350976195, - "loss": 0.0137, + "epoch": 0.44, + "learning_rate": 0.00023338159839766712, + "loss": 0.0176, "step": 88030 }, { - "epoch": 0.95, - "learning_rate": 0.0001572355192320166, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.0002333740307046531, + "loss": 0.0148, "step": 88040 }, { - "epoch": 0.95, - "learning_rate": 0.00015721930336641367, - "loss": 0.0126, + "epoch": 0.44, + "learning_rate": 0.00023336646301163908, + "loss": 0.0163, "step": 88050 }, { - "epoch": 0.95, - "learning_rate": 0.0001572030875008108, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.0002333588953186251, + "loss": 0.0156, "step": 88060 }, { - "epoch": 0.95, - "learning_rate": 0.00015718687163520788, - "loss": 0.015, + "epoch": 0.44, + "learning_rate": 0.00023335132762561107, + "loss": 0.0207, "step": 88070 }, { - "epoch": 0.95, - "learning_rate": 0.00015717065576960497, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023334375993259705, + "loss": 0.0164, "step": 88080 }, { - "epoch": 0.95, - "learning_rate": 0.00015715443990400204, - "loss": 0.0132, + "epoch": 0.44, + "learning_rate": 0.00023333619223958306, + "loss": 0.0148, "step": 88090 }, { - "epoch": 0.95, - "learning_rate": 0.00015713822403839916, - "loss": 0.014, + "epoch": 0.44, + "learning_rate": 0.00023332862454656904, + "loss": 0.0157, "step": 88100 }, { - "epoch": 0.95, - "learning_rate": 0.00015712200817279625, - "loss": 0.0106, + "epoch": 0.44, + "learning_rate": 0.00023332105685355502, + "loss": 0.0205, "step": 88110 }, { - "epoch": 0.95, - "learning_rate": 0.00015710579230719334, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.00023331348916054103, + "loss": 0.0174, "step": 88120 }, { - "epoch": 0.95, - "learning_rate": 0.00015708957644159044, - "loss": 0.0156, + "epoch": 0.44, + "learning_rate": 0.00023330592146752701, + "loss": 0.0187, "step": 88130 }, { - "epoch": 0.95, - "learning_rate": 0.00015707336057598753, - "loss": 0.0141, + "epoch": 0.44, + "learning_rate": 0.000233298353774513, + "loss": 0.0189, "step": 88140 }, { - "epoch": 0.95, - "learning_rate": 0.00015705714471038462, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.000233290786081499, + "loss": 0.0156, "step": 88150 }, { - "epoch": 0.95, - "learning_rate": 0.00015704092884478174, - "loss": 0.0137, + "epoch": 0.44, + "learning_rate": 0.00023328321838848499, + "loss": 0.0185, "step": 88160 }, { - "epoch": 0.95, - "learning_rate": 0.0001570247129791788, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.00023327565069547097, + "loss": 0.0164, "step": 88170 }, { - "epoch": 0.95, - "learning_rate": 0.0001570084971135759, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.00023326808300245698, + "loss": 0.0176, "step": 88180 }, { - "epoch": 0.95, - "learning_rate": 0.000156992281247973, - "loss": 0.0143, + "epoch": 0.44, + "learning_rate": 0.00023326051530944296, + "loss": 0.0132, "step": 88190 }, { - "epoch": 0.95, - "learning_rate": 0.00015697606538237011, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023325294761642894, + "loss": 0.016, "step": 88200 }, { - "epoch": 0.95, - "learning_rate": 0.00015695984951676718, - "loss": 0.0149, + "epoch": 0.45, + "learning_rate": 0.00023324537992341492, + "loss": 0.0175, "step": 88210 }, { - "epoch": 0.95, - "learning_rate": 0.00015694363365116427, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023323781223040093, + "loss": 0.0136, "step": 88220 }, { - "epoch": 0.95, - "learning_rate": 0.0001569274177855614, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.0002332302445373869, + "loss": 0.0161, "step": 88230 }, { - "epoch": 0.95, - "learning_rate": 0.00015691120191995848, - "loss": 0.0132, + "epoch": 0.45, + "learning_rate": 0.0002332226768443729, + "loss": 0.0184, "step": 88240 }, { - "epoch": 0.95, - "learning_rate": 0.00015689498605435555, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.0002332151091513589, + "loss": 0.015, "step": 88250 }, { - "epoch": 0.95, - "learning_rate": 0.00015687877018875264, - "loss": 0.0136, + "epoch": 0.45, + "learning_rate": 0.00023320754145834488, + "loss": 0.0202, "step": 88260 }, { - "epoch": 0.95, - "learning_rate": 0.00015686255432314976, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023319997376533086, + "loss": 0.0182, "step": 88270 }, { - "epoch": 0.95, - "learning_rate": 0.00015684633845754686, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023319240607231687, + "loss": 0.0161, "step": 88280 }, { - "epoch": 0.95, - "learning_rate": 0.00015683012259194392, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.00023318483837930285, + "loss": 0.0142, "step": 88290 }, { - "epoch": 0.95, - "learning_rate": 0.00015681390672634104, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023317727068628883, + "loss": 0.0176, "step": 88300 }, { - "epoch": 0.95, - "learning_rate": 0.00015679769086073813, - "loss": 0.0105, + "epoch": 0.45, + "learning_rate": 0.00023316970299327484, + "loss": 0.0203, "step": 88310 }, { - "epoch": 0.95, - "learning_rate": 0.00015678147499513523, - "loss": 0.0129, + "epoch": 0.45, + "learning_rate": 0.00023316213530026082, + "loss": 0.0157, "step": 88320 }, { - "epoch": 0.95, - "learning_rate": 0.0001567652591295323, - "loss": 0.0153, + "epoch": 0.45, + "learning_rate": 0.0002331545676072468, + "loss": 0.0189, "step": 88330 }, { - "epoch": 0.95, - "learning_rate": 0.0001567490432639294, - "loss": 0.0178, + "epoch": 0.45, + "learning_rate": 0.00023314699991423281, + "loss": 0.0163, "step": 88340 }, { - "epoch": 0.96, - "learning_rate": 0.0001567328273983265, - "loss": 0.0166, + "epoch": 0.45, + "learning_rate": 0.0002331394322212188, + "loss": 0.0159, "step": 88350 }, { - "epoch": 0.96, - "learning_rate": 0.00015671661153272363, - "loss": 0.0148, + "epoch": 0.45, + "learning_rate": 0.00023313186452820478, + "loss": 0.0182, "step": 88360 }, { - "epoch": 0.96, - "learning_rate": 0.0001567003956671207, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023312429683519076, + "loss": 0.0168, "step": 88370 }, { - "epoch": 0.96, - "learning_rate": 0.00015668417980151778, - "loss": 0.014, + "epoch": 0.45, + "learning_rate": 0.00023311672914217677, + "loss": 0.016, "step": 88380 }, { - "epoch": 0.96, - "learning_rate": 0.00015666796393591488, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.00023310916144916275, + "loss": 0.0198, "step": 88390 }, { - "epoch": 0.96, - "learning_rate": 0.000156651748070312, - "loss": 0.0111, + "epoch": 0.45, + "learning_rate": 0.00023310159375614873, + "loss": 0.018, "step": 88400 }, { - "epoch": 0.96, - "learning_rate": 0.00015663553220470906, - "loss": 0.0119, + "epoch": 0.45, + "learning_rate": 0.00023309402606313474, + "loss": 0.0168, "step": 88410 }, { - "epoch": 0.96, - "learning_rate": 0.00015661931633910615, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.00023308645837012072, + "loss": 0.019, "step": 88420 }, { - "epoch": 0.96, - "learning_rate": 0.00015660310047350327, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.0002330788906771067, + "loss": 0.0175, "step": 88430 }, { - "epoch": 0.96, - "learning_rate": 0.00015658688460790037, - "loss": 0.0114, + "epoch": 0.45, + "learning_rate": 0.0002330713229840927, + "loss": 0.0205, "step": 88440 }, { - "epoch": 0.96, - "learning_rate": 0.00015657066874229743, - "loss": 0.0168, + "epoch": 0.45, + "learning_rate": 0.0002330637552910787, + "loss": 0.0187, "step": 88450 }, { - "epoch": 0.96, - "learning_rate": 0.00015655445287669453, - "loss": 0.0176, + "epoch": 0.45, + "learning_rate": 0.00023305618759806467, + "loss": 0.0158, "step": 88460 }, { - "epoch": 0.96, - "learning_rate": 0.00015653823701109165, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.00023304861990505068, + "loss": 0.0181, "step": 88470 }, { - "epoch": 0.96, - "learning_rate": 0.00015652202114548874, - "loss": 0.0116, + "epoch": 0.45, + "learning_rate": 0.00023304105221203666, + "loss": 0.0167, "step": 88480 }, { - "epoch": 0.96, - "learning_rate": 0.00015650580527988583, - "loss": 0.0117, + "epoch": 0.45, + "learning_rate": 0.00023303348451902264, + "loss": 0.0165, "step": 88490 }, { - "epoch": 0.96, - "learning_rate": 0.00015648958941428292, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.00023302591682600865, + "loss": 0.0164, "step": 88500 }, { - "epoch": 0.96, - "learning_rate": 0.00015647337354868002, - "loss": 0.0145, + "epoch": 0.45, + "learning_rate": 0.00023301834913299463, + "loss": 0.018, "step": 88510 }, { - "epoch": 0.96, - "learning_rate": 0.0001564571576830771, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023301078143998062, + "loss": 0.0186, "step": 88520 }, { - "epoch": 0.96, - "learning_rate": 0.00015644094181747423, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.00023300321374696662, + "loss": 0.0172, "step": 88530 }, { - "epoch": 0.96, - "learning_rate": 0.0001564247259518713, - "loss": 0.0122, + "epoch": 0.45, + "learning_rate": 0.0002329956460539526, + "loss": 0.0157, "step": 88540 }, { - "epoch": 0.96, - "learning_rate": 0.0001564085100862684, - "loss": 0.0139, + "epoch": 0.45, + "learning_rate": 0.0002329880783609386, + "loss": 0.0197, "step": 88550 }, { - "epoch": 0.96, - "learning_rate": 0.00015639229422066548, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023298051066792457, + "loss": 0.017, "step": 88560 }, { - "epoch": 0.96, - "learning_rate": 0.0001563760783550626, - "loss": 0.0154, + "epoch": 0.45, + "learning_rate": 0.00023297294297491058, + "loss": 0.0136, "step": 88570 }, { - "epoch": 0.96, - "learning_rate": 0.00015635986248945967, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023296537528189656, + "loss": 0.0144, "step": 88580 }, { - "epoch": 0.96, - "learning_rate": 0.00015634364662385676, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023295780758888254, + "loss": 0.0136, "step": 88590 }, { - "epoch": 0.96, - "learning_rate": 0.00015632743075825388, - "loss": 0.0155, + "epoch": 0.45, + "learning_rate": 0.00023295023989586855, + "loss": 0.017, "step": 88600 }, { - "epoch": 0.96, - "learning_rate": 0.00015631121489265097, - "loss": 0.0188, + "epoch": 0.45, + "learning_rate": 0.00023294267220285453, + "loss": 0.0172, "step": 88610 }, { - "epoch": 0.96, - "learning_rate": 0.00015629499902704804, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.00023293510450984048, + "loss": 0.0182, "step": 88620 }, { - "epoch": 0.96, - "learning_rate": 0.00015627878316144513, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023292753681682647, + "loss": 0.0153, "step": 88630 }, { - "epoch": 0.96, - "learning_rate": 0.00015626256729584225, - "loss": 0.0102, + "epoch": 0.45, + "learning_rate": 0.00023291996912381247, + "loss": 0.0177, "step": 88640 }, { - "epoch": 0.96, - "learning_rate": 0.00015624635143023934, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.00023291240143079846, + "loss": 0.0148, "step": 88650 }, { - "epoch": 0.96, - "learning_rate": 0.0001562301355646364, - "loss": 0.0136, + "epoch": 0.45, + "learning_rate": 0.00023290483373778444, + "loss": 0.0167, "step": 88660 }, { - "epoch": 0.96, - "learning_rate": 0.00015621391969903353, - "loss": 0.0178, + "epoch": 0.45, + "learning_rate": 0.00023289726604477045, + "loss": 0.0172, "step": 88670 }, { - "epoch": 0.96, - "learning_rate": 0.00015619770383343062, - "loss": 0.0143, + "epoch": 0.45, + "learning_rate": 0.00023288969835175643, + "loss": 0.014, "step": 88680 }, { - "epoch": 0.96, - "learning_rate": 0.0001561814879678277, - "loss": 0.0108, + "epoch": 0.45, + "learning_rate": 0.0002328821306587424, + "loss": 0.0171, "step": 88690 }, { - "epoch": 0.96, - "learning_rate": 0.0001561652721022248, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023287456296572842, + "loss": 0.0229, "step": 88700 }, { - "epoch": 0.96, - "learning_rate": 0.0001561490562366219, - "loss": 0.0144, + "epoch": 0.45, + "learning_rate": 0.0002328669952727144, + "loss": 0.0173, "step": 88710 }, { - "epoch": 0.96, - "learning_rate": 0.000156132840371019, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023285942757970038, + "loss": 0.0181, "step": 88720 }, { - "epoch": 0.96, - "learning_rate": 0.0001561166245054161, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.0002328518598866864, + "loss": 0.0206, "step": 88730 }, { - "epoch": 0.96, - "learning_rate": 0.00015610040863981318, - "loss": 0.0134, + "epoch": 0.45, + "learning_rate": 0.00023284429219367237, + "loss": 0.0186, "step": 88740 }, { - "epoch": 0.96, - "learning_rate": 0.00015608419277421027, - "loss": 0.0142, + "epoch": 0.45, + "learning_rate": 0.00023283672450065835, + "loss": 0.014, "step": 88750 }, { - "epoch": 0.96, - "learning_rate": 0.00015606797690860736, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.00023282915680764433, + "loss": 0.0172, "step": 88760 }, { - "epoch": 0.96, - "learning_rate": 0.00015605176104300448, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023282158911463034, + "loss": 0.0184, "step": 88770 }, { - "epoch": 0.96, - "learning_rate": 0.00015603554517740155, - "loss": 0.0142, + "epoch": 0.45, + "learning_rate": 0.00023281402142161632, + "loss": 0.0158, "step": 88780 }, { - "epoch": 0.96, - "learning_rate": 0.00015601932931179864, - "loss": 0.011, + "epoch": 0.45, + "learning_rate": 0.0002328064537286023, + "loss": 0.0191, "step": 88790 }, { - "epoch": 0.96, - "learning_rate": 0.00015600311344619576, - "loss": 0.011, + "epoch": 0.45, + "learning_rate": 0.0002327988860355883, + "loss": 0.0208, "step": 88800 }, { - "epoch": 0.96, - "learning_rate": 0.00015598689758059285, - "loss": 0.0143, + "epoch": 0.45, + "learning_rate": 0.0002327913183425743, + "loss": 0.0166, "step": 88810 }, { - "epoch": 0.96, - "learning_rate": 0.00015597068171498992, - "loss": 0.0151, + "epoch": 0.45, + "learning_rate": 0.00023278375064956028, + "loss": 0.0134, "step": 88820 }, { - "epoch": 0.96, - "learning_rate": 0.000155954465849387, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023277618295654628, + "loss": 0.0185, "step": 88830 }, { - "epoch": 0.96, - "learning_rate": 0.00015593824998378413, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023276861526353227, + "loss": 0.0174, "step": 88840 }, { - "epoch": 0.96, - "learning_rate": 0.00015592203411818122, - "loss": 0.0129, + "epoch": 0.45, + "learning_rate": 0.00023276104757051825, + "loss": 0.0149, "step": 88850 }, { - "epoch": 0.96, - "learning_rate": 0.0001559058182525783, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.00023275347987750426, + "loss": 0.0165, "step": 88860 }, { - "epoch": 0.96, - "learning_rate": 0.0001558896023869754, - "loss": 0.0108, + "epoch": 0.45, + "learning_rate": 0.00023274591218449024, + "loss": 0.0163, "step": 88870 }, { - "epoch": 0.96, - "learning_rate": 0.0001558733865213725, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023273834449147622, + "loss": 0.0157, "step": 88880 }, { - "epoch": 0.96, - "learning_rate": 0.0001558571706557696, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023273077679846223, + "loss": 0.0165, "step": 88890 }, { - "epoch": 0.96, - "learning_rate": 0.00015584095479016666, - "loss": 0.0136, + "epoch": 0.45, + "learning_rate": 0.0002327232091054482, + "loss": 0.0216, "step": 88900 }, { - "epoch": 0.96, - "learning_rate": 0.00015582473892456378, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.0002327156414124342, + "loss": 0.0164, "step": 88910 }, { - "epoch": 0.96, - "learning_rate": 0.00015580852305896087, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.0002327080737194202, + "loss": 0.0183, "step": 88920 }, { - "epoch": 0.96, - "learning_rate": 0.000155792307193358, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.00023270050602640618, + "loss": 0.0163, "step": 88930 }, { - "epoch": 0.96, - "learning_rate": 0.00015577609132775506, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023269293833339216, + "loss": 0.0175, "step": 88940 }, { - "epoch": 0.96, - "learning_rate": 0.00015575987546215215, - "loss": 0.0141, + "epoch": 0.45, + "learning_rate": 0.00023268537064037814, + "loss": 0.023, "step": 88950 }, { - "epoch": 0.96, - "learning_rate": 0.00015574365959654924, - "loss": 0.0146, + "epoch": 0.45, + "learning_rate": 0.00023267780294736415, + "loss": 0.0185, "step": 88960 }, { - "epoch": 0.96, - "learning_rate": 0.00015572744373094636, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023267023525435013, + "loss": 0.0168, "step": 88970 }, { - "epoch": 0.96, - "learning_rate": 0.00015571122786534343, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.00023266266756133611, + "loss": 0.0144, "step": 88980 }, { - "epoch": 0.96, - "learning_rate": 0.00015569501199974052, - "loss": 0.016, + "epoch": 0.45, + "learning_rate": 0.00023265509986832212, + "loss": 0.0162, "step": 88990 }, { - "epoch": 0.96, - "learning_rate": 0.00015567879613413764, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.0002326475321753081, + "loss": 0.0146, "step": 89000 }, { - "epoch": 0.96, - "eval_cer": 0.9215721018628059, - "eval_loss": 0.008774230256676674, - "eval_runtime": 121.1545, - "eval_samples_per_second": 16.508, - "eval_steps_per_second": 4.127, + "epoch": 0.45, + "eval_cer": 0.9144906342217957, + "eval_loss": 0.01203860528767109, + "eval_runtime": 116.6624, + "eval_samples_per_second": 17.143, + "eval_steps_per_second": 4.286, "step": 89000 }, { - "epoch": 0.96, - "learning_rate": 0.00015566258026853473, - "loss": 0.0099, + "epoch": 0.45, + "learning_rate": 0.00023263996448229409, + "loss": 0.0206, "step": 89010 }, { - "epoch": 0.96, - "learning_rate": 0.0001556463644029318, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.0002326323967892801, + "loss": 0.0151, "step": 89020 }, { - "epoch": 0.96, - "learning_rate": 0.0001556301485373289, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023262482909626608, + "loss": 0.0156, "step": 89030 }, { - "epoch": 0.96, - "learning_rate": 0.000155613932671726, - "loss": 0.0141, + "epoch": 0.45, + "learning_rate": 0.00023261726140325206, + "loss": 0.0193, "step": 89040 }, { - "epoch": 0.96, - "learning_rate": 0.0001555977168061231, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.00023260969371023807, + "loss": 0.0177, "step": 89050 }, { - "epoch": 0.96, - "learning_rate": 0.00015558150094052017, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023260212601722405, + "loss": 0.0126, "step": 89060 }, { - "epoch": 0.96, - "learning_rate": 0.0001555652850749173, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023259455832421003, + "loss": 0.0178, "step": 89070 }, { - "epoch": 0.96, - "learning_rate": 0.00015554906920931438, - "loss": 0.0153, + "epoch": 0.45, + "learning_rate": 0.00023258699063119604, + "loss": 0.0148, "step": 89080 }, { - "epoch": 0.96, - "learning_rate": 0.00015553285334371148, - "loss": 0.014, + "epoch": 0.45, + "learning_rate": 0.00023257942293818202, + "loss": 0.0187, "step": 89090 }, { - "epoch": 0.96, - "learning_rate": 0.00015551663747810854, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.000232571855245168, + "loss": 0.0183, "step": 89100 }, { - "epoch": 0.96, - "learning_rate": 0.00015550042161250566, - "loss": 0.0138, + "epoch": 0.45, + "learning_rate": 0.00023256428755215398, + "loss": 0.0152, "step": 89110 }, { - "epoch": 0.96, - "learning_rate": 0.00015548420574690275, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.00023255671985914, + "loss": 0.017, "step": 89120 }, { - "epoch": 0.96, - "learning_rate": 0.00015546798988129985, - "loss": 0.0159, + "epoch": 0.45, + "learning_rate": 0.00023254915216612597, + "loss": 0.0177, "step": 89130 }, { - "epoch": 0.96, - "learning_rate": 0.00015545177401569694, - "loss": 0.0138, + "epoch": 0.45, + "learning_rate": 0.00023254158447311195, + "loss": 0.0146, "step": 89140 }, { - "epoch": 0.96, - "learning_rate": 0.00015543555815009403, - "loss": 0.0143, + "epoch": 0.45, + "learning_rate": 0.00023253401678009796, + "loss": 0.0181, "step": 89150 }, { - "epoch": 0.96, - "learning_rate": 0.00015541934228449113, - "loss": 0.0137, + "epoch": 0.45, + "learning_rate": 0.00023252644908708394, + "loss": 0.0179, "step": 89160 }, { - "epoch": 0.96, - "learning_rate": 0.00015540312641888825, - "loss": 0.0137, + "epoch": 0.45, + "learning_rate": 0.00023251888139406992, + "loss": 0.0158, "step": 89170 }, { - "epoch": 0.96, - "learning_rate": 0.0001553869105532853, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023251131370105593, + "loss": 0.0187, "step": 89180 }, { - "epoch": 0.96, - "learning_rate": 0.0001553706946876824, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.00023250374600804191, + "loss": 0.0164, "step": 89190 }, { - "epoch": 0.96, - "learning_rate": 0.0001553544788220795, - "loss": 0.0134, + "epoch": 0.45, + "learning_rate": 0.0002324961783150279, + "loss": 0.0138, "step": 89200 }, { - "epoch": 0.96, - "learning_rate": 0.00015533826295647662, - "loss": 0.0132, + "epoch": 0.45, + "learning_rate": 0.0002324886106220139, + "loss": 0.0152, "step": 89210 }, { - "epoch": 0.96, - "learning_rate": 0.0001553220470908737, - "loss": 0.014, + "epoch": 0.45, + "learning_rate": 0.00023248104292899989, + "loss": 0.0161, "step": 89220 }, { - "epoch": 0.96, - "learning_rate": 0.00015530583122527077, - "loss": 0.0117, + "epoch": 0.45, + "learning_rate": 0.00023247347523598587, + "loss": 0.0172, "step": 89230 }, { - "epoch": 0.96, - "learning_rate": 0.0001552896153596679, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023246590754297188, + "loss": 0.0216, "step": 89240 }, { - "epoch": 0.96, - "learning_rate": 0.000155273399494065, - "loss": 0.0122, + "epoch": 0.45, + "learning_rate": 0.00023245833984995786, + "loss": 0.0152, "step": 89250 }, { - "epoch": 0.96, - "learning_rate": 0.00015525718362846208, - "loss": 0.0129, + "epoch": 0.45, + "learning_rate": 0.00023245077215694384, + "loss": 0.0187, "step": 89260 }, { - "epoch": 0.97, - "learning_rate": 0.00015524096776285915, - "loss": 0.0137, + "epoch": 0.45, + "learning_rate": 0.00023244320446392982, + "loss": 0.0173, "step": 89270 }, { - "epoch": 0.97, - "learning_rate": 0.00015522475189725627, - "loss": 0.0152, + "epoch": 0.45, + "learning_rate": 0.00023243563677091583, + "loss": 0.0155, "step": 89280 }, { - "epoch": 0.97, - "learning_rate": 0.00015520853603165336, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.0002324280690779018, + "loss": 0.0158, "step": 89290 }, { - "epoch": 0.97, - "learning_rate": 0.00015519232016605048, - "loss": 0.0148, + "epoch": 0.45, + "learning_rate": 0.0002324205013848878, + "loss": 0.0177, "step": 89300 }, { - "epoch": 0.97, - "learning_rate": 0.00015517610430044754, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.0002324129336918738, + "loss": 0.0223, "step": 89310 }, { - "epoch": 0.97, - "learning_rate": 0.00015515988843484464, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.00023240536599885978, + "loss": 0.0172, "step": 89320 }, { - "epoch": 0.97, - "learning_rate": 0.00015514367256924173, - "loss": 0.0098, + "epoch": 0.45, + "learning_rate": 0.00023239779830584576, + "loss": 0.0197, "step": 89330 }, { - "epoch": 0.97, - "learning_rate": 0.00015512745670363885, - "loss": 0.0122, + "epoch": 0.45, + "learning_rate": 0.00023239023061283177, + "loss": 0.0157, "step": 89340 }, { - "epoch": 0.97, - "learning_rate": 0.00015511124083803592, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023238266291981775, + "loss": 0.0156, "step": 89350 }, { - "epoch": 0.97, - "learning_rate": 0.000155095024972433, - "loss": 0.0119, + "epoch": 0.45, + "learning_rate": 0.00023237509522680373, + "loss": 0.0146, "step": 89360 }, { - "epoch": 0.97, - "learning_rate": 0.00015507880910683013, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023236752753378974, + "loss": 0.0138, "step": 89370 }, { - "epoch": 0.97, - "learning_rate": 0.00015506259324122722, - "loss": 0.0133, + "epoch": 0.45, + "learning_rate": 0.00023235995984077572, + "loss": 0.0142, "step": 89380 }, { - "epoch": 0.97, - "learning_rate": 0.00015504637737562429, - "loss": 0.0129, + "epoch": 0.45, + "learning_rate": 0.0002323523921477617, + "loss": 0.0192, "step": 89390 }, { - "epoch": 0.97, - "learning_rate": 0.00015503016151002138, - "loss": 0.0122, + "epoch": 0.45, + "learning_rate": 0.00023234482445474771, + "loss": 0.0189, "step": 89400 }, { - "epoch": 0.97, - "learning_rate": 0.0001550139456444185, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.0002323372567617337, + "loss": 0.0165, "step": 89410 }, { - "epoch": 0.97, - "learning_rate": 0.0001549977297788156, - "loss": 0.0139, + "epoch": 0.45, + "learning_rate": 0.00023232968906871968, + "loss": 0.016, "step": 89420 }, { - "epoch": 0.97, - "learning_rate": 0.00015498151391321266, - "loss": 0.0111, + "epoch": 0.45, + "learning_rate": 0.00023232212137570566, + "loss": 0.0171, "step": 89430 }, { - "epoch": 0.97, - "learning_rate": 0.00015496529804760978, - "loss": 0.0106, + "epoch": 0.45, + "learning_rate": 0.00023231455368269167, + "loss": 0.0133, "step": 89440 }, { - "epoch": 0.97, - "learning_rate": 0.00015494908218200687, - "loss": 0.0137, + "epoch": 0.45, + "learning_rate": 0.00023230698598967765, + "loss": 0.0127, "step": 89450 }, { - "epoch": 0.97, - "learning_rate": 0.00015493286631640396, - "loss": 0.015, + "epoch": 0.45, + "learning_rate": 0.00023229941829666363, + "loss": 0.0155, "step": 89460 }, { - "epoch": 0.97, - "learning_rate": 0.00015491665045080103, - "loss": 0.0145, + "epoch": 0.45, + "learning_rate": 0.00023229185060364964, + "loss": 0.017, "step": 89470 }, { - "epoch": 0.97, - "learning_rate": 0.00015490043458519815, - "loss": 0.0103, + "epoch": 0.45, + "learning_rate": 0.00023228428291063562, + "loss": 0.0136, "step": 89480 }, { - "epoch": 0.97, - "learning_rate": 0.00015488421871959524, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.0002322767152176216, + "loss": 0.018, "step": 89490 }, { - "epoch": 0.97, - "learning_rate": 0.00015486800285399233, - "loss": 0.0134, + "epoch": 0.45, + "learning_rate": 0.0002322691475246076, + "loss": 0.0151, "step": 89500 }, { - "epoch": 0.97, - "learning_rate": 0.00015485178698838943, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.0002322615798315936, + "loss": 0.0158, "step": 89510 }, { - "epoch": 0.97, - "learning_rate": 0.00015483557112278652, - "loss": 0.0122, + "epoch": 0.45, + "learning_rate": 0.00023225401213857957, + "loss": 0.0214, "step": 89520 }, { - "epoch": 0.97, - "learning_rate": 0.0001548193552571836, - "loss": 0.0114, + "epoch": 0.45, + "learning_rate": 0.00023224644444556558, + "loss": 0.0207, "step": 89530 }, { - "epoch": 0.97, - "learning_rate": 0.00015480313939158073, - "loss": 0.0168, + "epoch": 0.45, + "learning_rate": 0.00023223887675255156, + "loss": 0.0157, "step": 89540 }, { - "epoch": 0.97, - "learning_rate": 0.0001547869235259778, - "loss": 0.0144, + "epoch": 0.45, + "learning_rate": 0.00023223130905953754, + "loss": 0.018, "step": 89550 }, { - "epoch": 0.97, - "learning_rate": 0.0001547707076603749, - "loss": 0.0162, + "epoch": 0.45, + "learning_rate": 0.00023222374136652355, + "loss": 0.0153, "step": 89560 }, { - "epoch": 0.97, - "learning_rate": 0.00015475449179477198, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023221617367350953, + "loss": 0.0168, "step": 89570 }, { - "epoch": 0.97, - "learning_rate": 0.0001547382759291691, - "loss": 0.0133, + "epoch": 0.45, + "learning_rate": 0.00023220860598049552, + "loss": 0.0153, "step": 89580 }, { - "epoch": 0.97, - "learning_rate": 0.00015472206006356617, - "loss": 0.0095, + "epoch": 0.45, + "learning_rate": 0.00023220103828748152, + "loss": 0.0172, "step": 89590 }, { - "epoch": 0.97, - "learning_rate": 0.00015470584419796326, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.0002321934705944675, + "loss": 0.0229, "step": 89600 }, { - "epoch": 0.97, - "learning_rate": 0.00015468962833236038, - "loss": 0.0166, + "epoch": 0.45, + "learning_rate": 0.0002321859029014535, + "loss": 0.0186, "step": 89610 }, { - "epoch": 0.97, - "learning_rate": 0.00015467341246675747, - "loss": 0.0119, + "epoch": 0.45, + "learning_rate": 0.00023217833520843947, + "loss": 0.0167, "step": 89620 }, { - "epoch": 0.97, - "learning_rate": 0.00015465719660115454, - "loss": 0.0159, + "epoch": 0.45, + "learning_rate": 0.00023217076751542548, + "loss": 0.0154, "step": 89630 }, { - "epoch": 0.97, - "learning_rate": 0.00015464098073555163, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.00023216319982241146, + "loss": 0.0152, "step": 89640 }, { - "epoch": 0.97, - "learning_rate": 0.00015462476486994875, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023215563212939744, + "loss": 0.0156, "step": 89650 }, { - "epoch": 0.97, - "learning_rate": 0.00015460854900434584, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.00023214806443638345, + "loss": 0.0174, "step": 89660 }, { - "epoch": 0.97, - "learning_rate": 0.0001545923331387429, - "loss": 0.0158, + "epoch": 0.45, + "learning_rate": 0.00023214049674336943, + "loss": 0.0186, "step": 89670 }, { - "epoch": 0.97, - "learning_rate": 0.00015457611727314003, - "loss": 0.0128, + "epoch": 0.45, + "learning_rate": 0.0002321329290503554, + "loss": 0.0169, "step": 89680 }, { - "epoch": 0.97, - "learning_rate": 0.00015455990140753712, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.00023212536135734142, + "loss": 0.0139, "step": 89690 }, { - "epoch": 0.97, - "learning_rate": 0.00015454368554193422, - "loss": 0.0143, + "epoch": 0.45, + "learning_rate": 0.0002321177936643274, + "loss": 0.0133, "step": 89700 }, { - "epoch": 0.97, - "learning_rate": 0.0001545274696763313, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023211022597131338, + "loss": 0.0133, "step": 89710 }, { - "epoch": 0.97, - "learning_rate": 0.0001545112538107284, - "loss": 0.0114, + "epoch": 0.45, + "learning_rate": 0.0002321026582782994, + "loss": 0.0154, "step": 89720 }, { - "epoch": 0.97, - "learning_rate": 0.0001544950379451255, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.00023209509058528537, + "loss": 0.0154, "step": 89730 }, { - "epoch": 0.97, - "learning_rate": 0.0001544788220795226, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023208752289227135, + "loss": 0.0176, "step": 89740 }, { - "epoch": 0.97, - "learning_rate": 0.00015446260621391968, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023207995519925736, + "loss": 0.0167, "step": 89750 }, { - "epoch": 0.97, - "learning_rate": 0.00015444639034831677, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023207238750624334, + "loss": 0.0197, "step": 89760 }, { - "epoch": 0.97, - "learning_rate": 0.00015443017448271386, - "loss": 0.0106, + "epoch": 0.45, + "learning_rate": 0.00023206481981322933, + "loss": 0.0126, "step": 89770 }, { - "epoch": 0.97, - "learning_rate": 0.00015441395861711098, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.0002320572521202153, + "loss": 0.0146, "step": 89780 }, { - "epoch": 0.97, - "learning_rate": 0.00015439774275150805, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023204968442720132, + "loss": 0.0126, "step": 89790 }, { - "epoch": 0.97, - "learning_rate": 0.00015438152688590514, - "loss": 0.0117, + "epoch": 0.45, + "learning_rate": 0.0002320421167341873, + "loss": 0.0174, "step": 89800 }, { - "epoch": 0.97, - "learning_rate": 0.00015436531102030226, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.00023203454904117328, + "loss": 0.0147, "step": 89810 }, { - "epoch": 0.97, - "learning_rate": 0.00015434909515469936, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.0002320269813481593, + "loss": 0.0167, "step": 89820 }, { - "epoch": 0.97, - "learning_rate": 0.00015433287928909642, - "loss": 0.0148, + "epoch": 0.45, + "learning_rate": 0.00023201941365514527, + "loss": 0.0202, "step": 89830 }, { - "epoch": 0.97, - "learning_rate": 0.00015431666342349351, - "loss": 0.0094, + "epoch": 0.45, + "learning_rate": 0.00023201184596213125, + "loss": 0.0135, "step": 89840 }, { - "epoch": 0.97, - "learning_rate": 0.00015430044755789063, - "loss": 0.0141, + "epoch": 0.45, + "learning_rate": 0.00023200427826911726, + "loss": 0.0138, "step": 89850 }, { - "epoch": 0.97, - "learning_rate": 0.00015428423169228773, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023199671057610324, + "loss": 0.0158, "step": 89860 }, { - "epoch": 0.97, - "learning_rate": 0.0001542680158266848, - "loss": 0.0147, + "epoch": 0.45, + "learning_rate": 0.0002319891428830892, + "loss": 0.015, "step": 89870 }, { - "epoch": 0.97, - "learning_rate": 0.0001542517999610819, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.00023198157519007518, + "loss": 0.0149, "step": 89880 }, { - "epoch": 0.97, - "learning_rate": 0.000154235584095479, - "loss": 0.0166, + "epoch": 0.45, + "learning_rate": 0.00023197400749706118, + "loss": 0.0162, "step": 89890 }, { - "epoch": 0.97, - "learning_rate": 0.0001542193682298761, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.00023196643980404717, + "loss": 0.0156, "step": 89900 }, { - "epoch": 0.97, - "learning_rate": 0.00015420315236427316, - "loss": 0.0153, + "epoch": 0.45, + "learning_rate": 0.00023195887211103315, + "loss": 0.0146, "step": 89910 }, { - "epoch": 0.97, - "learning_rate": 0.00015418693649867028, - "loss": 0.0114, + "epoch": 0.45, + "learning_rate": 0.00023195130441801916, + "loss": 0.0142, "step": 89920 }, { - "epoch": 0.97, - "learning_rate": 0.00015417072063306738, - "loss": 0.0157, + "epoch": 0.45, + "learning_rate": 0.00023194373672500514, + "loss": 0.0144, "step": 89930 }, { - "epoch": 0.97, - "learning_rate": 0.0001541545047674645, - "loss": 0.0136, + "epoch": 0.45, + "learning_rate": 0.00023193616903199112, + "loss": 0.0159, "step": 89940 }, { - "epoch": 0.97, - "learning_rate": 0.0001541382889018616, - "loss": 0.0128, + "epoch": 0.45, + "learning_rate": 0.00023192860133897713, + "loss": 0.0333, "step": 89950 }, { - "epoch": 0.97, - "learning_rate": 0.00015412207303625865, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.0002319210336459631, + "loss": 0.0643, "step": 89960 }, { - "epoch": 0.97, - "learning_rate": 0.00015410585717065575, - "loss": 0.0119, + "epoch": 0.45, + "learning_rate": 0.0002319134659529491, + "loss": 0.0249, "step": 89970 }, { - "epoch": 0.97, - "learning_rate": 0.00015408964130505287, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.0002319058982599351, + "loss": 0.0134, "step": 89980 }, { - "epoch": 0.97, - "learning_rate": 0.00015407342543944996, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023189833056692108, + "loss": 0.0211, "step": 89990 }, { - "epoch": 0.97, - "learning_rate": 0.00015405720957384702, - "loss": 0.0098, + "epoch": 0.45, + "learning_rate": 0.00023189076287390706, + "loss": 0.0173, "step": 90000 }, { - "epoch": 0.97, - "eval_cer": 0.9215616786273294, - "eval_loss": 0.009352602064609528, - "eval_runtime": 121.4051, - "eval_samples_per_second": 16.474, - "eval_steps_per_second": 4.118, + "epoch": 0.45, + "eval_cer": 0.9144983973907989, + "eval_loss": 0.0122450590133667, + "eval_runtime": 116.807, + "eval_samples_per_second": 17.122, + "eval_steps_per_second": 4.281, "step": 90000 }, { - "epoch": 0.97, - "learning_rate": 0.00015404099370824414, - "loss": 0.0143, + "epoch": 0.45, + "learning_rate": 0.00023188319518089304, + "loss": 0.0216, "step": 90010 }, { - "epoch": 0.97, - "learning_rate": 0.00015402477784264124, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023187562748787905, + "loss": 0.0186, "step": 90020 }, { - "epoch": 0.97, - "learning_rate": 0.00015400856197703833, - "loss": 0.0133, + "epoch": 0.45, + "learning_rate": 0.00023186805979486503, + "loss": 0.0161, "step": 90030 }, { - "epoch": 0.97, - "learning_rate": 0.0001539923461114354, - "loss": 0.0097, + "epoch": 0.45, + "learning_rate": 0.00023186049210185101, + "loss": 0.0171, "step": 90040 }, { - "epoch": 0.97, - "learning_rate": 0.00015397613024583252, - "loss": 0.0134, + "epoch": 0.45, + "learning_rate": 0.00023185292440883702, + "loss": 0.0156, "step": 90050 }, { - "epoch": 0.97, - "learning_rate": 0.0001539599143802296, - "loss": 0.0111, + "epoch": 0.45, + "learning_rate": 0.000231845356715823, + "loss": 0.019, "step": 90060 }, { - "epoch": 0.97, - "learning_rate": 0.0001539436985146267, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023183778902280899, + "loss": 0.0145, "step": 90070 }, { - "epoch": 0.97, - "learning_rate": 0.0001539274826490238, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.000231830221329795, + "loss": 0.0184, "step": 90080 }, { - "epoch": 0.97, - "learning_rate": 0.0001539112667834209, - "loss": 0.0151, + "epoch": 0.45, + "learning_rate": 0.00023182265363678098, + "loss": 0.0175, "step": 90090 }, { - "epoch": 0.97, - "learning_rate": 0.00015389505091781798, - "loss": 0.0095, + "epoch": 0.45, + "learning_rate": 0.00023181508594376696, + "loss": 0.0194, "step": 90100 }, { - "epoch": 0.97, - "learning_rate": 0.0001538788350522151, - "loss": 0.0147, + "epoch": 0.45, + "learning_rate": 0.00023180751825075297, + "loss": 0.0152, "step": 90110 }, { - "epoch": 0.97, - "learning_rate": 0.00015386261918661216, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.00023179995055773895, + "loss": 0.0167, "step": 90120 }, { - "epoch": 0.97, - "learning_rate": 0.00015384640332100926, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023179238286472493, + "loss": 0.0178, "step": 90130 }, { - "epoch": 0.97, - "learning_rate": 0.00015383018745540635, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023178481517171094, + "loss": 0.017, "step": 90140 }, { - "epoch": 0.97, - "learning_rate": 0.00015381397158980347, - "loss": 0.0129, + "epoch": 0.45, + "learning_rate": 0.00023177724747869692, + "loss": 0.0173, "step": 90150 }, { - "epoch": 0.97, - "learning_rate": 0.00015379775572420054, - "loss": 0.0136, + "epoch": 0.45, + "learning_rate": 0.0002317696797856829, + "loss": 0.0188, "step": 90160 }, { - "epoch": 0.97, - "learning_rate": 0.00015378153985859763, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023176211209266888, + "loss": 0.0174, "step": 90170 }, { - "epoch": 0.97, - "learning_rate": 0.00015376532399299475, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.0002317545443996549, + "loss": 0.0222, "step": 90180 }, { - "epoch": 0.97, - "learning_rate": 0.00015374910812739184, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.00023174697670664087, + "loss": 0.0157, "step": 90190 }, { - "epoch": 0.98, - "learning_rate": 0.0001537328922617889, - "loss": 0.0128, + "epoch": 0.46, + "learning_rate": 0.00023173940901362685, + "loss": 0.018, "step": 90200 }, { - "epoch": 0.98, - "learning_rate": 0.000153716676396186, - "loss": 0.014, + "epoch": 0.46, + "learning_rate": 0.00023173184132061286, + "loss": 0.0191, "step": 90210 }, { - "epoch": 0.98, - "learning_rate": 0.00015370046053058312, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023172427362759884, + "loss": 0.018, "step": 90220 }, { - "epoch": 0.98, - "learning_rate": 0.0001536842446649802, - "loss": 0.0143, + "epoch": 0.46, + "learning_rate": 0.00023171670593458482, + "loss": 0.0176, "step": 90230 }, { - "epoch": 0.98, - "learning_rate": 0.00015366802879937728, - "loss": 0.0162, + "epoch": 0.46, + "learning_rate": 0.00023170913824157083, + "loss": 0.0167, "step": 90240 }, { - "epoch": 0.98, - "learning_rate": 0.0001536518129337744, - "loss": 0.0122, + "epoch": 0.46, + "learning_rate": 0.00023170157054855681, + "loss": 0.0154, "step": 90250 }, { - "epoch": 0.98, - "learning_rate": 0.0001536355970681715, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.0002316940028555428, + "loss": 0.0155, "step": 90260 }, { - "epoch": 0.98, - "learning_rate": 0.00015361938120256858, - "loss": 0.0144, + "epoch": 0.46, + "learning_rate": 0.0002316864351625288, + "loss": 0.0184, "step": 90270 }, { - "epoch": 0.98, - "learning_rate": 0.00015360316533696565, - "loss": 0.0125, + "epoch": 0.46, + "learning_rate": 0.00023167886746951479, + "loss": 0.019, "step": 90280 }, { - "epoch": 0.98, - "learning_rate": 0.00015358694947136277, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023167129977650077, + "loss": 0.0158, "step": 90290 }, { - "epoch": 0.98, - "learning_rate": 0.00015357073360575986, - "loss": 0.0193, + "epoch": 0.46, + "learning_rate": 0.00023166373208348678, + "loss": 0.0136, "step": 90300 }, { - "epoch": 0.98, - "learning_rate": 0.00015355451774015698, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.00023165616439047276, + "loss": 0.0182, "step": 90310 }, { - "epoch": 0.98, - "learning_rate": 0.00015353830187455405, - "loss": 0.014, + "epoch": 0.46, + "learning_rate": 0.00023164859669745874, + "loss": 0.0154, "step": 90320 }, { - "epoch": 0.98, - "learning_rate": 0.00015352208600895114, - "loss": 0.0141, + "epoch": 0.46, + "learning_rate": 0.00023164102900444472, + "loss": 0.0161, "step": 90330 }, { - "epoch": 0.98, - "learning_rate": 0.00015350587014334823, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.00023163346131143073, + "loss": 0.0169, "step": 90340 }, { - "epoch": 0.98, - "learning_rate": 0.00015348965427774535, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.0002316258936184167, + "loss": 0.0159, "step": 90350 }, { - "epoch": 0.98, - "learning_rate": 0.00015347343841214242, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.0002316183259254027, + "loss": 0.0181, "step": 90360 }, { - "epoch": 0.98, - "learning_rate": 0.0001534572225465395, - "loss": 0.0145, + "epoch": 0.46, + "learning_rate": 0.0002316107582323887, + "loss": 0.0152, "step": 90370 }, { - "epoch": 0.98, - "learning_rate": 0.00015344100668093663, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023160319053937468, + "loss": 0.0189, "step": 90380 }, { - "epoch": 0.98, - "learning_rate": 0.00015342479081533372, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.00023159562284636066, + "loss": 0.018, "step": 90390 }, { - "epoch": 0.98, - "learning_rate": 0.0001534085749497308, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023158805515334667, + "loss": 0.0143, "step": 90400 }, { - "epoch": 0.98, - "learning_rate": 0.00015339235908412788, - "loss": 0.0157, + "epoch": 0.46, + "learning_rate": 0.00023158048746033265, + "loss": 0.0194, "step": 90410 }, { - "epoch": 0.98, - "learning_rate": 0.000153376143218525, - "loss": 0.013, + "epoch": 0.46, + "learning_rate": 0.00023157291976731863, + "loss": 0.0168, "step": 90420 }, { - "epoch": 0.98, - "learning_rate": 0.0001533599273529221, - "loss": 0.0167, + "epoch": 0.46, + "learning_rate": 0.00023156535207430464, + "loss": 0.0149, "step": 90430 }, { - "epoch": 0.98, - "learning_rate": 0.00015334371148731916, - "loss": 0.0146, + "epoch": 0.46, + "learning_rate": 0.00023155778438129062, + "loss": 0.0148, "step": 90440 }, { - "epoch": 0.98, - "learning_rate": 0.00015332749562171628, - "loss": 0.0128, + "epoch": 0.46, + "learning_rate": 0.0002315502166882766, + "loss": 0.0171, "step": 90450 }, { - "epoch": 0.98, - "learning_rate": 0.00015331127975611337, - "loss": 0.0111, + "epoch": 0.46, + "learning_rate": 0.00023154264899526261, + "loss": 0.0157, "step": 90460 }, { - "epoch": 0.98, - "learning_rate": 0.00015329506389051046, - "loss": 0.0163, + "epoch": 0.46, + "learning_rate": 0.0002315350813022486, + "loss": 0.0168, "step": 90470 }, { - "epoch": 0.98, - "learning_rate": 0.00015327884802490753, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023152751360923458, + "loss": 0.0157, "step": 90480 }, { - "epoch": 0.98, - "learning_rate": 0.00015326263215930465, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.00023151994591622059, + "loss": 0.0178, "step": 90490 }, { - "epoch": 0.98, - "learning_rate": 0.00015324641629370174, - "loss": 0.0139, + "epoch": 0.46, + "learning_rate": 0.00023151237822320657, + "loss": 0.013, "step": 90500 }, { - "epoch": 0.98, - "learning_rate": 0.00015323020042809884, - "loss": 0.0134, + "epoch": 0.46, + "learning_rate": 0.00023150481053019255, + "loss": 0.0145, "step": 90510 }, { - "epoch": 0.98, - "learning_rate": 0.00015321398456249593, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.00023149724283717853, + "loss": 0.0141, "step": 90520 }, { - "epoch": 0.98, - "learning_rate": 0.00015319776869689302, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.00023148967514416454, + "loss": 0.0154, "step": 90530 }, { - "epoch": 0.98, - "learning_rate": 0.00015318155283129011, - "loss": 0.0132, + "epoch": 0.46, + "learning_rate": 0.00023148210745115052, + "loss": 0.0154, "step": 90540 }, { - "epoch": 0.98, - "learning_rate": 0.00015316533696568723, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.0002314745397581365, + "loss": 0.0155, "step": 90550 }, { - "epoch": 0.98, - "learning_rate": 0.0001531491211000843, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.0002314669720651225, + "loss": 0.0163, "step": 90560 }, { - "epoch": 0.98, - "learning_rate": 0.0001531329052344814, - "loss": 0.0154, + "epoch": 0.46, + "learning_rate": 0.0002314594043721085, + "loss": 0.0189, "step": 90570 }, { - "epoch": 0.98, - "learning_rate": 0.00015311668936887849, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023145183667909447, + "loss": 0.014, "step": 90580 }, { - "epoch": 0.98, - "learning_rate": 0.0001531004735032756, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.00023144426898608048, + "loss": 0.0141, "step": 90590 }, { - "epoch": 0.98, - "learning_rate": 0.00015308425763767267, - "loss": 0.0154, + "epoch": 0.46, + "learning_rate": 0.00023143670129306646, + "loss": 0.0144, "step": 90600 }, { - "epoch": 0.98, - "learning_rate": 0.00015306804177206976, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023142913360005244, + "loss": 0.0135, "step": 90610 }, { - "epoch": 0.98, - "learning_rate": 0.00015305182590646688, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023142156590703845, + "loss": 0.0189, "step": 90620 }, { - "epoch": 0.98, - "learning_rate": 0.00015303561004086398, - "loss": 0.0103, + "epoch": 0.46, + "learning_rate": 0.00023141399821402443, + "loss": 0.0156, "step": 90630 }, { - "epoch": 0.98, - "learning_rate": 0.00015301939417526107, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023140643052101042, + "loss": 0.0198, "step": 90640 }, { - "epoch": 0.98, - "learning_rate": 0.00015300317830965813, - "loss": 0.0136, + "epoch": 0.46, + "learning_rate": 0.00023139886282799642, + "loss": 0.015, "step": 90650 }, { - "epoch": 0.98, - "learning_rate": 0.00015298696244405525, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.0002313912951349824, + "loss": 0.0173, "step": 90660 }, { - "epoch": 0.98, - "learning_rate": 0.00015297074657845235, - "loss": 0.0138, + "epoch": 0.46, + "learning_rate": 0.0002313837274419684, + "loss": 0.018, "step": 90670 }, { - "epoch": 0.98, - "learning_rate": 0.00015295453071284947, - "loss": 0.0153, + "epoch": 0.46, + "learning_rate": 0.00023137615974895437, + "loss": 0.0168, "step": 90680 }, { - "epoch": 0.98, - "learning_rate": 0.00015293831484724653, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.00023136859205594038, + "loss": 0.0194, "step": 90690 }, { - "epoch": 0.98, - "learning_rate": 0.00015292209898164363, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.00023136102436292636, + "loss": 0.018, "step": 90700 }, { - "epoch": 0.98, - "learning_rate": 0.00015290588311604072, - "loss": 0.0122, + "epoch": 0.46, + "learning_rate": 0.00023135345666991234, + "loss": 0.0119, "step": 90710 }, { - "epoch": 0.98, - "learning_rate": 0.00015288966725043784, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.00023134588897689835, + "loss": 0.0158, "step": 90720 }, { - "epoch": 0.98, - "learning_rate": 0.0001528734513848349, - "loss": 0.0109, + "epoch": 0.46, + "learning_rate": 0.00023133832128388433, + "loss": 0.015, "step": 90730 }, { - "epoch": 0.98, - "learning_rate": 0.000152857235519232, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.0002313307535908703, + "loss": 0.0161, "step": 90740 }, { - "epoch": 0.98, - "learning_rate": 0.00015284101965362912, - "loss": 0.0102, + "epoch": 0.46, + "learning_rate": 0.00023132318589785632, + "loss": 0.0151, "step": 90750 }, { - "epoch": 0.98, - "learning_rate": 0.0001528248037880262, - "loss": 0.0151, + "epoch": 0.46, + "learning_rate": 0.0002313156182048423, + "loss": 0.0207, "step": 90760 }, { - "epoch": 0.98, - "learning_rate": 0.00015280858792242327, - "loss": 0.0149, + "epoch": 0.46, + "learning_rate": 0.00023130805051182828, + "loss": 0.0183, "step": 90770 }, { - "epoch": 0.98, - "learning_rate": 0.00015279237205682037, - "loss": 0.0153, + "epoch": 0.46, + "learning_rate": 0.0002313004828188143, + "loss": 0.0148, "step": 90780 }, { - "epoch": 0.98, - "learning_rate": 0.0001527761561912175, - "loss": 0.0137, + "epoch": 0.46, + "learning_rate": 0.00023129291512580027, + "loss": 0.0157, "step": 90790 }, { - "epoch": 0.98, - "learning_rate": 0.00015275994032561458, - "loss": 0.0164, + "epoch": 0.46, + "learning_rate": 0.00023128534743278625, + "loss": 0.0169, "step": 90800 }, { - "epoch": 0.98, - "learning_rate": 0.00015274372446001165, - "loss": 0.0134, + "epoch": 0.46, + "learning_rate": 0.00023127777973977226, + "loss": 0.0172, "step": 90810 }, { - "epoch": 0.98, - "learning_rate": 0.00015272750859440877, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023127021204675824, + "loss": 0.0178, "step": 90820 }, { - "epoch": 0.98, - "learning_rate": 0.00015271129272880586, - "loss": 0.0094, + "epoch": 0.46, + "learning_rate": 0.00023126264435374423, + "loss": 0.0186, "step": 90830 }, { - "epoch": 0.98, - "learning_rate": 0.00015269507686320295, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.0002312550766607302, + "loss": 0.0152, "step": 90840 }, { - "epoch": 0.98, - "learning_rate": 0.00015267886099760002, - "loss": 0.0147, + "epoch": 0.46, + "learning_rate": 0.00023124750896771622, + "loss": 0.0134, "step": 90850 }, { - "epoch": 0.98, - "learning_rate": 0.00015266264513199714, - "loss": 0.0137, + "epoch": 0.46, + "learning_rate": 0.0002312399412747022, + "loss": 0.0157, "step": 90860 }, { - "epoch": 0.98, - "learning_rate": 0.00015264642926639423, - "loss": 0.0108, + "epoch": 0.46, + "learning_rate": 0.00023123237358168818, + "loss": 0.0211, "step": 90870 }, { - "epoch": 0.98, - "learning_rate": 0.00015263021340079132, - "loss": 0.0171, + "epoch": 0.46, + "learning_rate": 0.0002312248058886742, + "loss": 0.0192, "step": 90880 }, { - "epoch": 0.98, - "learning_rate": 0.00015261399753518841, - "loss": 0.0163, + "epoch": 0.46, + "learning_rate": 0.00023121723819566017, + "loss": 0.0149, "step": 90890 }, { - "epoch": 0.98, - "learning_rate": 0.0001525977816695855, - "loss": 0.0102, + "epoch": 0.46, + "learning_rate": 0.00023120967050264615, + "loss": 0.0156, "step": 90900 }, { - "epoch": 0.98, - "learning_rate": 0.0001525815658039826, - "loss": 0.0135, + "epoch": 0.46, + "learning_rate": 0.00023120210280963216, + "loss": 0.015, "step": 90910 }, { - "epoch": 0.98, - "learning_rate": 0.00015256534993837972, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.00023119453511661814, + "loss": 0.0175, "step": 90920 }, { - "epoch": 0.98, - "learning_rate": 0.00015254913407277679, - "loss": 0.0135, + "epoch": 0.46, + "learning_rate": 0.00023118696742360412, + "loss": 0.0149, "step": 90930 }, { - "epoch": 0.98, - "learning_rate": 0.00015253291820717388, - "loss": 0.0111, + "epoch": 0.46, + "learning_rate": 0.00023117939973059013, + "loss": 0.0145, "step": 90940 }, { - "epoch": 0.98, - "learning_rate": 0.00015251670234157097, - "loss": 0.0138, + "epoch": 0.46, + "learning_rate": 0.0002311718320375761, + "loss": 0.0163, "step": 90950 }, { - "epoch": 0.98, - "learning_rate": 0.0001525004864759681, - "loss": 0.0134, + "epoch": 0.46, + "learning_rate": 0.0002311642643445621, + "loss": 0.0163, "step": 90960 }, { - "epoch": 0.98, - "learning_rate": 0.00015248427061036516, - "loss": 0.014, + "epoch": 0.46, + "learning_rate": 0.0002311566966515481, + "loss": 0.0162, "step": 90970 }, { - "epoch": 0.98, - "learning_rate": 0.00015246805474476225, - "loss": 0.0103, + "epoch": 0.46, + "learning_rate": 0.00023114912895853408, + "loss": 0.0172, "step": 90980 }, { - "epoch": 0.98, - "learning_rate": 0.00015245183887915937, - "loss": 0.0149, + "epoch": 0.46, + "learning_rate": 0.00023114156126552006, + "loss": 0.0177, "step": 90990 }, { - "epoch": 0.98, - "learning_rate": 0.00015243562301355646, - "loss": 0.0137, + "epoch": 0.46, + "learning_rate": 0.00023113399357250607, + "loss": 0.0168, "step": 91000 }, { - "epoch": 0.98, - "eval_cer": 0.9215460437741146, - "eval_loss": 0.00892550777643919, - "eval_runtime": 121.1506, - "eval_samples_per_second": 16.508, - "eval_steps_per_second": 4.127, + "epoch": 0.46, + "eval_cer": 0.9145022789753005, + "eval_loss": 0.01197886560112238, + "eval_runtime": 116.7595, + "eval_samples_per_second": 17.129, + "eval_steps_per_second": 4.282, "step": 91000 }, { - "epoch": 0.98, - "learning_rate": 0.00015241940714795353, - "loss": 0.013, + "epoch": 0.46, + "learning_rate": 0.00023112642587949205, + "loss": 0.0226, "step": 91010 }, { - "epoch": 0.98, - "learning_rate": 0.00015240319128235065, - "loss": 0.0129, + "epoch": 0.46, + "learning_rate": 0.00023111885818647804, + "loss": 0.0155, "step": 91020 }, { - "epoch": 0.98, - "learning_rate": 0.00015238697541674774, - "loss": 0.0135, + "epoch": 0.46, + "learning_rate": 0.00023111129049346402, + "loss": 0.0138, "step": 91030 }, { - "epoch": 0.98, - "learning_rate": 0.00015237075955114483, - "loss": 0.0144, + "epoch": 0.46, + "learning_rate": 0.00023110372280045003, + "loss": 0.0222, "step": 91040 }, { - "epoch": 0.98, - "learning_rate": 0.0001523545436855419, - "loss": 0.016, + "epoch": 0.46, + "learning_rate": 0.000231096155107436, + "loss": 0.0136, "step": 91050 }, { - "epoch": 0.98, - "learning_rate": 0.00015233832781993902, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.000231088587414422, + "loss": 0.0187, "step": 91060 }, { - "epoch": 0.98, - "learning_rate": 0.0001523221119543361, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.000231081019721408, + "loss": 0.0162, "step": 91070 }, { - "epoch": 0.98, - "learning_rate": 0.0001523058960887332, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023107345202839398, + "loss": 0.0177, "step": 91080 }, { - "epoch": 0.98, - "learning_rate": 0.0001522896802231303, - "loss": 0.0137, + "epoch": 0.46, + "learning_rate": 0.00023106588433537996, + "loss": 0.0175, "step": 91090 }, { - "epoch": 0.98, - "learning_rate": 0.0001522734643575274, - "loss": 0.0095, + "epoch": 0.46, + "learning_rate": 0.00023105831664236597, + "loss": 0.0169, "step": 91100 }, { - "epoch": 0.98, - "learning_rate": 0.00015225724849192448, - "loss": 0.0108, + "epoch": 0.46, + "learning_rate": 0.00023105074894935195, + "loss": 0.0175, "step": 91110 }, { - "epoch": 0.99, - "learning_rate": 0.0001522410326263216, - "loss": 0.0134, + "epoch": 0.46, + "learning_rate": 0.00023104318125633793, + "loss": 0.0212, "step": 91120 }, { - "epoch": 0.99, - "learning_rate": 0.00015222481676071867, - "loss": 0.0108, + "epoch": 0.46, + "learning_rate": 0.00023103561356332389, + "loss": 0.0153, "step": 91130 }, { - "epoch": 0.99, - "learning_rate": 0.00015220860089511576, - "loss": 0.0139, + "epoch": 0.46, + "learning_rate": 0.0002310280458703099, + "loss": 0.0164, "step": 91140 }, { - "epoch": 0.99, - "learning_rate": 0.00015219238502951285, - "loss": 0.0111, + "epoch": 0.46, + "learning_rate": 0.00023102047817729588, + "loss": 0.0157, "step": 91150 }, { - "epoch": 0.99, - "learning_rate": 0.00015217616916390997, - "loss": 0.0103, + "epoch": 0.46, + "learning_rate": 0.00023101291048428186, + "loss": 0.014, "step": 91160 }, { - "epoch": 0.99, - "learning_rate": 0.00015215995329830704, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023100534279126787, + "loss": 0.0172, "step": 91170 }, { - "epoch": 0.99, - "learning_rate": 0.00015214373743270413, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.00023099777509825385, + "loss": 0.019, "step": 91180 }, { - "epoch": 0.99, - "learning_rate": 0.00015212752156710125, - "loss": 0.0154, + "epoch": 0.46, + "learning_rate": 0.00023099020740523983, + "loss": 0.0171, "step": 91190 }, { - "epoch": 0.99, - "learning_rate": 0.00015211130570149834, - "loss": 0.015, + "epoch": 0.46, + "learning_rate": 0.00023098263971222584, + "loss": 0.0161, "step": 91200 }, { - "epoch": 0.99, - "learning_rate": 0.0001520950898358954, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.00023097507201921182, + "loss": 0.0221, "step": 91210 }, { - "epoch": 0.99, - "learning_rate": 0.0001520788739702925, - "loss": 0.0101, + "epoch": 0.46, + "learning_rate": 0.0002309675043261978, + "loss": 0.0144, "step": 91220 }, { - "epoch": 0.99, - "learning_rate": 0.00015206265810468962, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.00023095993663318378, + "loss": 0.0129, "step": 91230 }, { - "epoch": 0.99, - "learning_rate": 0.00015204644223908671, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.0002309523689401698, + "loss": 0.0206, "step": 91240 }, { - "epoch": 0.99, - "learning_rate": 0.00015203022637348378, - "loss": 0.0142, + "epoch": 0.46, + "learning_rate": 0.00023094480124715577, + "loss": 0.0123, "step": 91250 }, { - "epoch": 0.99, - "learning_rate": 0.0001520140105078809, - "loss": 0.0132, + "epoch": 0.46, + "learning_rate": 0.00023093723355414175, + "loss": 0.0149, "step": 91260 }, { - "epoch": 0.99, - "learning_rate": 0.000151997794642278, - "loss": 0.0101, + "epoch": 0.46, + "learning_rate": 0.00023092966586112776, + "loss": 0.0188, "step": 91270 }, { - "epoch": 0.99, - "learning_rate": 0.00015198157877667509, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.00023092209816811374, + "loss": 0.0197, "step": 91280 }, { - "epoch": 0.99, - "learning_rate": 0.00015196536291107215, - "loss": 0.0148, + "epoch": 0.46, + "learning_rate": 0.00023091453047509972, + "loss": 0.0165, "step": 91290 }, { - "epoch": 0.99, - "learning_rate": 0.00015194914704546927, - "loss": 0.0127, + "epoch": 0.46, + "learning_rate": 0.00023090696278208573, + "loss": 0.0179, "step": 91300 }, { - "epoch": 0.99, - "learning_rate": 0.00015193293117986636, - "loss": 0.0143, + "epoch": 0.46, + "learning_rate": 0.00023089939508907171, + "loss": 0.0194, "step": 91310 }, { - "epoch": 0.99, - "learning_rate": 0.00015191671531426348, - "loss": 0.0157, + "epoch": 0.46, + "learning_rate": 0.0002308918273960577, + "loss": 0.022, "step": 91320 }, { - "epoch": 0.99, - "learning_rate": 0.00015190049944866055, - "loss": 0.0095, + "epoch": 0.46, + "learning_rate": 0.0002308842597030437, + "loss": 0.0215, "step": 91330 }, { - "epoch": 0.99, - "learning_rate": 0.00015188428358305764, - "loss": 0.0142, + "epoch": 0.46, + "learning_rate": 0.00023087669201002969, + "loss": 0.0174, "step": 91340 }, { - "epoch": 0.99, - "learning_rate": 0.00015186806771745473, - "loss": 0.0165, + "epoch": 0.46, + "learning_rate": 0.00023086912431701567, + "loss": 0.0195, "step": 91350 }, { - "epoch": 0.99, - "learning_rate": 0.00015185185185185185, - "loss": 0.0163, + "epoch": 0.46, + "learning_rate": 0.00023086155662400168, + "loss": 0.0159, "step": 91360 }, { - "epoch": 0.99, - "learning_rate": 0.00015183563598624895, - "loss": 0.0127, + "epoch": 0.46, + "learning_rate": 0.00023085398893098766, + "loss": 0.018, "step": 91370 }, { - "epoch": 0.99, - "learning_rate": 0.000151819420120646, - "loss": 0.0138, + "epoch": 0.46, + "learning_rate": 0.00023084642123797364, + "loss": 0.0177, "step": 91380 }, { - "epoch": 0.99, - "learning_rate": 0.00015180320425504313, - "loss": 0.0135, + "epoch": 0.46, + "learning_rate": 0.00023083885354495965, + "loss": 0.0251, "step": 91390 }, { - "epoch": 0.99, - "learning_rate": 0.00015178698838944023, - "loss": 0.015, + "epoch": 0.46, + "learning_rate": 0.00023083128585194563, + "loss": 0.0181, "step": 91400 }, { - "epoch": 0.99, - "learning_rate": 0.00015177077252383732, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.0002308237181589316, + "loss": 0.022, "step": 91410 }, { - "epoch": 0.99, - "learning_rate": 0.00015175455665823438, - "loss": 0.0104, + "epoch": 0.46, + "learning_rate": 0.0002308161504659176, + "loss": 0.0176, "step": 91420 }, { - "epoch": 0.99, - "learning_rate": 0.0001517383407926315, - "loss": 0.013, + "epoch": 0.46, + "learning_rate": 0.0002308085827729036, + "loss": 0.0198, "step": 91430 }, { - "epoch": 0.99, - "learning_rate": 0.0001517221249270286, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.00023080101507988958, + "loss": 0.0189, "step": 91440 }, { - "epoch": 0.99, - "learning_rate": 0.0001517059090614257, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023079344738687556, + "loss": 0.0196, "step": 91450 }, { - "epoch": 0.99, - "learning_rate": 0.00015168969319582278, - "loss": 0.0103, + "epoch": 0.46, + "learning_rate": 0.00023078587969386157, + "loss": 0.0166, "step": 91460 }, { - "epoch": 0.99, - "learning_rate": 0.00015167347733021987, - "loss": 0.0095, + "epoch": 0.46, + "learning_rate": 0.00023077831200084755, + "loss": 0.0208, "step": 91470 }, { - "epoch": 0.99, - "learning_rate": 0.00015165726146461697, - "loss": 0.0156, + "epoch": 0.46, + "learning_rate": 0.00023077074430783353, + "loss": 0.0145, "step": 91480 }, { - "epoch": 0.99, - "learning_rate": 0.0001516410455990141, - "loss": 0.0134, + "epoch": 0.46, + "learning_rate": 0.00023076317661481954, + "loss": 0.0164, "step": 91490 }, { - "epoch": 0.99, - "learning_rate": 0.00015162482973341115, - "loss": 0.0108, + "epoch": 0.46, + "learning_rate": 0.00023075560892180552, + "loss": 0.0163, "step": 91500 }, { - "epoch": 0.99, - "learning_rate": 0.00015160861386780825, - "loss": 0.0148, + "epoch": 0.46, + "learning_rate": 0.0002307480412287915, + "loss": 0.0186, "step": 91510 }, { - "epoch": 0.99, - "learning_rate": 0.00015159239800220534, - "loss": 0.01, + "epoch": 0.46, + "learning_rate": 0.00023074047353577751, + "loss": 0.0174, "step": 91520 }, { - "epoch": 0.99, - "learning_rate": 0.00015157618213660246, - "loss": 0.0111, + "epoch": 0.46, + "learning_rate": 0.0002307329058427635, + "loss": 0.0138, "step": 91530 }, { - "epoch": 0.99, - "learning_rate": 0.00015155996627099952, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.00023072533814974948, + "loss": 0.0204, "step": 91540 }, { - "epoch": 0.99, - "learning_rate": 0.00015154375040539662, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.00023071777045673549, + "loss": 0.0159, "step": 91550 }, { - "epoch": 0.99, - "learning_rate": 0.00015152753453979374, - "loss": 0.015, + "epoch": 0.46, + "learning_rate": 0.00023071020276372147, + "loss": 0.0135, "step": 91560 }, { - "epoch": 0.99, - "learning_rate": 0.00015151131867419083, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023070263507070745, + "loss": 0.017, "step": 91570 }, { - "epoch": 0.99, - "learning_rate": 0.0001514951028085879, - "loss": 0.0132, + "epoch": 0.46, + "learning_rate": 0.00023069506737769343, + "loss": 0.0158, "step": 91580 }, { - "epoch": 0.99, - "learning_rate": 0.000151478886942985, - "loss": 0.0146, + "epoch": 0.46, + "learning_rate": 0.00023068749968467944, + "loss": 0.0174, "step": 91590 }, { - "epoch": 0.99, - "learning_rate": 0.0001514626710773821, - "loss": 0.0133, + "epoch": 0.46, + "learning_rate": 0.00023067993199166542, + "loss": 0.0161, "step": 91600 }, { - "epoch": 0.99, - "learning_rate": 0.0001514464552117792, - "loss": 0.0137, + "epoch": 0.46, + "learning_rate": 0.0002306723642986514, + "loss": 0.0202, "step": 91610 }, { - "epoch": 0.99, - "learning_rate": 0.00015143023934617627, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.0002306647966056374, + "loss": 0.0194, "step": 91620 }, { - "epoch": 0.99, - "learning_rate": 0.00015141402348057339, - "loss": 0.0106, + "epoch": 0.46, + "learning_rate": 0.0002306572289126234, + "loss": 0.0195, "step": 91630 }, { - "epoch": 0.99, - "learning_rate": 0.00015139780761497048, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.00023064966121960937, + "loss": 0.0178, "step": 91640 }, { - "epoch": 0.99, - "learning_rate": 0.00015138159174936757, - "loss": 0.0144, + "epoch": 0.46, + "learning_rate": 0.00023064209352659538, + "loss": 0.0173, "step": 91650 }, { - "epoch": 0.99, - "learning_rate": 0.00015136537588376464, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023063452583358136, + "loss": 0.015, "step": 91660 }, { - "epoch": 0.99, - "learning_rate": 0.00015134916001816176, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.00023062695814056734, + "loss": 0.0153, "step": 91670 }, { - "epoch": 0.99, - "learning_rate": 0.00015133294415255885, - "loss": 0.0149, + "epoch": 0.46, + "learning_rate": 0.00023061939044755335, + "loss": 0.0176, "step": 91680 }, { - "epoch": 0.99, - "learning_rate": 0.00015131672828695597, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023061182275453933, + "loss": 0.0178, "step": 91690 }, { - "epoch": 0.99, - "learning_rate": 0.00015130051242135303, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.00023060425506152532, + "loss": 0.0181, "step": 91700 }, { - "epoch": 0.99, - "learning_rate": 0.00015128429655575013, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023059668736851132, + "loss": 0.0195, "step": 91710 }, { - "epoch": 0.99, - "learning_rate": 0.00015126808069014722, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.0002305891196754973, + "loss": 0.0171, "step": 91720 }, { - "epoch": 0.99, - "learning_rate": 0.00015125186482454434, - "loss": 0.0101, + "epoch": 0.46, + "learning_rate": 0.0002305815519824833, + "loss": 0.0165, "step": 91730 }, { - "epoch": 0.99, - "learning_rate": 0.0001512356489589414, - "loss": 0.013, + "epoch": 0.46, + "learning_rate": 0.00023057398428946927, + "loss": 0.0174, "step": 91740 }, { - "epoch": 0.99, - "learning_rate": 0.0001512194330933385, - "loss": 0.0153, + "epoch": 0.46, + "learning_rate": 0.00023056641659645528, + "loss": 0.0175, "step": 91750 }, { - "epoch": 0.99, - "learning_rate": 0.00015120321722773562, - "loss": 0.0096, + "epoch": 0.46, + "learning_rate": 0.00023055884890344126, + "loss": 0.0185, "step": 91760 }, { - "epoch": 0.99, - "learning_rate": 0.0001511870013621327, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.00023055128121042724, + "loss": 0.0184, "step": 91770 }, { - "epoch": 0.99, - "learning_rate": 0.00015117078549652978, - "loss": 0.0128, + "epoch": 0.46, + "learning_rate": 0.00023054371351741325, + "loss": 0.0161, "step": 91780 }, { - "epoch": 0.99, - "learning_rate": 0.00015115456963092687, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.00023053614582439923, + "loss": 0.0184, "step": 91790 }, { - "epoch": 0.99, - "learning_rate": 0.000151138353765324, - "loss": 0.0125, + "epoch": 0.46, + "learning_rate": 0.0002305285781313852, + "loss": 0.016, "step": 91800 }, { - "epoch": 0.99, - "learning_rate": 0.00015112213789972108, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.00023052101043837122, + "loss": 0.0141, "step": 91810 }, { - "epoch": 0.99, - "learning_rate": 0.00015110592203411815, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.0002305134427453572, + "loss": 0.02, "step": 91820 }, { - "epoch": 0.99, - "learning_rate": 0.00015108970616851527, - "loss": 0.0109, + "epoch": 0.46, + "learning_rate": 0.00023050587505234318, + "loss": 0.0146, "step": 91830 }, { - "epoch": 0.99, - "learning_rate": 0.00015107349030291236, - "loss": 0.0095, + "epoch": 0.46, + "learning_rate": 0.0002304983073593292, + "loss": 0.0144, "step": 91840 }, { - "epoch": 0.99, - "learning_rate": 0.00015105727443730945, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.00023049073966631517, + "loss": 0.0144, "step": 91850 }, { - "epoch": 0.99, - "learning_rate": 0.00015104105857170652, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023048317197330115, + "loss": 0.0142, "step": 91860 }, { - "epoch": 0.99, - "learning_rate": 0.00015102484270610364, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023047560428028716, + "loss": 0.0161, "step": 91870 }, { - "epoch": 0.99, - "learning_rate": 0.00015100862684050073, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023046803658727314, + "loss": 0.0133, "step": 91880 }, { - "epoch": 0.99, - "learning_rate": 0.00015099241097489782, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.00023046046889425913, + "loss": 0.0168, "step": 91890 }, { - "epoch": 0.99, - "learning_rate": 0.00015097619510929492, - "loss": 0.0138, + "epoch": 0.46, + "learning_rate": 0.00023045290120124513, + "loss": 0.0171, "step": 91900 }, { - "epoch": 0.99, - "learning_rate": 0.000150959979243692, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023044533350823112, + "loss": 0.0262, "step": 91910 }, { - "epoch": 0.99, - "learning_rate": 0.0001509437633780891, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.0002304377658152171, + "loss": 0.0167, "step": 91920 }, { - "epoch": 0.99, - "learning_rate": 0.00015092754751248622, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023043019812220308, + "loss": 0.0148, "step": 91930 }, { - "epoch": 0.99, - "learning_rate": 0.0001509113316468833, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.0002304226304291891, + "loss": 0.0152, "step": 91940 }, { - "epoch": 0.99, - "learning_rate": 0.00015089511578128038, - "loss": 0.0122, + "epoch": 0.46, + "learning_rate": 0.00023041506273617507, + "loss": 0.0187, "step": 91950 }, { - "epoch": 0.99, - "learning_rate": 0.00015087889991567747, - "loss": 0.015, + "epoch": 0.46, + "learning_rate": 0.00023040749504316105, + "loss": 0.0157, "step": 91960 }, { - "epoch": 0.99, - "learning_rate": 0.0001508626840500746, - "loss": 0.0154, + "epoch": 0.46, + "learning_rate": 0.00023039992735014706, + "loss": 0.0129, "step": 91970 }, { - "epoch": 0.99, - "learning_rate": 0.00015084646818447166, - "loss": 0.0149, + "epoch": 0.46, + "learning_rate": 0.00023039235965713304, + "loss": 0.0174, "step": 91980 }, { - "epoch": 0.99, - "learning_rate": 0.00015083025231886875, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023038479196411902, + "loss": 0.016, "step": 91990 }, { - "epoch": 0.99, - "learning_rate": 0.00015081403645326587, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.00023037722427110503, + "loss": 0.017, "step": 92000 }, { - "epoch": 0.99, - "eval_cer": 0.9215434379652454, - "eval_loss": 0.009060974232852459, - "eval_runtime": 121.4309, - "eval_samples_per_second": 16.47, - "eval_steps_per_second": 4.118, + "epoch": 0.46, + "eval_cer": 0.9144974269946735, + "eval_loss": 0.011690773069858551, + "eval_runtime": 116.7969, + "eval_samples_per_second": 17.124, + "eval_steps_per_second": 4.281, "step": 92000 }, { - "epoch": 0.99, - "learning_rate": 0.00015079782058766296, - "loss": 0.0132, + "epoch": 0.46, + "learning_rate": 0.000230369656578091, + "loss": 0.0172, "step": 92010 }, { - "epoch": 0.99, - "learning_rate": 0.00015078160472206003, - "loss": 0.016, + "epoch": 0.46, + "learning_rate": 0.000230362088885077, + "loss": 0.0176, "step": 92020 }, { - "epoch": 0.99, - "learning_rate": 0.00015076538885645715, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.000230354521192063, + "loss": 0.0148, "step": 92030 }, { - "epoch": 0.99, - "learning_rate": 0.00015074917299085424, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.00023034695349904898, + "loss": 0.0254, "step": 92040 }, { - "epoch": 1.0, - "learning_rate": 0.00015073295712525134, - "loss": 0.0125, + "epoch": 0.46, + "learning_rate": 0.00023033938580603496, + "loss": 0.0176, "step": 92050 }, { - "epoch": 1.0, - "learning_rate": 0.0001507167412596484, - "loss": 0.013, + "epoch": 0.46, + "learning_rate": 0.00023033181811302097, + "loss": 0.0218, "step": 92060 }, { - "epoch": 1.0, - "learning_rate": 0.00015070052539404552, - "loss": 0.0111, + "epoch": 0.46, + "learning_rate": 0.00023032425042000695, + "loss": 0.0184, "step": 92070 }, { - "epoch": 1.0, - "learning_rate": 0.0001506843095284426, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023031668272699294, + "loss": 0.0171, "step": 92080 }, { - "epoch": 1.0, - "learning_rate": 0.0001506680936628397, - "loss": 0.0132, + "epoch": 0.46, + "learning_rate": 0.00023030911503397892, + "loss": 0.0169, "step": 92090 }, { - "epoch": 1.0, - "learning_rate": 0.00015065187779723683, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023030154734096493, + "loss": 0.0164, "step": 92100 }, { - "epoch": 1.0, - "learning_rate": 0.0001506356619316339, - "loss": 0.0158, + "epoch": 0.46, + "learning_rate": 0.0002302939796479509, + "loss": 0.0177, "step": 92110 }, { - "epoch": 1.0, - "learning_rate": 0.00015061944606603098, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.0002302864119549369, + "loss": 0.0184, "step": 92120 }, { - "epoch": 1.0, - "learning_rate": 0.0001506032302004281, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.0002302788442619229, + "loss": 0.019, "step": 92130 }, { - "epoch": 1.0, - "learning_rate": 0.0001505870143348252, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.00023027127656890888, + "loss": 0.0174, "step": 92140 }, { - "epoch": 1.0, - "learning_rate": 0.00015057079846922226, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023026370887589486, + "loss": 0.0162, "step": 92150 }, { - "epoch": 1.0, - "learning_rate": 0.00015055458260361936, - "loss": 0.0145, + "epoch": 0.46, + "learning_rate": 0.00023025614118288087, + "loss": 0.0189, "step": 92160 }, { - "epoch": 1.0, - "learning_rate": 0.00015053836673801648, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00023024857348986685, + "loss": 0.0166, "step": 92170 }, { - "epoch": 1.0, - "learning_rate": 0.00015052215087241357, - "loss": 0.013, + "epoch": 0.47, + "learning_rate": 0.00023024100579685283, + "loss": 0.0175, "step": 92180 }, { - "epoch": 1.0, - "learning_rate": 0.00015050593500681063, - "loss": 0.0159, + "epoch": 0.47, + "learning_rate": 0.00023023343810383884, + "loss": 0.0141, "step": 92190 }, { - "epoch": 1.0, - "learning_rate": 0.00015048971914120775, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00023022587041082482, + "loss": 0.0188, "step": 92200 }, { - "epoch": 1.0, - "learning_rate": 0.00015047350327560485, - "loss": 0.0131, + "epoch": 0.47, + "learning_rate": 0.0002302183027178108, + "loss": 0.0153, "step": 92210 }, { - "epoch": 1.0, - "learning_rate": 0.00015045728741000194, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.0002302107350247968, + "loss": 0.0183, "step": 92220 }, { - "epoch": 1.0, - "learning_rate": 0.000150441071544399, - "loss": 0.0161, + "epoch": 0.47, + "learning_rate": 0.0002302031673317828, + "loss": 0.0149, "step": 92230 }, { - "epoch": 1.0, - "learning_rate": 0.00015042485567879612, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.00023019559963876877, + "loss": 0.0169, "step": 92240 }, { - "epoch": 1.0, - "learning_rate": 0.00015040863981319322, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.00023018803194575476, + "loss": 0.015, "step": 92250 }, { - "epoch": 1.0, - "learning_rate": 0.00015039242394759034, - "loss": 0.0143, + "epoch": 0.47, + "learning_rate": 0.00023018046425274076, + "loss": 0.0173, "step": 92260 }, { - "epoch": 1.0, - "learning_rate": 0.0001503762080819874, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.00023017289655972675, + "loss": 0.0177, "step": 92270 }, { - "epoch": 1.0, - "learning_rate": 0.0001503599922163845, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00023016532886671273, + "loss": 0.0205, "step": 92280 }, { - "epoch": 1.0, - "learning_rate": 0.0001503437763507816, - "loss": 0.0115, + "epoch": 0.47, + "learning_rate": 0.00023015776117369874, + "loss": 0.0171, "step": 92290 }, { - "epoch": 1.0, - "learning_rate": 0.0001503275604851787, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00023015019348068472, + "loss": 0.0143, "step": 92300 }, { - "epoch": 1.0, - "learning_rate": 0.00015031134461957577, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.0002301426257876707, + "loss": 0.0174, "step": 92310 }, { - "epoch": 1.0, - "learning_rate": 0.00015029512875397287, - "loss": 0.0131, + "epoch": 0.47, + "learning_rate": 0.0002301350580946567, + "loss": 0.0189, "step": 92320 }, { - "epoch": 1.0, - "learning_rate": 0.00015027891288836999, - "loss": 0.0136, + "epoch": 0.47, + "learning_rate": 0.0002301274904016427, + "loss": 0.015, "step": 92330 }, { - "epoch": 1.0, - "learning_rate": 0.00015026269702276708, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.00023011992270862867, + "loss": 0.0153, "step": 92340 }, { - "epoch": 1.0, - "learning_rate": 0.00015024648115716414, - "loss": 0.0139, + "epoch": 0.47, + "learning_rate": 0.00023011235501561468, + "loss": 0.0169, "step": 92350 }, { - "epoch": 1.0, - "learning_rate": 0.00015023026529156124, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00023010478732260066, + "loss": 0.0132, "step": 92360 }, { - "epoch": 1.0, - "learning_rate": 0.00015021404942595836, - "loss": 0.0121, + "epoch": 0.47, + "learning_rate": 0.00023009721962958664, + "loss": 0.0149, "step": 92370 }, { - "epoch": 1.0, - "learning_rate": 0.00015019783356035545, - "loss": 0.0135, + "epoch": 0.47, + "learning_rate": 0.00023008965193657265, + "loss": 0.0155, "step": 92380 }, { - "epoch": 1.0, - "learning_rate": 0.00015018161769475252, - "loss": 0.0128, + "epoch": 0.47, + "learning_rate": 0.0002300820842435586, + "loss": 0.0161, "step": 92390 }, { - "epoch": 1.0, - "learning_rate": 0.00015016540182914964, - "loss": 0.0155, + "epoch": 0.47, + "learning_rate": 0.0002300745165505446, + "loss": 0.0195, "step": 92400 }, { - "epoch": 1.0, - "learning_rate": 0.00015014918596354673, - "loss": 0.0139, + "epoch": 0.47, + "learning_rate": 0.00023006694885753057, + "loss": 0.0183, "step": 92410 }, { - "epoch": 1.0, - "learning_rate": 0.00015013297009794382, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00023005938116451658, + "loss": 0.0182, "step": 92420 }, { - "epoch": 1.0, - "learning_rate": 0.0001501167542323409, - "loss": 0.0156, + "epoch": 0.47, + "learning_rate": 0.00023005181347150256, + "loss": 0.0189, "step": 92430 }, { - "epoch": 1.0, - "learning_rate": 0.000150100538366738, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00023004424577848854, + "loss": 0.0171, "step": 92440 }, { - "epoch": 1.0, - "learning_rate": 0.0001500843225011351, - "loss": 0.0094, + "epoch": 0.47, + "learning_rate": 0.00023003667808547455, + "loss": 0.0221, "step": 92450 }, { - "epoch": 1.0, - "learning_rate": 0.0001500681066355322, - "loss": 0.0136, + "epoch": 0.47, + "learning_rate": 0.00023002911039246053, + "loss": 0.0119, "step": 92460 }, { - "epoch": 1.0, - "learning_rate": 0.00015005189076992928, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.0002300215426994465, + "loss": 0.0139, "step": 92470 }, { - "epoch": 1.0, - "learning_rate": 0.00015003567490432638, - "loss": 0.0134, + "epoch": 0.47, + "learning_rate": 0.0002300139750064325, + "loss": 0.0143, "step": 92480 }, { - "epoch": 1.0, - "learning_rate": 0.00015001945903872347, - "loss": 0.0093, + "epoch": 0.47, + "learning_rate": 0.0002300064073134185, + "loss": 0.0151, "step": 92490 }, { - "epoch": 1.0, - "learning_rate": 0.0001500032431731206, - "loss": 0.0096, + "epoch": 0.47, + "learning_rate": 0.00022999883962040448, + "loss": 0.0174, "step": 92500 }, { - "epoch": 1.0, - "learning_rate": 0.00014998702730751766, - "loss": 0.0093, + "epoch": 0.47, + "learning_rate": 0.00022999127192739046, + "loss": 0.0144, "step": 92510 }, { - "epoch": 1.0, - "learning_rate": 0.00014997081144191475, - "loss": 0.0138, + "epoch": 0.47, + "learning_rate": 0.00022998370423437647, + "loss": 0.0209, "step": 92520 }, { - "epoch": 1.0, - "learning_rate": 0.00014995459557631184, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022997613654136245, + "loss": 0.0164, "step": 92530 }, { - "epoch": 1.0, - "learning_rate": 0.00014993837971070893, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.00022996856884834844, + "loss": 0.0165, "step": 92540 }, { - "epoch": 1.0, - "learning_rate": 0.00014992216384510605, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.00022996100115533444, + "loss": 0.0144, "step": 92550 }, { - "epoch": 1.0, - "learning_rate": 0.00014990594797950312, - "loss": 0.0131, + "epoch": 0.47, + "learning_rate": 0.00022995343346232043, + "loss": 0.0168, "step": 92560 }, { - "epoch": 1.0, - "learning_rate": 0.00014988973211390024, - "loss": 0.0128, + "epoch": 0.47, + "learning_rate": 0.0002299458657693064, + "loss": 0.0142, "step": 92570 }, { - "epoch": 1.0, - "learning_rate": 0.0001498735162482973, - "loss": 0.0092, + "epoch": 0.47, + "learning_rate": 0.00022993829807629242, + "loss": 0.0194, "step": 92580 }, { - "epoch": 1.0, - "learning_rate": 0.00014985730038269442, - "loss": 0.0139, + "epoch": 0.47, + "learning_rate": 0.0002299307303832784, + "loss": 0.0141, "step": 92590 }, { - "epoch": 1.0, - "learning_rate": 0.0001498410845170915, - "loss": 0.0088, + "epoch": 0.47, + "learning_rate": 0.00022992316269026438, + "loss": 0.0159, "step": 92600 }, { - "epoch": 1.0, - "learning_rate": 0.0001498248686514886, - "loss": 0.0101, + "epoch": 0.47, + "learning_rate": 0.0002299155949972504, + "loss": 0.0163, "step": 92610 }, { - "epoch": 1.0, - "learning_rate": 0.0001498086527858857, - "loss": 0.0138, + "epoch": 0.47, + "learning_rate": 0.00022990802730423637, + "loss": 0.0131, "step": 92620 }, { - "epoch": 1.0, - "learning_rate": 0.0001497924369202828, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.00022990045961122235, + "loss": 0.0157, "step": 92630 }, { - "epoch": 1.0, - "learning_rate": 0.0001497762210546799, - "loss": 0.014, + "epoch": 0.47, + "learning_rate": 0.00022989289191820833, + "loss": 0.0124, "step": 92640 }, { - "epoch": 1.0, - "learning_rate": 0.00014976000518907698, - "loss": 0.0089, + "epoch": 0.47, + "learning_rate": 0.00022988532422519434, + "loss": 0.0141, "step": 92650 }, { - "epoch": 1.0, - "learning_rate": 0.00014974378932347407, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.00022987775653218032, + "loss": 0.0173, "step": 92660 }, { - "epoch": 1.0, - "learning_rate": 0.00014972757345787117, - "loss": 0.0092, + "epoch": 0.47, + "learning_rate": 0.0002298701888391663, + "loss": 0.0133, "step": 92670 }, { - "epoch": 1.0, - "learning_rate": 0.00014971135759226826, - "loss": 0.0125, + "epoch": 0.47, + "learning_rate": 0.0002298626211461523, + "loss": 0.0157, "step": 92680 }, { - "epoch": 1.0, - "learning_rate": 0.00014969514172666535, - "loss": 0.0099, + "epoch": 0.47, + "learning_rate": 0.0002298550534531383, + "loss": 0.0207, "step": 92690 }, { - "epoch": 1.0, - "learning_rate": 0.00014967892586106244, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.00022984748576012427, + "loss": 0.0155, "step": 92700 }, { - "epoch": 1.0, - "learning_rate": 0.00014966270999545954, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00022983991806711028, + "loss": 0.0129, "step": 92710 }, { - "epoch": 1.0, - "learning_rate": 0.00014964649412985663, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00022983235037409626, + "loss": 0.0137, "step": 92720 }, { - "epoch": 1.0, - "learning_rate": 0.00014963027826425372, - "loss": 0.0077, + "epoch": 0.47, + "learning_rate": 0.00022982478268108225, + "loss": 0.0151, "step": 92730 }, { - "epoch": 1.0, - "learning_rate": 0.00014961406239865082, - "loss": 0.0095, + "epoch": 0.47, + "learning_rate": 0.00022981721498806825, + "loss": 0.0135, "step": 92740 }, { - "epoch": 1.0, - "learning_rate": 0.0001495978465330479, - "loss": 0.0125, + "epoch": 0.47, + "learning_rate": 0.00022980964729505424, + "loss": 0.0148, "step": 92750 }, { - "epoch": 1.0, - "learning_rate": 0.000149581630667445, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.00022980207960204022, + "loss": 0.0153, "step": 92760 }, { - "epoch": 1.0, - "learning_rate": 0.00014956541480184212, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00022979451190902623, + "loss": 0.0157, "step": 92770 }, { - "epoch": 1.0, - "learning_rate": 0.0001495491989362392, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.0002297869442160122, + "loss": 0.0168, "step": 92780 }, { - "epoch": 1.0, - "learning_rate": 0.0001495329830706363, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.0002297793765229982, + "loss": 0.0166, "step": 92790 }, { - "epoch": 1.0, - "learning_rate": 0.0001495167672050334, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.0002297718088299842, + "loss": 0.017, "step": 92800 }, { - "epoch": 1.0, - "learning_rate": 0.0001495005513394305, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.00022976424113697018, + "loss": 0.0166, "step": 92810 }, { - "epoch": 1.0, - "learning_rate": 0.00014948433547382758, - "loss": 0.0096, + "epoch": 0.47, + "learning_rate": 0.00022975667344395616, + "loss": 0.0172, "step": 92820 }, { - "epoch": 1.0, - "learning_rate": 0.00014946811960822468, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.00022974910575094214, + "loss": 0.0156, "step": 92830 }, { - "epoch": 1.0, - "learning_rate": 0.00014945190374262177, - "loss": 0.0086, + "epoch": 0.47, + "learning_rate": 0.00022974153805792815, + "loss": 0.0179, "step": 92840 }, { - "epoch": 1.0, - "learning_rate": 0.00014943568787701886, - "loss": 0.0094, + "epoch": 0.47, + "learning_rate": 0.00022973397036491413, + "loss": 0.0188, "step": 92850 }, { - "epoch": 1.0, - "learning_rate": 0.00014941947201141596, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.0002297264026719001, + "loss": 0.0185, "step": 92860 }, { - "epoch": 1.0, - "learning_rate": 0.00014940325614581305, - "loss": 0.0128, + "epoch": 0.47, + "learning_rate": 0.00022971883497888612, + "loss": 0.0144, "step": 92870 }, { - "epoch": 1.0, - "learning_rate": 0.00014938704028021014, - "loss": 0.013, + "epoch": 0.47, + "learning_rate": 0.0002297112672858721, + "loss": 0.0166, "step": 92880 }, { - "epoch": 1.0, - "learning_rate": 0.00014937082441460723, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00022970369959285808, + "loss": 0.0168, "step": 92890 }, { - "epoch": 1.0, - "learning_rate": 0.00014935460854900433, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.0002296961318998441, + "loss": 0.0174, "step": 92900 }, { - "epoch": 1.0, - "learning_rate": 0.00014933839268340142, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.00022968856420683007, + "loss": 0.0187, "step": 92910 }, { - "epoch": 1.0, - "learning_rate": 0.00014932217681779854, - "loss": 0.0142, + "epoch": 0.47, + "learning_rate": 0.00022968099651381606, + "loss": 0.0147, "step": 92920 }, { - "epoch": 1.0, - "learning_rate": 0.0001493059609521956, - "loss": 0.0097, + "epoch": 0.47, + "learning_rate": 0.00022967342882080206, + "loss": 0.0154, "step": 92930 }, { - "epoch": 1.0, - "learning_rate": 0.00014928974508659272, - "loss": 0.0147, + "epoch": 0.47, + "learning_rate": 0.00022966586112778805, + "loss": 0.0139, "step": 92940 }, { - "epoch": 1.0, - "learning_rate": 0.0001492735292209898, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00022965829343477403, + "loss": 0.0155, "step": 92950 }, { - "epoch": 1.0, - "learning_rate": 0.0001492573133553869, - "loss": 0.0133, + "epoch": 0.47, + "learning_rate": 0.00022965072574176004, + "loss": 0.0153, "step": 92960 }, { - "epoch": 1.01, - "learning_rate": 0.00014924109748978398, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00022964315804874602, + "loss": 0.0146, "step": 92970 }, { - "epoch": 1.01, - "learning_rate": 0.0001492248816241811, - "loss": 0.0102, + "epoch": 0.47, + "learning_rate": 0.000229635590355732, + "loss": 0.0187, "step": 92980 }, { - "epoch": 1.01, - "learning_rate": 0.0001492086657585782, - "loss": 0.0131, + "epoch": 0.47, + "learning_rate": 0.00022962802266271798, + "loss": 0.0197, "step": 92990 }, { - "epoch": 1.01, - "learning_rate": 0.00014919244989297528, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.000229620454969704, + "loss": 0.0164, "step": 93000 }, { - "epoch": 1.01, - "eval_cer": 0.9215599414214166, - "eval_loss": 0.008955257013440132, - "eval_runtime": 121.985, - "eval_samples_per_second": 16.395, - "eval_steps_per_second": 4.099, + "epoch": 0.47, + "eval_cer": 0.9144867526372941, + "eval_loss": 0.0119341891258955, + "eval_runtime": 116.7754, + "eval_samples_per_second": 17.127, + "eval_steps_per_second": 4.282, "step": 93000 }, { - "epoch": 1.01, - "learning_rate": 0.00014917623402737237, - "loss": 0.0093, + "epoch": 0.47, + "learning_rate": 0.00022961288727668997, + "loss": 0.0171, "step": 93010 }, { - "epoch": 1.01, - "learning_rate": 0.00014916001816176947, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022960531958367595, + "loss": 0.0176, "step": 93020 }, { - "epoch": 1.01, - "learning_rate": 0.00014914380229616656, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.00022959775189066196, + "loss": 0.0171, "step": 93030 }, { - "epoch": 1.01, - "learning_rate": 0.00014912758643056365, - "loss": 0.0138, + "epoch": 0.47, + "learning_rate": 0.00022959018419764794, + "loss": 0.0164, "step": 93040 }, { - "epoch": 1.01, - "learning_rate": 0.00014911137056496075, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00022958261650463392, + "loss": 0.0181, "step": 93050 }, { - "epoch": 1.01, - "learning_rate": 0.00014909515469935784, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022957504881161993, + "loss": 0.0164, "step": 93060 }, { - "epoch": 1.01, - "learning_rate": 0.00014907893883375493, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.0002295674811186059, + "loss": 0.0162, "step": 93070 }, { - "epoch": 1.01, - "learning_rate": 0.00014906272296815202, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.0002295599134255919, + "loss": 0.0144, "step": 93080 }, { - "epoch": 1.01, - "learning_rate": 0.00014904650710254912, - "loss": 0.0089, + "epoch": 0.47, + "learning_rate": 0.0002295523457325779, + "loss": 0.0169, "step": 93090 }, { - "epoch": 1.01, - "learning_rate": 0.0001490302912369462, - "loss": 0.009, + "epoch": 0.47, + "learning_rate": 0.00022954477803956388, + "loss": 0.0152, "step": 93100 }, { - "epoch": 1.01, - "learning_rate": 0.0001490140753713433, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022953721034654987, + "loss": 0.013, "step": 93110 }, { - "epoch": 1.01, - "learning_rate": 0.00014899785950574042, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.00022952964265353587, + "loss": 0.0171, "step": 93120 }, { - "epoch": 1.01, - "learning_rate": 0.0001489816436401375, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.00022952207496052186, + "loss": 0.0178, "step": 93130 }, { - "epoch": 1.01, - "learning_rate": 0.0001489654277745346, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.00022951450726750784, + "loss": 0.0179, "step": 93140 }, { - "epoch": 1.01, - "learning_rate": 0.00014894921190893167, - "loss": 0.0151, + "epoch": 0.47, + "learning_rate": 0.00022950693957449382, + "loss": 0.0142, "step": 93150 }, { - "epoch": 1.01, - "learning_rate": 0.0001489329960433288, - "loss": 0.0088, + "epoch": 0.47, + "learning_rate": 0.00022949937188147983, + "loss": 0.0143, "step": 93160 }, { - "epoch": 1.01, - "learning_rate": 0.00014891678017772586, - "loss": 0.0101, + "epoch": 0.47, + "learning_rate": 0.0002294918041884658, + "loss": 0.015, "step": 93170 }, { - "epoch": 1.01, - "learning_rate": 0.00014890056431212298, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.0002294842364954518, + "loss": 0.0162, "step": 93180 }, { - "epoch": 1.01, - "learning_rate": 0.00014888434844652007, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.0002294766688024378, + "loss": 0.0168, "step": 93190 }, { - "epoch": 1.01, - "learning_rate": 0.00014886813258091716, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022946910110942378, + "loss": 0.0154, "step": 93200 }, { - "epoch": 1.01, - "learning_rate": 0.00014885191671531426, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00022946153341640976, + "loss": 0.0138, "step": 93210 }, { - "epoch": 1.01, - "learning_rate": 0.00014883570084971135, - "loss": 0.0122, + "epoch": 0.47, + "learning_rate": 0.00022945396572339577, + "loss": 0.0142, "step": 93220 }, { - "epoch": 1.01, - "learning_rate": 0.00014881948498410844, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.00022944639803038175, + "loss": 0.0178, "step": 93230 }, { - "epoch": 1.01, - "learning_rate": 0.00014880326911850553, - "loss": 0.0145, + "epoch": 0.47, + "learning_rate": 0.00022943883033736773, + "loss": 0.0164, "step": 93240 }, { - "epoch": 1.01, - "learning_rate": 0.00014878705325290263, - "loss": 0.0099, + "epoch": 0.47, + "learning_rate": 0.00022943126264435374, + "loss": 0.0153, "step": 93250 }, { - "epoch": 1.01, - "learning_rate": 0.00014877083738729972, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.00022942369495133972, + "loss": 0.0153, "step": 93260 }, { - "epoch": 1.01, - "learning_rate": 0.0001487546215216968, - "loss": 0.0121, + "epoch": 0.47, + "learning_rate": 0.0002294161272583257, + "loss": 0.02, "step": 93270 }, { - "epoch": 1.01, - "learning_rate": 0.0001487384056560939, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.0002294085595653117, + "loss": 0.0168, "step": 93280 }, { - "epoch": 1.01, - "learning_rate": 0.000148722189790491, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.0002294009918722977, + "loss": 0.0161, "step": 93290 }, { - "epoch": 1.01, - "learning_rate": 0.0001487059739248881, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00022939342417928368, + "loss": 0.0146, "step": 93300 }, { - "epoch": 1.01, - "learning_rate": 0.00014868975805928518, - "loss": 0.0153, + "epoch": 0.47, + "learning_rate": 0.00022938585648626966, + "loss": 0.0162, "step": 93310 }, { - "epoch": 1.01, - "learning_rate": 0.00014867354219368228, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022937828879325567, + "loss": 0.0158, "step": 93320 }, { - "epoch": 1.01, - "learning_rate": 0.00014865732632807937, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.00022937072110024165, + "loss": 0.0166, "step": 93330 }, { - "epoch": 1.01, - "learning_rate": 0.0001486411104624765, - "loss": 0.0118, + "epoch": 0.47, + "learning_rate": 0.00022936315340722763, + "loss": 0.0159, "step": 93340 }, { - "epoch": 1.01, - "learning_rate": 0.00014862489459687355, - "loss": 0.0097, + "epoch": 0.47, + "learning_rate": 0.00022935558571421364, + "loss": 0.0178, "step": 93350 }, { - "epoch": 1.01, - "learning_rate": 0.00014860867873127067, - "loss": 0.0081, + "epoch": 0.47, + "learning_rate": 0.00022934801802119962, + "loss": 0.0145, "step": 93360 }, { - "epoch": 1.01, - "learning_rate": 0.00014859246286566774, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.0002293404503281856, + "loss": 0.0168, "step": 93370 }, { - "epoch": 1.01, - "learning_rate": 0.00014857624700006486, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.0002293328826351716, + "loss": 0.0142, "step": 93380 }, { - "epoch": 1.01, - "learning_rate": 0.00014856003113446193, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.0002293253149421576, + "loss": 0.0172, "step": 93390 }, { - "epoch": 1.01, - "learning_rate": 0.00014854381526885905, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.00022931774724914357, + "loss": 0.0138, "step": 93400 }, { - "epoch": 1.01, - "learning_rate": 0.00014852759940325614, - "loss": 0.0119, + "epoch": 0.47, + "learning_rate": 0.00022931017955612958, + "loss": 0.0148, "step": 93410 }, { - "epoch": 1.01, - "learning_rate": 0.00014851138353765323, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.00022930261186311556, + "loss": 0.014, "step": 93420 }, { - "epoch": 1.01, - "learning_rate": 0.00014849516767205032, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.00022929504417010154, + "loss": 0.015, "step": 93430 }, { - "epoch": 1.01, - "learning_rate": 0.00014847895180644742, - "loss": 0.0083, + "epoch": 0.47, + "learning_rate": 0.00022928747647708755, + "loss": 0.0141, "step": 93440 }, { - "epoch": 1.01, - "learning_rate": 0.0001484627359408445, - "loss": 0.0102, + "epoch": 0.47, + "learning_rate": 0.00022927990878407353, + "loss": 0.0186, "step": 93450 }, { - "epoch": 1.01, - "learning_rate": 0.0001484465200752416, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022927234109105951, + "loss": 0.0208, "step": 93460 }, { - "epoch": 1.01, - "learning_rate": 0.0001484303042096387, - "loss": 0.0134, + "epoch": 0.47, + "learning_rate": 0.00022926477339804552, + "loss": 0.0142, "step": 93470 }, { - "epoch": 1.01, - "learning_rate": 0.0001484140883440358, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.0002292572057050315, + "loss": 0.0183, "step": 93480 }, { - "epoch": 1.01, - "learning_rate": 0.00014839787247843288, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022924963801201749, + "loss": 0.0149, "step": 93490 }, { - "epoch": 1.01, - "learning_rate": 0.00014838165661282997, - "loss": 0.0096, + "epoch": 0.47, + "learning_rate": 0.00022924207031900347, + "loss": 0.0197, "step": 93500 }, { - "epoch": 1.01, - "learning_rate": 0.0001483654407472271, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.00022923450262598948, + "loss": 0.0162, "step": 93510 }, { - "epoch": 1.01, - "learning_rate": 0.00014834922488162416, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022922693493297546, + "loss": 0.0183, "step": 93520 }, { - "epoch": 1.01, - "learning_rate": 0.00014833300901602128, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.00022921936723996144, + "loss": 0.0166, "step": 93530 }, { - "epoch": 1.01, - "learning_rate": 0.00014831679315041834, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.00022921179954694745, + "loss": 0.0161, "step": 93540 }, { - "epoch": 1.01, - "learning_rate": 0.00014830057728481546, - "loss": 0.0096, + "epoch": 0.47, + "learning_rate": 0.00022920423185393343, + "loss": 0.0185, "step": 93550 }, { - "epoch": 1.01, - "learning_rate": 0.00014828436141921256, - "loss": 0.0097, + "epoch": 0.47, + "learning_rate": 0.0002291966641609194, + "loss": 0.0173, "step": 93560 }, { - "epoch": 1.01, - "learning_rate": 0.00014826814555360965, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.00022918909646790542, + "loss": 0.0161, "step": 93570 }, { - "epoch": 1.01, - "learning_rate": 0.00014825192968800674, - "loss": 0.0115, + "epoch": 0.47, + "learning_rate": 0.0002291815287748914, + "loss": 0.017, "step": 93580 }, { - "epoch": 1.01, - "learning_rate": 0.00014823571382240383, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.00022917396108187738, + "loss": 0.016, "step": 93590 }, { - "epoch": 1.01, - "learning_rate": 0.00014821949795680093, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.0002291663933888634, + "loss": 0.0143, "step": 93600 }, { - "epoch": 1.01, - "learning_rate": 0.00014820328209119802, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.00022915882569584937, + "loss": 0.0143, "step": 93610 }, { - "epoch": 1.01, - "learning_rate": 0.0001481870662255951, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022915125800283535, + "loss": 0.014, "step": 93620 }, { - "epoch": 1.01, - "learning_rate": 0.0001481708503599922, - "loss": 0.0083, + "epoch": 0.47, + "learning_rate": 0.00022914369030982136, + "loss": 0.0147, "step": 93630 }, { - "epoch": 1.01, - "learning_rate": 0.0001481546344943893, - "loss": 0.0095, + "epoch": 0.47, + "learning_rate": 0.00022913612261680732, + "loss": 0.0186, "step": 93640 }, { - "epoch": 1.01, - "learning_rate": 0.0001481384186287864, - "loss": 0.0093, + "epoch": 0.47, + "learning_rate": 0.0002291285549237933, + "loss": 0.0168, "step": 93650 }, { - "epoch": 1.01, - "learning_rate": 0.00014812220276318348, - "loss": 0.013, + "epoch": 0.47, + "learning_rate": 0.00022912098723077928, + "loss": 0.0145, "step": 93660 }, { - "epoch": 1.01, - "learning_rate": 0.00014810598689758058, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.0002291134195377653, + "loss": 0.0159, "step": 93670 }, { - "epoch": 1.01, - "learning_rate": 0.00014808977103197767, - "loss": 0.0135, + "epoch": 0.47, + "learning_rate": 0.00022910585184475127, + "loss": 0.0151, "step": 93680 }, { - "epoch": 1.01, - "learning_rate": 0.00014807355516637476, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.00022909828415173725, + "loss": 0.0158, "step": 93690 }, { - "epoch": 1.01, - "learning_rate": 0.00014805733930077185, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00022909071645872326, + "loss": 0.0286, "step": 93700 }, { - "epoch": 1.01, - "learning_rate": 0.00014804112343516897, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00022908314876570924, + "loss": 0.0202, "step": 93710 }, { - "epoch": 1.01, - "learning_rate": 0.00014802490756956604, - "loss": 0.0118, + "epoch": 0.47, + "learning_rate": 0.00022907558107269522, + "loss": 0.0162, "step": 93720 }, { - "epoch": 1.01, - "learning_rate": 0.00014800869170396316, - "loss": 0.0125, + "epoch": 0.47, + "learning_rate": 0.0002290680133796812, + "loss": 0.0167, "step": 93730 }, { - "epoch": 1.01, - "learning_rate": 0.00014799247583836023, - "loss": 0.0118, + "epoch": 0.47, + "learning_rate": 0.0002290604456866672, + "loss": 0.0191, "step": 93740 }, { - "epoch": 1.01, - "learning_rate": 0.00014797625997275735, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.0002290528779936532, + "loss": 0.0178, "step": 93750 }, { - "epoch": 1.01, - "learning_rate": 0.0001479600441071544, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.00022904531030063917, + "loss": 0.0186, "step": 93760 }, { - "epoch": 1.01, - "learning_rate": 0.00014794382824155153, - "loss": 0.0128, + "epoch": 0.47, + "learning_rate": 0.00022903774260762518, + "loss": 0.0159, "step": 93770 }, { - "epoch": 1.01, - "learning_rate": 0.00014792761237594862, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.00022903017491461116, + "loss": 0.0166, "step": 93780 }, { - "epoch": 1.01, - "learning_rate": 0.00014791139651034572, - "loss": 0.0122, + "epoch": 0.47, + "learning_rate": 0.00022902260722159715, + "loss": 0.0206, "step": 93790 }, { - "epoch": 1.01, - "learning_rate": 0.0001478951806447428, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00022901503952858315, + "loss": 0.0184, "step": 93800 }, { - "epoch": 1.01, - "learning_rate": 0.0001478789647791399, - "loss": 0.008, + "epoch": 0.47, + "learning_rate": 0.00022900747183556914, + "loss": 0.0159, "step": 93810 }, { - "epoch": 1.01, - "learning_rate": 0.000147862748913537, - "loss": 0.0091, + "epoch": 0.47, + "learning_rate": 0.00022899990414255512, + "loss": 0.0153, "step": 93820 }, { - "epoch": 1.01, - "learning_rate": 0.0001478465330479341, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.00022899233644954113, + "loss": 0.018, "step": 93830 }, { - "epoch": 1.01, - "learning_rate": 0.00014783031718233118, - "loss": 0.0115, + "epoch": 0.47, + "learning_rate": 0.0002289847687565271, + "loss": 0.0178, "step": 93840 }, { - "epoch": 1.01, - "learning_rate": 0.00014781410131672827, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.0002289772010635131, + "loss": 0.0171, "step": 93850 }, { - "epoch": 1.01, - "learning_rate": 0.00014779788545112537, - "loss": 0.0124, + "epoch": 0.47, + "learning_rate": 0.0002289696333704991, + "loss": 0.0188, "step": 93860 }, { - "epoch": 1.01, - "learning_rate": 0.00014778166958552246, - "loss": 0.009, + "epoch": 0.47, + "learning_rate": 0.00022896206567748508, + "loss": 0.0165, "step": 93870 }, { - "epoch": 1.01, - "learning_rate": 0.00014776545371991955, - "loss": 0.0137, + "epoch": 0.47, + "learning_rate": 0.00022895449798447106, + "loss": 0.0183, "step": 93880 }, { - "epoch": 1.01, - "learning_rate": 0.00014774923785431664, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.00022894693029145704, + "loss": 0.013, "step": 93890 }, { - "epoch": 1.02, - "learning_rate": 0.00014773302198871374, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.00022893936259844305, + "loss": 0.0163, "step": 93900 }, { - "epoch": 1.02, - "learning_rate": 0.00014771680612311083, - "loss": 0.0119, + "epoch": 0.47, + "learning_rate": 0.00022893179490542903, + "loss": 0.0166, "step": 93910 }, { - "epoch": 1.02, - "learning_rate": 0.00014770059025750792, - "loss": 0.0091, + "epoch": 0.47, + "learning_rate": 0.000228924227212415, + "loss": 0.0152, "step": 93920 }, { - "epoch": 1.02, - "learning_rate": 0.00014768437439190504, - "loss": 0.0101, + "epoch": 0.47, + "learning_rate": 0.00022891665951940102, + "loss": 0.0181, "step": 93930 }, { - "epoch": 1.02, - "learning_rate": 0.0001476681585263021, - "loss": 0.0132, + "epoch": 0.47, + "learning_rate": 0.000228909091826387, + "loss": 0.0155, "step": 93940 }, { - "epoch": 1.02, - "learning_rate": 0.00014765194266069923, - "loss": 0.0124, + "epoch": 0.47, + "learning_rate": 0.00022890152413337298, + "loss": 0.012, "step": 93950 }, { - "epoch": 1.02, - "learning_rate": 0.0001476357267950963, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.000228893956440359, + "loss": 0.0129, "step": 93960 }, { - "epoch": 1.02, - "learning_rate": 0.0001476195109294934, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.00022888638874734497, + "loss": 0.0165, "step": 93970 }, { - "epoch": 1.02, - "learning_rate": 0.00014760329506389048, - "loss": 0.0131, + "epoch": 0.47, + "learning_rate": 0.00022887882105433096, + "loss": 0.0173, "step": 93980 }, { - "epoch": 1.02, - "learning_rate": 0.0001475870791982876, - "loss": 0.0135, + "epoch": 0.47, + "learning_rate": 0.00022887125336131696, + "loss": 0.0153, "step": 93990 }, { - "epoch": 1.02, - "learning_rate": 0.0001475708633326847, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.00022886368566830295, + "loss": 0.0188, "step": 94000 }, { - "epoch": 1.02, - "eval_cer": 0.9215634158332421, - "eval_loss": 0.008654128760099411, - "eval_runtime": 121.8962, - "eval_samples_per_second": 16.407, - "eval_steps_per_second": 4.102, + "epoch": 0.47, + "eval_cer": 0.914481900656667, + "eval_loss": 0.011606461368501186, + "eval_runtime": 116.7314, + "eval_samples_per_second": 17.133, + "eval_steps_per_second": 4.283, "step": 94000 }, { - "epoch": 1.02, - "learning_rate": 0.00014755464746708178, - "loss": 0.0152, + "epoch": 0.47, + "learning_rate": 0.00022885611797528893, + "loss": 0.0187, "step": 94010 }, { - "epoch": 1.02, - "learning_rate": 0.00014753843160147888, - "loss": 0.0115, + "epoch": 0.47, + "learning_rate": 0.00022884855028227494, + "loss": 0.0155, "step": 94020 }, { - "epoch": 1.02, - "learning_rate": 0.00014752221573587597, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.00022884098258926092, + "loss": 0.014, "step": 94030 }, { - "epoch": 1.02, - "learning_rate": 0.00014750599987027306, - "loss": 0.0096, + "epoch": 0.47, + "learning_rate": 0.0002288334148962469, + "loss": 0.0193, "step": 94040 }, { - "epoch": 1.02, - "learning_rate": 0.00014748978400467015, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.00022882584720323288, + "loss": 0.0132, "step": 94050 }, { - "epoch": 1.02, - "learning_rate": 0.00014747356813906725, - "loss": 0.0124, + "epoch": 0.47, + "learning_rate": 0.0002288182795102189, + "loss": 0.0186, "step": 94060 }, { - "epoch": 1.02, - "learning_rate": 0.00014745735227346434, - "loss": 0.0106, + "epoch": 0.47, + "learning_rate": 0.00022881071181720487, + "loss": 0.0152, "step": 94070 }, { - "epoch": 1.02, - "learning_rate": 0.00014744113640786143, - "loss": 0.0132, + "epoch": 0.47, + "learning_rate": 0.00022880314412419085, + "loss": 0.0158, "step": 94080 }, { - "epoch": 1.02, - "learning_rate": 0.00014742492054225853, - "loss": 0.0097, + "epoch": 0.47, + "learning_rate": 0.00022879557643117686, + "loss": 0.0151, "step": 94090 }, { - "epoch": 1.02, - "learning_rate": 0.00014740870467665562, - "loss": 0.0093, + "epoch": 0.47, + "learning_rate": 0.00022878800873816284, + "loss": 0.0186, "step": 94100 }, { - "epoch": 1.02, - "learning_rate": 0.0001473924888110527, - "loss": 0.0092, + "epoch": 0.47, + "learning_rate": 0.00022878044104514882, + "loss": 0.0133, "step": 94110 }, { - "epoch": 1.02, - "learning_rate": 0.0001473762729454498, - "loss": 0.0118, + "epoch": 0.47, + "learning_rate": 0.00022877287335213483, + "loss": 0.0187, "step": 94120 }, { - "epoch": 1.02, - "learning_rate": 0.0001473600570798469, - "loss": 0.0118, + "epoch": 0.47, + "learning_rate": 0.0002287653056591208, + "loss": 0.0217, "step": 94130 }, { - "epoch": 1.02, - "learning_rate": 0.000147343841214244, - "loss": 0.0099, + "epoch": 0.47, + "learning_rate": 0.0002287577379661068, + "loss": 0.0153, "step": 94140 }, { - "epoch": 1.02, - "learning_rate": 0.0001473276253486411, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.0002287501702730928, + "loss": 0.0171, "step": 94150 }, { - "epoch": 1.02, - "learning_rate": 0.00014731140948303818, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022874260258007878, + "loss": 0.0178, "step": 94160 }, { - "epoch": 1.02, - "learning_rate": 0.0001472951936174353, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.00022873503488706477, + "loss": 0.0148, "step": 94170 }, { - "epoch": 1.02, - "learning_rate": 0.00014727897775183236, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022872746719405077, + "loss": 0.0225, "step": 94180 }, { - "epoch": 1.02, - "learning_rate": 0.00014726276188622948, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022871989950103676, + "loss": 0.0164, "step": 94190 }, { - "epoch": 1.02, - "learning_rate": 0.00014724654602062657, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022871233180802274, + "loss": 0.0153, "step": 94200 }, { - "epoch": 1.02, - "learning_rate": 0.00014723033015502367, - "loss": 0.0112, + "epoch": 0.48, + "learning_rate": 0.00022870476411500872, + "loss": 0.014, "step": 94210 }, { - "epoch": 1.02, - "learning_rate": 0.00014721411428942076, - "loss": 0.0117, + "epoch": 0.48, + "learning_rate": 0.00022869719642199473, + "loss": 0.0184, "step": 94220 }, { - "epoch": 1.02, - "learning_rate": 0.00014719789842381785, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.0002286896287289807, + "loss": 0.0149, "step": 94230 }, { - "epoch": 1.02, - "learning_rate": 0.00014718168255821494, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.0002286820610359667, + "loss": 0.0145, "step": 94240 }, { - "epoch": 1.02, - "learning_rate": 0.00014716546669261204, - "loss": 0.0133, + "epoch": 0.48, + "learning_rate": 0.0002286744933429527, + "loss": 0.0138, "step": 94250 }, { - "epoch": 1.02, - "learning_rate": 0.00014714925082700913, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022866692564993868, + "loss": 0.0158, "step": 94260 }, { - "epoch": 1.02, - "learning_rate": 0.00014713303496140622, - "loss": 0.0142, + "epoch": 0.48, + "learning_rate": 0.00022865935795692466, + "loss": 0.0149, "step": 94270 }, { - "epoch": 1.02, - "learning_rate": 0.00014711681909580334, - "loss": 0.0101, + "epoch": 0.48, + "learning_rate": 0.00022865179026391067, + "loss": 0.0147, "step": 94280 }, { - "epoch": 1.02, - "learning_rate": 0.0001471006032302004, - "loss": 0.0074, + "epoch": 0.48, + "learning_rate": 0.00022864422257089665, + "loss": 0.0195, "step": 94290 }, { - "epoch": 1.02, - "learning_rate": 0.00014708438736459753, - "loss": 0.0131, + "epoch": 0.48, + "learning_rate": 0.00022863665487788263, + "loss": 0.0234, "step": 94300 }, { - "epoch": 1.02, - "learning_rate": 0.0001470681714989946, - "loss": 0.0122, + "epoch": 0.48, + "learning_rate": 0.00022862908718486864, + "loss": 0.019, "step": 94310 }, { - "epoch": 1.02, - "learning_rate": 0.0001470519556333917, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.00022862151949185462, + "loss": 0.0175, "step": 94320 }, { - "epoch": 1.02, - "learning_rate": 0.00014703573976778878, - "loss": 0.0087, + "epoch": 0.48, + "learning_rate": 0.0002286139517988406, + "loss": 0.0148, "step": 94330 }, { - "epoch": 1.02, - "learning_rate": 0.0001470195239021859, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.0002286063841058266, + "loss": 0.017, "step": 94340 }, { - "epoch": 1.02, - "learning_rate": 0.000147003308036583, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.0002285988164128126, + "loss": 0.0187, "step": 94350 }, { - "epoch": 1.02, - "learning_rate": 0.00014698709217098008, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.00022859124871979858, + "loss": 0.0143, "step": 94360 }, { - "epoch": 1.02, - "learning_rate": 0.00014697087630537718, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022858368102678458, + "loss": 0.017, "step": 94370 }, { - "epoch": 1.02, - "learning_rate": 0.00014695466043977427, - "loss": 0.0079, + "epoch": 0.48, + "learning_rate": 0.00022857611333377057, + "loss": 0.0137, "step": 94380 }, { - "epoch": 1.02, - "learning_rate": 0.00014693844457417136, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022856854564075655, + "loss": 0.015, "step": 94390 }, { - "epoch": 1.02, - "learning_rate": 0.00014692222870856846, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022856097794774253, + "loss": 0.0181, "step": 94400 }, { - "epoch": 1.02, - "learning_rate": 0.00014690601284296555, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.00022855341025472854, + "loss": 0.0182, "step": 94410 }, { - "epoch": 1.02, - "learning_rate": 0.00014688979697736264, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022854584256171452, + "loss": 0.0202, "step": 94420 }, { - "epoch": 1.02, - "learning_rate": 0.00014687358111175973, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.0002285382748687005, + "loss": 0.0156, "step": 94430 }, { - "epoch": 1.02, - "learning_rate": 0.00014685736524615683, - "loss": 0.0122, + "epoch": 0.48, + "learning_rate": 0.0002285307071756865, + "loss": 0.0179, "step": 94440 }, { - "epoch": 1.02, - "learning_rate": 0.00014684114938055392, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.0002285231394826725, + "loss": 0.0136, "step": 94450 }, { - "epoch": 1.02, - "learning_rate": 0.000146824933514951, - "loss": 0.0112, + "epoch": 0.48, + "learning_rate": 0.00022851557178965847, + "loss": 0.0125, "step": 94460 }, { - "epoch": 1.02, - "learning_rate": 0.0001468087176493481, - "loss": 0.0094, + "epoch": 0.48, + "learning_rate": 0.00022850800409664448, + "loss": 0.0137, "step": 94470 }, { - "epoch": 1.02, - "learning_rate": 0.0001467925017837452, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022850043640363046, + "loss": 0.0142, "step": 94480 }, { - "epoch": 1.02, - "learning_rate": 0.0001467762859181423, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022849286871061644, + "loss": 0.0159, "step": 94490 }, { - "epoch": 1.02, - "learning_rate": 0.0001467600700525394, - "loss": 0.0122, + "epoch": 0.48, + "learning_rate": 0.00022848530101760245, + "loss": 0.0142, "step": 94500 }, { - "epoch": 1.02, - "learning_rate": 0.00014674385418693648, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022847773332458843, + "loss": 0.0142, "step": 94510 }, { - "epoch": 1.02, - "learning_rate": 0.0001467276383213336, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.00022847016563157441, + "loss": 0.0151, "step": 94520 }, { - "epoch": 1.02, - "learning_rate": 0.00014671142245573066, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.00022846259793856042, + "loss": 0.0179, "step": 94530 }, { - "epoch": 1.02, - "learning_rate": 0.00014669520659012778, - "loss": 0.0101, + "epoch": 0.48, + "learning_rate": 0.0002284550302455464, + "loss": 0.0167, "step": 94540 }, { - "epoch": 1.02, - "learning_rate": 0.00014667899072452485, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.00022844746255253239, + "loss": 0.0168, "step": 94550 }, { - "epoch": 1.02, - "learning_rate": 0.00014666277485892197, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022843989485951837, + "loss": 0.0119, "step": 94560 }, { - "epoch": 1.02, - "learning_rate": 0.00014664655899331906, - "loss": 0.0095, + "epoch": 0.48, + "learning_rate": 0.00022843232716650438, + "loss": 0.0192, "step": 94570 }, { - "epoch": 1.02, - "learning_rate": 0.00014663034312771615, - "loss": 0.0134, + "epoch": 0.48, + "learning_rate": 0.00022842475947349036, + "loss": 0.0196, "step": 94580 }, { - "epoch": 1.02, - "learning_rate": 0.00014661412726211324, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.00022841719178047634, + "loss": 0.0153, "step": 94590 }, { - "epoch": 1.02, - "learning_rate": 0.00014659791139651034, - "loss": 0.0126, + "epoch": 0.48, + "learning_rate": 0.00022840962408746235, + "loss": 0.0139, "step": 94600 }, { - "epoch": 1.02, - "learning_rate": 0.00014658169553090743, - "loss": 0.0104, + "epoch": 0.48, + "learning_rate": 0.00022840205639444833, + "loss": 0.0147, "step": 94610 }, { - "epoch": 1.02, - "learning_rate": 0.00014656547966530452, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.0002283944887014343, + "loss": 0.0126, "step": 94620 }, { - "epoch": 1.02, - "learning_rate": 0.00014654926379970162, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.00022838692100842032, + "loss": 0.0158, "step": 94630 }, { - "epoch": 1.02, - "learning_rate": 0.0001465330479340987, - "loss": 0.0119, + "epoch": 0.48, + "learning_rate": 0.0002283793533154063, + "loss": 0.0156, "step": 94640 }, { - "epoch": 1.02, - "learning_rate": 0.0001465168320684958, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022837178562239228, + "loss": 0.0156, "step": 94650 }, { - "epoch": 1.02, - "learning_rate": 0.0001465006162028929, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.0002283642179293783, + "loss": 0.0148, "step": 94660 }, { - "epoch": 1.02, - "learning_rate": 0.00014648440033728999, - "loss": 0.0104, + "epoch": 0.48, + "learning_rate": 0.00022835665023636427, + "loss": 0.0146, "step": 94670 }, { - "epoch": 1.02, - "learning_rate": 0.00014646818447168708, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022834908254335025, + "loss": 0.0193, "step": 94680 }, { - "epoch": 1.02, - "learning_rate": 0.00014645196860608417, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022834151485033626, + "loss": 0.019, "step": 94690 }, { - "epoch": 1.02, - "learning_rate": 0.00014643575274048126, - "loss": 0.0118, + "epoch": 0.48, + "learning_rate": 0.00022833394715732224, + "loss": 0.0185, "step": 94700 }, { - "epoch": 1.02, - "learning_rate": 0.00014641953687487836, - "loss": 0.0104, + "epoch": 0.48, + "learning_rate": 0.00022832637946430822, + "loss": 0.0194, "step": 94710 }, { - "epoch": 1.02, - "learning_rate": 0.00014640332100927548, - "loss": 0.0117, + "epoch": 0.48, + "learning_rate": 0.0002283188117712942, + "loss": 0.0153, "step": 94720 }, { - "epoch": 1.02, - "learning_rate": 0.00014638710514367254, - "loss": 0.0092, + "epoch": 0.48, + "learning_rate": 0.00022831124407828021, + "loss": 0.0188, "step": 94730 }, { - "epoch": 1.02, - "learning_rate": 0.00014637088927806966, - "loss": 0.0144, + "epoch": 0.48, + "learning_rate": 0.0002283036763852662, + "loss": 0.0141, "step": 94740 }, { - "epoch": 1.02, - "learning_rate": 0.00014635467341246673, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022829610869225218, + "loss": 0.0192, "step": 94750 }, { - "epoch": 1.02, - "learning_rate": 0.00014633845754686385, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.00022828854099923819, + "loss": 0.0184, "step": 94760 }, { - "epoch": 1.02, - "learning_rate": 0.00014632224168126091, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022828097330622417, + "loss": 0.0151, "step": 94770 }, { - "epoch": 1.02, - "learning_rate": 0.00014630602581565803, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.00022827340561321015, + "loss": 0.015, "step": 94780 }, { - "epoch": 1.02, - "learning_rate": 0.00014628980995005513, - "loss": 0.0152, + "epoch": 0.48, + "learning_rate": 0.00022826583792019616, + "loss": 0.0161, "step": 94790 }, { - "epoch": 1.02, - "learning_rate": 0.00014627359408445222, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022825827022718214, + "loss": 0.0218, "step": 94800 }, { - "epoch": 1.02, - "learning_rate": 0.0001462573782188493, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.00022825070253416812, + "loss": 0.0139, "step": 94810 }, { - "epoch": 1.03, - "learning_rate": 0.0001462411623532464, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022824313484115413, + "loss": 0.0153, "step": 94820 }, { - "epoch": 1.03, - "learning_rate": 0.0001462249464876435, - "loss": 0.0102, + "epoch": 0.48, + "learning_rate": 0.0002282355671481401, + "loss": 0.015, "step": 94830 }, { - "epoch": 1.03, - "learning_rate": 0.0001462087306220406, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.0002282279994551261, + "loss": 0.0205, "step": 94840 }, { - "epoch": 1.03, - "learning_rate": 0.00014619251475643768, - "loss": 0.0127, + "epoch": 0.48, + "learning_rate": 0.0002282204317621121, + "loss": 0.012, "step": 94850 }, { - "epoch": 1.03, - "learning_rate": 0.00014617629889083478, - "loss": 0.0117, + "epoch": 0.48, + "learning_rate": 0.00022821286406909808, + "loss": 0.0166, "step": 94860 }, { - "epoch": 1.03, - "learning_rate": 0.00014616008302523187, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.00022820529637608406, + "loss": 0.0121, "step": 94870 }, { - "epoch": 1.03, - "learning_rate": 0.00014614386715962896, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022819772868307007, + "loss": 0.014, "step": 94880 }, { - "epoch": 1.03, - "learning_rate": 0.00014612765129402605, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022819016099005605, + "loss": 0.0148, "step": 94890 }, { - "epoch": 1.03, - "learning_rate": 0.00014611143542842315, - "loss": 0.0119, + "epoch": 0.48, + "learning_rate": 0.000228182593297042, + "loss": 0.0174, "step": 94900 }, { - "epoch": 1.03, - "learning_rate": 0.00014609521956282024, - "loss": 0.0095, + "epoch": 0.48, + "learning_rate": 0.000228175025604028, + "loss": 0.0202, "step": 94910 }, { - "epoch": 1.03, - "learning_rate": 0.00014607900369721733, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.000228167457911014, + "loss": 0.0141, "step": 94920 }, { - "epoch": 1.03, - "learning_rate": 0.00014606278783161442, - "loss": 0.0123, + "epoch": 0.48, + "learning_rate": 0.00022815989021799998, + "loss": 0.015, "step": 94930 }, { - "epoch": 1.03, - "learning_rate": 0.00014604657196601154, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.00022815232252498596, + "loss": 0.0167, "step": 94940 }, { - "epoch": 1.03, - "learning_rate": 0.00014603035610040864, - "loss": 0.0134, + "epoch": 0.48, + "learning_rate": 0.00022814475483197194, + "loss": 0.0169, "step": 94950 }, { - "epoch": 1.03, - "learning_rate": 0.00014601414023480573, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022813718713895795, + "loss": 0.0167, "step": 94960 }, { - "epoch": 1.03, - "learning_rate": 0.00014599792436920282, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022812961944594393, + "loss": 0.0165, "step": 94970 }, { - "epoch": 1.03, - "learning_rate": 0.00014598170850359992, - "loss": 0.0093, + "epoch": 0.48, + "learning_rate": 0.0002281220517529299, + "loss": 0.0185, "step": 94980 }, { - "epoch": 1.03, - "learning_rate": 0.000145965492637997, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022811448405991592, + "loss": 0.0203, "step": 94990 }, { - "epoch": 1.03, - "learning_rate": 0.0001459492767723941, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.0002281069163669019, + "loss": 0.0173, "step": 95000 }, { - "epoch": 1.03, - "eval_cer": 0.9215477809800273, - "eval_loss": 0.009139502421021461, - "eval_runtime": 121.5893, - "eval_samples_per_second": 16.449, - "eval_steps_per_second": 4.112, + "epoch": 0.48, + "eval_cer": 0.9144848118450433, + "eval_loss": 0.012143060564994812, + "eval_runtime": 116.8022, + "eval_samples_per_second": 17.123, + "eval_steps_per_second": 4.281, "step": 95000 }, { - "epoch": 1.03, - "learning_rate": 0.0001459330609067912, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022809934867388788, + "loss": 0.0176, "step": 95010 }, { - "epoch": 1.03, - "learning_rate": 0.0001459168450411883, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.0002280917809808739, + "loss": 0.014, "step": 95020 }, { - "epoch": 1.03, - "learning_rate": 0.00014590062917558538, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022808421328785987, + "loss": 0.0155, "step": 95030 }, { - "epoch": 1.03, - "learning_rate": 0.00014588441330998247, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022807664559484586, + "loss": 0.0143, "step": 95040 }, { - "epoch": 1.03, - "learning_rate": 0.00014586819744437956, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.00022806907790183186, + "loss": 0.015, "step": 95050 }, { - "epoch": 1.03, - "learning_rate": 0.00014585198157877666, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.00022806151020881785, + "loss": 0.0133, "step": 95060 }, { - "epoch": 1.03, - "learning_rate": 0.00014583576571317375, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022805394251580383, + "loss": 0.0157, "step": 95070 }, { - "epoch": 1.03, - "learning_rate": 0.00014581954984757084, - "loss": 0.0095, + "epoch": 0.48, + "learning_rate": 0.00022804637482278984, + "loss": 0.0126, "step": 95080 }, { - "epoch": 1.03, - "learning_rate": 0.00014580333398196796, - "loss": 0.0094, + "epoch": 0.48, + "learning_rate": 0.00022803880712977582, + "loss": 0.0153, "step": 95090 }, { - "epoch": 1.03, - "learning_rate": 0.00014578711811636503, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.0002280312394367618, + "loss": 0.0156, "step": 95100 }, { - "epoch": 1.03, - "learning_rate": 0.00014577090225076215, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022802367174374778, + "loss": 0.0134, "step": 95110 }, { - "epoch": 1.03, - "learning_rate": 0.00014575468638515921, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.0002280161040507338, + "loss": 0.0182, "step": 95120 }, { - "epoch": 1.03, - "learning_rate": 0.00014573847051955633, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022800853635771977, + "loss": 0.0154, "step": 95130 }, { - "epoch": 1.03, - "learning_rate": 0.0001457222546539534, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022800096866470575, + "loss": 0.0159, "step": 95140 }, { - "epoch": 1.03, - "learning_rate": 0.00014570603878835052, - "loss": 0.0136, + "epoch": 0.48, + "learning_rate": 0.00022799340097169176, + "loss": 0.0168, "step": 95150 }, { - "epoch": 1.03, - "learning_rate": 0.0001456898229227476, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022798583327867774, + "loss": 0.015, "step": 95160 }, { - "epoch": 1.03, - "learning_rate": 0.0001456736070571447, - "loss": 0.0092, + "epoch": 0.48, + "learning_rate": 0.00022797826558566372, + "loss": 0.0139, "step": 95170 }, { - "epoch": 1.03, - "learning_rate": 0.0001456573911915418, - "loss": 0.0091, + "epoch": 0.48, + "learning_rate": 0.00022797069789264973, + "loss": 0.0164, "step": 95180 }, { - "epoch": 1.03, - "learning_rate": 0.0001456411753259389, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.0002279631301996357, + "loss": 0.018, "step": 95190 }, { - "epoch": 1.03, - "learning_rate": 0.00014562495946033598, - "loss": 0.0135, + "epoch": 0.48, + "learning_rate": 0.0002279555625066217, + "loss": 0.0143, "step": 95200 }, { - "epoch": 1.03, - "learning_rate": 0.00014560874359473308, - "loss": 0.013, + "epoch": 0.48, + "learning_rate": 0.0002279479948136077, + "loss": 0.0156, "step": 95210 }, { - "epoch": 1.03, - "learning_rate": 0.00014559252772913017, - "loss": 0.0127, + "epoch": 0.48, + "learning_rate": 0.00022794042712059368, + "loss": 0.0145, "step": 95220 }, { - "epoch": 1.03, - "learning_rate": 0.00014557631186352726, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022793285942757967, + "loss": 0.0156, "step": 95230 }, { - "epoch": 1.03, - "learning_rate": 0.00014556009599792435, - "loss": 0.0119, + "epoch": 0.48, + "learning_rate": 0.00022792529173456567, + "loss": 0.0157, "step": 95240 }, { - "epoch": 1.03, - "learning_rate": 0.00014554388013232145, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022791772404155166, + "loss": 0.0172, "step": 95250 }, { - "epoch": 1.03, - "learning_rate": 0.00014552766426671854, - "loss": 0.0102, + "epoch": 0.48, + "learning_rate": 0.00022791015634853764, + "loss": 0.0164, "step": 95260 }, { - "epoch": 1.03, - "learning_rate": 0.00014551144840111563, - "loss": 0.0123, + "epoch": 0.48, + "learning_rate": 0.00022790258865552365, + "loss": 0.0146, "step": 95270 }, { - "epoch": 1.03, - "learning_rate": 0.00014549523253551273, - "loss": 0.0125, + "epoch": 0.48, + "learning_rate": 0.00022789502096250963, + "loss": 0.0165, "step": 95280 }, { - "epoch": 1.03, - "learning_rate": 0.00014547901666990984, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.0002278874532694956, + "loss": 0.0332, "step": 95290 }, { - "epoch": 1.03, - "learning_rate": 0.0001454628008043069, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.0002278798855764816, + "loss": 0.0154, "step": 95300 }, { - "epoch": 1.03, - "learning_rate": 0.00014544658493870403, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.0002278723178834676, + "loss": 0.0166, "step": 95310 }, { - "epoch": 1.03, - "learning_rate": 0.0001454303690731011, - "loss": 0.0101, + "epoch": 0.48, + "learning_rate": 0.00022786475019045358, + "loss": 0.0529, "step": 95320 }, { - "epoch": 1.03, - "learning_rate": 0.00014541415320749822, - "loss": 0.0089, + "epoch": 0.48, + "learning_rate": 0.00022785718249743956, + "loss": 0.0173, "step": 95330 }, { - "epoch": 1.03, - "learning_rate": 0.00014539793734189528, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022784961480442557, + "loss": 0.0187, "step": 95340 }, { - "epoch": 1.03, - "learning_rate": 0.0001453817214762924, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022784204711141155, + "loss": 0.0175, "step": 95350 }, { - "epoch": 1.03, - "learning_rate": 0.0001453655056106895, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022783447941839753, + "loss": 0.0157, "step": 95360 }, { - "epoch": 1.03, - "learning_rate": 0.0001453492897450866, - "loss": 0.0084, + "epoch": 0.48, + "learning_rate": 0.00022782691172538354, + "loss": 0.0186, "step": 95370 }, { - "epoch": 1.03, - "learning_rate": 0.00014533307387948368, - "loss": 0.0129, + "epoch": 0.48, + "learning_rate": 0.00022781934403236952, + "loss": 0.0187, "step": 95380 }, { - "epoch": 1.03, - "learning_rate": 0.00014531685801388077, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.0002278117763393555, + "loss": 0.0146, "step": 95390 }, { - "epoch": 1.03, - "learning_rate": 0.00014530064214827787, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.0002278042086463415, + "loss": 0.017, "step": 95400 }, { - "epoch": 1.03, - "learning_rate": 0.00014528442628267496, - "loss": 0.013, + "epoch": 0.48, + "learning_rate": 0.0002277966409533275, + "loss": 0.0155, "step": 95410 }, { - "epoch": 1.03, - "learning_rate": 0.00014526821041707205, - "loss": 0.0091, + "epoch": 0.48, + "learning_rate": 0.00022778907326031348, + "loss": 0.0159, "step": 95420 }, { - "epoch": 1.03, - "learning_rate": 0.00014525199455146914, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022778150556729948, + "loss": 0.0171, "step": 95430 }, { - "epoch": 1.03, - "learning_rate": 0.00014523577868586624, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.00022777393787428547, + "loss": 0.0189, "step": 95440 }, { - "epoch": 1.03, - "learning_rate": 0.00014521956282026333, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.00022776637018127145, + "loss": 0.018, "step": 95450 }, { - "epoch": 1.03, - "learning_rate": 0.00014520334695466042, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022775880248825743, + "loss": 0.0197, "step": 95460 }, { - "epoch": 1.03, - "learning_rate": 0.00014518713108905751, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022775123479524344, + "loss": 0.0179, "step": 95470 }, { - "epoch": 1.03, - "learning_rate": 0.0001451709152234546, - "loss": 0.0117, + "epoch": 0.48, + "learning_rate": 0.00022774366710222942, + "loss": 0.0147, "step": 95480 }, { - "epoch": 1.03, - "learning_rate": 0.0001451546993578517, - "loss": 0.0102, + "epoch": 0.48, + "learning_rate": 0.0002277360994092154, + "loss": 0.0176, "step": 95490 }, { - "epoch": 1.03, - "learning_rate": 0.0001451384834922488, - "loss": 0.0081, + "epoch": 0.48, + "learning_rate": 0.0002277285317162014, + "loss": 0.0155, "step": 95500 }, { - "epoch": 1.03, - "learning_rate": 0.0001451222676266459, - "loss": 0.0125, + "epoch": 0.48, + "learning_rate": 0.0002277209640231874, + "loss": 0.014, "step": 95510 }, { - "epoch": 1.03, - "learning_rate": 0.00014510605176104298, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.00022771339633017337, + "loss": 0.019, "step": 95520 }, { - "epoch": 1.03, - "learning_rate": 0.0001450898358954401, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.00022770582863715938, + "loss": 0.0147, "step": 95530 }, { - "epoch": 1.03, - "learning_rate": 0.00014507362002983716, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022769826094414536, + "loss": 0.0153, "step": 95540 }, { - "epoch": 1.03, - "learning_rate": 0.00014505740416423428, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022769069325113134, + "loss": 0.0166, "step": 95550 }, { - "epoch": 1.03, - "learning_rate": 0.00014504118829863135, - "loss": 0.0112, + "epoch": 0.48, + "learning_rate": 0.00022768312555811735, + "loss": 0.0147, "step": 95560 }, { - "epoch": 1.03, - "learning_rate": 0.00014502497243302847, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022767555786510333, + "loss": 0.0152, "step": 95570 }, { - "epoch": 1.03, - "learning_rate": 0.00014500875656742556, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022766799017208931, + "loss": 0.017, "step": 95580 }, { - "epoch": 1.03, - "learning_rate": 0.00014499254070182265, - "loss": 0.0123, + "epoch": 0.48, + "learning_rate": 0.00022766042247907532, + "loss": 0.0192, "step": 95590 }, { - "epoch": 1.03, - "learning_rate": 0.00014497632483621975, - "loss": 0.0084, + "epoch": 0.48, + "learning_rate": 0.0002276528547860613, + "loss": 0.0194, "step": 95600 }, { - "epoch": 1.03, - "learning_rate": 0.00014496010897061684, - "loss": 0.0124, + "epoch": 0.48, + "learning_rate": 0.00022764528709304729, + "loss": 0.0181, "step": 95610 }, { - "epoch": 1.03, - "learning_rate": 0.00014494389310501393, - "loss": 0.0104, + "epoch": 0.48, + "learning_rate": 0.00022763771940003327, + "loss": 0.0169, "step": 95620 }, { - "epoch": 1.03, - "learning_rate": 0.00014492767723941103, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.00022763015170701928, + "loss": 0.0168, "step": 95630 }, { - "epoch": 1.03, - "learning_rate": 0.00014491146137380812, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.00022762258401400526, + "loss": 0.0175, "step": 95640 }, { - "epoch": 1.03, - "learning_rate": 0.0001448952455082052, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022761501632099124, + "loss": 0.0158, "step": 95650 }, { - "epoch": 1.03, - "learning_rate": 0.0001448790296426023, - "loss": 0.0128, + "epoch": 0.48, + "learning_rate": 0.00022760744862797725, + "loss": 0.0144, "step": 95660 }, { - "epoch": 1.03, - "learning_rate": 0.0001448628137769994, - "loss": 0.0146, + "epoch": 0.48, + "learning_rate": 0.00022759988093496323, + "loss": 0.0214, "step": 95670 }, { - "epoch": 1.03, - "learning_rate": 0.00014484659791139652, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.0002275923132419492, + "loss": 0.0203, "step": 95680 }, { - "epoch": 1.03, - "learning_rate": 0.00014483038204579358, - "loss": 0.0081, + "epoch": 0.48, + "learning_rate": 0.00022758474554893522, + "loss": 0.0149, "step": 95690 }, { - "epoch": 1.03, - "learning_rate": 0.0001448141661801907, - "loss": 0.0081, + "epoch": 0.48, + "learning_rate": 0.0002275771778559212, + "loss": 0.0146, "step": 95700 }, { - "epoch": 1.03, - "learning_rate": 0.00014479795031458777, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022756961016290718, + "loss": 0.0123, "step": 95710 }, { - "epoch": 1.03, - "learning_rate": 0.0001447817344489849, - "loss": 0.0102, + "epoch": 0.48, + "learning_rate": 0.0002275620424698932, + "loss": 0.0182, "step": 95720 }, { - "epoch": 1.03, - "learning_rate": 0.00014476551858338198, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.00022755447477687917, + "loss": 0.0166, "step": 95730 }, { - "epoch": 1.03, - "learning_rate": 0.00014474930271777907, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022754690708386515, + "loss": 0.0231, "step": 95740 }, { - "epoch": 1.04, - "learning_rate": 0.00014473308685217617, - "loss": 0.0086, + "epoch": 0.48, + "learning_rate": 0.00022753933939085116, + "loss": 0.0151, "step": 95750 }, { - "epoch": 1.04, - "learning_rate": 0.00014471687098657326, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022753177169783714, + "loss": 0.018, "step": 95760 }, { - "epoch": 1.04, - "learning_rate": 0.00014470065512097035, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022752420400482312, + "loss": 0.0167, "step": 95770 }, { - "epoch": 1.04, - "learning_rate": 0.00014468443925536744, - "loss": 0.0092, + "epoch": 0.48, + "learning_rate": 0.00022751663631180913, + "loss": 0.017, "step": 95780 }, { - "epoch": 1.04, - "learning_rate": 0.00014466822338976454, - "loss": 0.0102, + "epoch": 0.48, + "learning_rate": 0.00022750906861879511, + "loss": 0.0186, "step": 95790 }, { - "epoch": 1.04, - "learning_rate": 0.00014465200752416163, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.0002275015009257811, + "loss": 0.017, "step": 95800 }, { - "epoch": 1.04, - "learning_rate": 0.00014463579165855872, - "loss": 0.0139, + "epoch": 0.48, + "learning_rate": 0.00022749393323276708, + "loss": 0.0172, "step": 95810 }, { - "epoch": 1.04, - "learning_rate": 0.00014461957579295581, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022748636553975309, + "loss": 0.0189, "step": 95820 }, { - "epoch": 1.04, - "learning_rate": 0.0001446033599273529, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022747879784673907, + "loss": 0.018, "step": 95830 }, { - "epoch": 1.04, - "learning_rate": 0.00014458714406175, - "loss": 0.0089, + "epoch": 0.48, + "learning_rate": 0.00022747123015372505, + "loss": 0.0173, "step": 95840 }, { - "epoch": 1.04, - "learning_rate": 0.0001445709281961471, - "loss": 0.0104, + "epoch": 0.48, + "learning_rate": 0.00022746366246071106, + "loss": 0.0138, "step": 95850 }, { - "epoch": 1.04, - "learning_rate": 0.00014455471233054419, - "loss": 0.0112, + "epoch": 0.48, + "learning_rate": 0.00022745609476769704, + "loss": 0.0167, "step": 95860 }, { - "epoch": 1.04, - "learning_rate": 0.00014453849646494128, - "loss": 0.007, + "epoch": 0.48, + "learning_rate": 0.00022744852707468302, + "loss": 0.0192, "step": 95870 }, { - "epoch": 1.04, - "learning_rate": 0.0001445222805993384, - "loss": 0.0119, + "epoch": 0.48, + "learning_rate": 0.00022744095938166903, + "loss": 0.0165, "step": 95880 }, { - "epoch": 1.04, - "learning_rate": 0.00014450606473373546, - "loss": 0.0101, + "epoch": 0.48, + "learning_rate": 0.000227433391688655, + "loss": 0.0162, "step": 95890 }, { - "epoch": 1.04, - "learning_rate": 0.00014448984886813258, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.000227425823995641, + "loss": 0.0163, "step": 95900 }, { - "epoch": 1.04, - "learning_rate": 0.00014447363300252965, - "loss": 0.015, + "epoch": 0.48, + "learning_rate": 0.000227418256302627, + "loss": 0.0139, "step": 95910 }, { - "epoch": 1.04, - "learning_rate": 0.00014445741713692677, - "loss": 0.014, + "epoch": 0.48, + "learning_rate": 0.00022741068860961298, + "loss": 0.0175, "step": 95920 }, { - "epoch": 1.04, - "learning_rate": 0.00014444120127132383, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022740312091659896, + "loss": 0.0179, "step": 95930 }, { - "epoch": 1.04, - "learning_rate": 0.00014442498540572095, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.00022739555322358497, + "loss": 0.0145, "step": 95940 }, { - "epoch": 1.04, - "learning_rate": 0.00014440876954011805, - "loss": 0.0112, + "epoch": 0.48, + "learning_rate": 0.00022738798553057095, + "loss": 0.0156, "step": 95950 }, { - "epoch": 1.04, - "learning_rate": 0.00014439255367451514, - "loss": 0.0104, + "epoch": 0.48, + "learning_rate": 0.00022738041783755693, + "loss": 0.0186, "step": 95960 }, { - "epoch": 1.04, - "learning_rate": 0.00014437633780891223, - "loss": 0.0122, + "epoch": 0.48, + "learning_rate": 0.00022737285014454292, + "loss": 0.0191, "step": 95970 }, { - "epoch": 1.04, - "learning_rate": 0.00014436012194330933, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.00022736528245152892, + "loss": 0.0161, "step": 95980 }, { - "epoch": 1.04, - "learning_rate": 0.00014434390607770642, - "loss": 0.0094, + "epoch": 0.48, + "learning_rate": 0.0002273577147585149, + "loss": 0.0155, "step": 95990 }, { - "epoch": 1.04, - "learning_rate": 0.0001443276902121035, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.0002273501470655009, + "loss": 0.0244, "step": 96000 }, { - "epoch": 1.04, - "eval_cer": 0.9215503867888964, - "eval_loss": 0.008839464746415615, - "eval_runtime": 121.6744, - "eval_samples_per_second": 16.437, - "eval_steps_per_second": 4.109, + "epoch": 0.48, + "eval_cer": 0.9144906342217957, + "eval_loss": 0.011497566476464272, + "eval_runtime": 116.7865, + "eval_samples_per_second": 17.125, + "eval_steps_per_second": 4.281, "step": 96000 }, { - "epoch": 1.04, - "learning_rate": 0.0001443114743465006, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.0002273425793724869, + "loss": 0.0185, "step": 96010 }, { - "epoch": 1.04, - "learning_rate": 0.0001442952584808977, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.00022733501167947288, + "loss": 0.0161, "step": 96020 }, { - "epoch": 1.04, - "learning_rate": 0.0001442790426152948, - "loss": 0.0094, + "epoch": 0.48, + "learning_rate": 0.00022732744398645886, + "loss": 0.0142, "step": 96030 }, { - "epoch": 1.04, - "learning_rate": 0.00014426282674969188, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022731987629344487, + "loss": 0.0165, "step": 96040 }, { - "epoch": 1.04, - "learning_rate": 0.00014424661088408897, - "loss": 0.0102, + "epoch": 0.48, + "learning_rate": 0.00022731230860043085, + "loss": 0.0148, "step": 96050 }, { - "epoch": 1.04, - "learning_rate": 0.00014423039501848607, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022730474090741683, + "loss": 0.0147, "step": 96060 }, { - "epoch": 1.04, - "learning_rate": 0.00014421417915288316, - "loss": 0.0083, + "epoch": 0.48, + "learning_rate": 0.00022729717321440284, + "loss": 0.0204, "step": 96070 }, { - "epoch": 1.04, - "learning_rate": 0.00014419796328728025, - "loss": 0.0118, + "epoch": 0.48, + "learning_rate": 0.00022728960552138882, + "loss": 0.0153, "step": 96080 }, { - "epoch": 1.04, - "learning_rate": 0.00014418174742167735, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.0002272820378283748, + "loss": 0.0146, "step": 96090 }, { - "epoch": 1.04, - "learning_rate": 0.00014416553155607447, - "loss": 0.0147, + "epoch": 0.48, + "learning_rate": 0.0002272744701353608, + "loss": 0.0183, "step": 96100 }, { - "epoch": 1.04, - "learning_rate": 0.00014414931569047153, - "loss": 0.0123, + "epoch": 0.48, + "learning_rate": 0.0002272669024423468, + "loss": 0.0193, "step": 96110 }, { - "epoch": 1.04, - "learning_rate": 0.00014413309982486865, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022725933474933277, + "loss": 0.0197, "step": 96120 }, { - "epoch": 1.04, - "learning_rate": 0.00014411688395926572, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022725176705631875, + "loss": 0.0213, "step": 96130 }, { - "epoch": 1.04, - "learning_rate": 0.00014410066809366284, - "loss": 0.0119, + "epoch": 0.49, + "learning_rate": 0.00022724419936330476, + "loss": 0.015, "step": 96140 }, { - "epoch": 1.04, - "learning_rate": 0.0001440844522280599, - "loss": 0.0094, + "epoch": 0.49, + "learning_rate": 0.00022723663167029074, + "loss": 0.0164, "step": 96150 }, { - "epoch": 1.04, - "learning_rate": 0.00014406823636245702, - "loss": 0.0127, + "epoch": 0.49, + "learning_rate": 0.0002272290639772767, + "loss": 0.0148, "step": 96160 }, { - "epoch": 1.04, - "learning_rate": 0.00014405202049685411, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.0002272214962842627, + "loss": 0.0158, "step": 96170 }, { - "epoch": 1.04, - "learning_rate": 0.0001440358046312512, - "loss": 0.0095, + "epoch": 0.49, + "learning_rate": 0.0002272139285912487, + "loss": 0.0164, "step": 96180 }, { - "epoch": 1.04, - "learning_rate": 0.0001440195887656483, - "loss": 0.0082, + "epoch": 0.49, + "learning_rate": 0.00022720636089823467, + "loss": 0.0181, "step": 96190 }, { - "epoch": 1.04, - "learning_rate": 0.0001440033729000454, - "loss": 0.0129, + "epoch": 0.49, + "learning_rate": 0.00022719879320522065, + "loss": 0.0146, "step": 96200 }, { - "epoch": 1.04, - "learning_rate": 0.00014398715703444249, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.00022719122551220666, + "loss": 0.0146, "step": 96210 }, { - "epoch": 1.04, - "learning_rate": 0.00014397094116883958, - "loss": 0.0094, + "epoch": 0.49, + "learning_rate": 0.00022718365781919264, + "loss": 0.0197, "step": 96220 }, { - "epoch": 1.04, - "learning_rate": 0.00014395472530323667, - "loss": 0.0094, + "epoch": 0.49, + "learning_rate": 0.00022717609012617862, + "loss": 0.0201, "step": 96230 }, { - "epoch": 1.04, - "learning_rate": 0.00014393850943763376, - "loss": 0.0132, + "epoch": 0.49, + "learning_rate": 0.00022716852243316463, + "loss": 0.0176, "step": 96240 }, { - "epoch": 1.04, - "learning_rate": 0.00014392229357203086, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.0002271609547401506, + "loss": 0.017, "step": 96250 }, { - "epoch": 1.04, - "learning_rate": 0.00014390607770642795, - "loss": 0.0138, + "epoch": 0.49, + "learning_rate": 0.0002271533870471366, + "loss": 0.0186, "step": 96260 }, { - "epoch": 1.04, - "learning_rate": 0.00014388986184082504, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.0002271458193541226, + "loss": 0.0141, "step": 96270 }, { - "epoch": 1.04, - "learning_rate": 0.00014387364597522213, - "loss": 0.0126, + "epoch": 0.49, + "learning_rate": 0.00022713825166110858, + "loss": 0.0153, "step": 96280 }, { - "epoch": 1.04, - "learning_rate": 0.00014385743010961923, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.00022713068396809457, + "loss": 0.0153, "step": 96290 }, { - "epoch": 1.04, - "learning_rate": 0.00014384121424401635, - "loss": 0.0116, + "epoch": 0.49, + "learning_rate": 0.00022712311627508057, + "loss": 0.013, "step": 96300 }, { - "epoch": 1.04, - "learning_rate": 0.0001438249983784134, - "loss": 0.0116, + "epoch": 0.49, + "learning_rate": 0.00022711554858206656, + "loss": 0.0132, "step": 96310 }, { - "epoch": 1.04, - "learning_rate": 0.00014380878251281053, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.00022710798088905254, + "loss": 0.0177, "step": 96320 }, { - "epoch": 1.04, - "learning_rate": 0.0001437925666472076, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.00022710041319603855, + "loss": 0.017, "step": 96330 }, { - "epoch": 1.04, - "learning_rate": 0.00014377635078160472, - "loss": 0.0122, + "epoch": 0.49, + "learning_rate": 0.00022709284550302453, + "loss": 0.0189, "step": 96340 }, { - "epoch": 1.04, - "learning_rate": 0.00014376013491600178, - "loss": 0.0089, + "epoch": 0.49, + "learning_rate": 0.0002270852778100105, + "loss": 0.0149, "step": 96350 }, { - "epoch": 1.04, - "learning_rate": 0.0001437439190503989, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.0002270777101169965, + "loss": 0.0176, "step": 96360 }, { - "epoch": 1.04, - "learning_rate": 0.000143727703184796, - "loss": 0.0124, + "epoch": 0.49, + "learning_rate": 0.0002270701424239825, + "loss": 0.0188, "step": 96370 }, { - "epoch": 1.04, - "learning_rate": 0.0001437114873191931, - "loss": 0.013, + "epoch": 0.49, + "learning_rate": 0.00022706257473096848, + "loss": 0.0173, "step": 96380 }, { - "epoch": 1.04, - "learning_rate": 0.00014369527145359018, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.00022705500703795446, + "loss": 0.016, "step": 96390 }, { - "epoch": 1.04, - "learning_rate": 0.00014367905558798727, - "loss": 0.0126, + "epoch": 0.49, + "learning_rate": 0.00022704743934494047, + "loss": 0.0153, "step": 96400 }, { - "epoch": 1.04, - "learning_rate": 0.00014366283972238437, - "loss": 0.0121, + "epoch": 0.49, + "learning_rate": 0.00022703987165192645, + "loss": 0.0158, "step": 96410 }, { - "epoch": 1.04, - "learning_rate": 0.00014364662385678146, - "loss": 0.0118, + "epoch": 0.49, + "learning_rate": 0.00022703230395891243, + "loss": 0.0153, "step": 96420 }, { - "epoch": 1.04, - "learning_rate": 0.00014363040799117855, - "loss": 0.0091, + "epoch": 0.49, + "learning_rate": 0.00022702473626589844, + "loss": 0.0166, "step": 96430 }, { - "epoch": 1.04, - "learning_rate": 0.00014361419212557565, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.00022701716857288442, + "loss": 0.0172, "step": 96440 }, { - "epoch": 1.04, - "learning_rate": 0.00014359797625997277, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.0002270096008798704, + "loss": 0.0163, "step": 96450 }, { - "epoch": 1.04, - "learning_rate": 0.00014358176039436983, - "loss": 0.0097, + "epoch": 0.49, + "learning_rate": 0.0002270020331868564, + "loss": 0.0169, "step": 96460 }, { - "epoch": 1.04, - "learning_rate": 0.00014356554452876695, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.0002269944654938424, + "loss": 0.0123, "step": 96470 }, { - "epoch": 1.04, - "learning_rate": 0.00014354932866316402, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022698689780082838, + "loss": 0.0148, "step": 96480 }, { - "epoch": 1.04, - "learning_rate": 0.00014353311279756114, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.00022697933010781438, + "loss": 0.0138, "step": 96490 }, { - "epoch": 1.04, - "learning_rate": 0.0001435168969319582, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.00022697176241480037, + "loss": 0.0142, "step": 96500 }, { - "epoch": 1.04, - "learning_rate": 0.00014350068106635532, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.00022696419472178635, + "loss": 0.0183, "step": 96510 }, { - "epoch": 1.04, - "learning_rate": 0.00014348446520075241, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.00022695662702877233, + "loss": 0.0156, "step": 96520 }, { - "epoch": 1.04, - "learning_rate": 0.0001434682493351495, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.00022694905933575834, + "loss": 0.0164, "step": 96530 }, { - "epoch": 1.04, - "learning_rate": 0.0001434520334695466, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022694149164274432, + "loss": 0.0202, "step": 96540 }, { - "epoch": 1.04, - "learning_rate": 0.0001434358176039437, - "loss": 0.0133, + "epoch": 0.49, + "learning_rate": 0.0002269339239497303, + "loss": 0.0155, "step": 96550 }, { - "epoch": 1.04, - "learning_rate": 0.00014341960173834079, - "loss": 0.0093, + "epoch": 0.49, + "learning_rate": 0.0002269263562567163, + "loss": 0.0146, "step": 96560 }, { - "epoch": 1.04, - "learning_rate": 0.00014340338587273788, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.0002269187885637023, + "loss": 0.0142, "step": 96570 }, { - "epoch": 1.04, - "learning_rate": 0.00014338717000713497, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022691122087068827, + "loss": 0.0137, "step": 96580 }, { - "epoch": 1.04, - "learning_rate": 0.00014337095414153206, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022690365317767428, + "loss": 0.0171, "step": 96590 }, { - "epoch": 1.04, - "learning_rate": 0.00014335473827592916, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.00022689608548466026, + "loss": 0.0173, "step": 96600 }, { - "epoch": 1.04, - "learning_rate": 0.00014333852241032625, - "loss": 0.0095, + "epoch": 0.49, + "learning_rate": 0.00022688851779164624, + "loss": 0.0161, "step": 96610 }, { - "epoch": 1.04, - "learning_rate": 0.00014332230654472334, - "loss": 0.012, + "epoch": 0.49, + "learning_rate": 0.00022688095009863225, + "loss": 0.0156, "step": 96620 }, { - "epoch": 1.04, - "learning_rate": 0.00014330609067912044, - "loss": 0.0142, + "epoch": 0.49, + "learning_rate": 0.00022687338240561823, + "loss": 0.0162, "step": 96630 }, { - "epoch": 1.04, - "learning_rate": 0.00014328987481351753, - "loss": 0.0132, + "epoch": 0.49, + "learning_rate": 0.00022686581471260421, + "loss": 0.0169, "step": 96640 }, { - "epoch": 1.04, - "learning_rate": 0.00014327365894791462, - "loss": 0.0085, + "epoch": 0.49, + "learning_rate": 0.00022685824701959022, + "loss": 0.0116, "step": 96650 }, { - "epoch": 1.04, - "learning_rate": 0.0001432574430823117, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.0002268506793265762, + "loss": 0.0159, "step": 96660 }, { - "epoch": 1.05, - "learning_rate": 0.00014324122721670883, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022684311163356219, + "loss": 0.014, "step": 96670 }, { - "epoch": 1.05, - "learning_rate": 0.0001432250113511059, - "loss": 0.0121, + "epoch": 0.49, + "learning_rate": 0.0002268355439405482, + "loss": 0.0166, "step": 96680 }, { - "epoch": 1.05, - "learning_rate": 0.00014320879548550302, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.00022682797624753418, + "loss": 0.0157, "step": 96690 }, { - "epoch": 1.05, - "learning_rate": 0.00014319257961990008, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.00022682040855452016, + "loss": 0.0149, "step": 96700 }, { - "epoch": 1.05, - "learning_rate": 0.0001431763637542972, - "loss": 0.0095, + "epoch": 0.49, + "learning_rate": 0.00022681284086150614, + "loss": 0.0144, "step": 96710 }, { - "epoch": 1.05, - "learning_rate": 0.00014316014788869427, - "loss": 0.0083, + "epoch": 0.49, + "learning_rate": 0.00022680527316849215, + "loss": 0.0157, "step": 96720 }, { - "epoch": 1.05, - "learning_rate": 0.0001431439320230914, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.00022679770547547813, + "loss": 0.0143, "step": 96730 }, { - "epoch": 1.05, - "learning_rate": 0.00014312771615748848, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.0002267901377824641, + "loss": 0.0199, "step": 96740 }, { - "epoch": 1.05, - "learning_rate": 0.00014311150029188558, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.00022678257008945012, + "loss": 0.0149, "step": 96750 }, { - "epoch": 1.05, - "learning_rate": 0.00014309528442628267, - "loss": 0.0091, + "epoch": 0.49, + "learning_rate": 0.0002267750023964361, + "loss": 0.0136, "step": 96760 }, { - "epoch": 1.05, - "learning_rate": 0.00014307906856067976, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.00022676743470342208, + "loss": 0.0176, "step": 96770 }, { - "epoch": 1.05, - "learning_rate": 0.00014306285269507685, - "loss": 0.0118, + "epoch": 0.49, + "learning_rate": 0.0002267598670104081, + "loss": 0.0144, "step": 96780 }, { - "epoch": 1.05, - "learning_rate": 0.00014304663682947395, - "loss": 0.0094, + "epoch": 0.49, + "learning_rate": 0.00022675229931739407, + "loss": 0.0163, "step": 96790 }, { - "epoch": 1.05, - "learning_rate": 0.00014303042096387104, - "loss": 0.0087, + "epoch": 0.49, + "learning_rate": 0.00022674473162438005, + "loss": 0.0152, "step": 96800 }, { - "epoch": 1.05, - "learning_rate": 0.00014301420509826813, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022673716393136606, + "loss": 0.0138, "step": 96810 }, { - "epoch": 1.05, - "learning_rate": 0.00014299798923266522, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022672959623835204, + "loss": 0.0171, "step": 96820 }, { - "epoch": 1.05, - "learning_rate": 0.00014298177336706232, - "loss": 0.0109, + "epoch": 0.49, + "learning_rate": 0.00022672202854533802, + "loss": 0.0184, "step": 96830 }, { - "epoch": 1.05, - "learning_rate": 0.0001429655575014594, - "loss": 0.0134, + "epoch": 0.49, + "learning_rate": 0.00022671446085232403, + "loss": 0.0129, "step": 96840 }, { - "epoch": 1.05, - "learning_rate": 0.0001429493416358565, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022670689315931001, + "loss": 0.0134, "step": 96850 }, { - "epoch": 1.05, - "learning_rate": 0.0001429331257702536, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.000226699325466296, + "loss": 0.0167, "step": 96860 }, { - "epoch": 1.05, - "learning_rate": 0.0001429169099046507, - "loss": 0.0131, + "epoch": 0.49, + "learning_rate": 0.00022669175777328198, + "loss": 0.0128, "step": 96870 }, { - "epoch": 1.05, - "learning_rate": 0.00014290069403904778, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.00022668419008026799, + "loss": 0.0195, "step": 96880 }, { - "epoch": 1.05, - "learning_rate": 0.0001428844781734449, - "loss": 0.0078, + "epoch": 0.49, + "learning_rate": 0.00022667662238725397, + "loss": 0.0161, "step": 96890 }, { - "epoch": 1.05, - "learning_rate": 0.00014286826230784197, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.00022666905469423995, + "loss": 0.0183, "step": 96900 }, { - "epoch": 1.05, - "learning_rate": 0.00014285204644223909, - "loss": 0.0086, + "epoch": 0.49, + "learning_rate": 0.00022666148700122596, + "loss": 0.0137, "step": 96910 }, { - "epoch": 1.05, - "learning_rate": 0.00014283583057663615, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.00022665391930821194, + "loss": 0.0152, "step": 96920 }, { - "epoch": 1.05, - "learning_rate": 0.00014281961471103327, - "loss": 0.0126, + "epoch": 0.49, + "learning_rate": 0.00022664635161519792, + "loss": 0.016, "step": 96930 }, { - "epoch": 1.05, - "learning_rate": 0.00014280339884543034, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022663878392218393, + "loss": 0.015, "step": 96940 }, { - "epoch": 1.05, - "learning_rate": 0.00014278718297982746, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.0002266312162291699, + "loss": 0.0149, "step": 96950 }, { - "epoch": 1.05, - "learning_rate": 0.00014277096711422455, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.0002266236485361559, + "loss": 0.0227, "step": 96960 }, { - "epoch": 1.05, - "learning_rate": 0.00014275475124862164, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.0002266160808431419, + "loss": 0.0148, "step": 96970 }, { - "epoch": 1.05, - "learning_rate": 0.00014273853538301874, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.00022660851315012788, + "loss": 0.0175, "step": 96980 }, { - "epoch": 1.05, - "learning_rate": 0.00014272231951741583, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.00022660094545711386, + "loss": 0.015, "step": 96990 }, { - "epoch": 1.05, - "learning_rate": 0.00014270610365181292, - "loss": 0.0109, + "epoch": 0.49, + "learning_rate": 0.00022659337776409987, + "loss": 0.0174, "step": 97000 }, { - "epoch": 1.05, - "eval_cer": 0.9215321461268126, - "eval_loss": 0.008719232864677906, - "eval_runtime": 121.1881, - "eval_samples_per_second": 16.503, - "eval_steps_per_second": 4.126, + "epoch": 0.49, + "eval_cer": 0.9144644335264098, + "eval_loss": 0.011374830268323421, + "eval_runtime": 116.7311, + "eval_samples_per_second": 17.133, + "eval_steps_per_second": 4.283, "step": 97000 }, { - "epoch": 1.05, - "learning_rate": 0.00014268988778621001, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022658581007108585, + "loss": 0.015, "step": 97010 }, { - "epoch": 1.05, - "learning_rate": 0.0001426736719206071, - "loss": 0.0122, + "epoch": 0.49, + "learning_rate": 0.00022657824237807183, + "loss": 0.015, "step": 97020 }, { - "epoch": 1.05, - "learning_rate": 0.0001426574560550042, - "loss": 0.0153, + "epoch": 0.49, + "learning_rate": 0.00022657067468505782, + "loss": 0.0158, "step": 97030 }, { - "epoch": 1.05, - "learning_rate": 0.0001426412401894013, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022656310699204382, + "loss": 0.0217, "step": 97040 }, { - "epoch": 1.05, - "learning_rate": 0.00014262502432379838, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.0002265555392990298, + "loss": 0.0149, "step": 97050 }, { - "epoch": 1.05, - "learning_rate": 0.00014260880845819548, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.0002265479716060158, + "loss": 0.0156, "step": 97060 }, { - "epoch": 1.05, - "learning_rate": 0.00014259259259259257, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.0002265404039130018, + "loss": 0.0147, "step": 97070 }, { - "epoch": 1.05, - "learning_rate": 0.00014257637672698966, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.00022653283621998778, + "loss": 0.0138, "step": 97080 }, { - "epoch": 1.05, - "learning_rate": 0.00014256016086138676, - "loss": 0.0097, + "epoch": 0.49, + "learning_rate": 0.00022652526852697376, + "loss": 0.0137, "step": 97090 }, { - "epoch": 1.05, - "learning_rate": 0.00014254394499578385, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.00022651770083395977, + "loss": 0.0159, "step": 97100 }, { - "epoch": 1.05, - "learning_rate": 0.00014252772913018097, - "loss": 0.009, + "epoch": 0.49, + "learning_rate": 0.00022651013314094575, + "loss": 0.0136, "step": 97110 }, { - "epoch": 1.05, - "learning_rate": 0.00014251151326457806, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022650256544793173, + "loss": 0.0191, "step": 97120 }, { - "epoch": 1.05, - "learning_rate": 0.00014249529739897515, - "loss": 0.0093, + "epoch": 0.49, + "learning_rate": 0.00022649499775491774, + "loss": 0.0144, "step": 97130 }, { - "epoch": 1.05, - "learning_rate": 0.00014247908153337225, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.00022648743006190372, + "loss": 0.0108, "step": 97140 }, { - "epoch": 1.05, - "learning_rate": 0.00014246286566776934, - "loss": 0.0151, + "epoch": 0.49, + "learning_rate": 0.0002264798623688897, + "loss": 0.0161, "step": 97150 }, { - "epoch": 1.05, - "learning_rate": 0.00014244664980216643, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.0002264722946758757, + "loss": 0.0153, "step": 97160 }, { - "epoch": 1.05, - "learning_rate": 0.00014243043393656352, - "loss": 0.0143, + "epoch": 0.49, + "learning_rate": 0.0002264647269828617, + "loss": 0.0145, "step": 97170 }, { - "epoch": 1.05, - "learning_rate": 0.00014241421807096062, - "loss": 0.0144, + "epoch": 0.49, + "learning_rate": 0.00022645715928984767, + "loss": 0.0152, "step": 97180 }, { - "epoch": 1.05, - "learning_rate": 0.0001423980022053577, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022644959159683365, + "loss": 0.0168, "step": 97190 }, { - "epoch": 1.05, - "learning_rate": 0.0001423817863397548, - "loss": 0.0094, + "epoch": 0.49, + "learning_rate": 0.00022644202390381966, + "loss": 0.0151, "step": 97200 }, { - "epoch": 1.05, - "learning_rate": 0.0001423655704741519, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.00022643445621080564, + "loss": 0.014, "step": 97210 }, { - "epoch": 1.05, - "learning_rate": 0.000142349354608549, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.00022642688851779163, + "loss": 0.0143, "step": 97220 }, { - "epoch": 1.05, - "learning_rate": 0.00014233313874294608, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022641932082477763, + "loss": 0.0146, "step": 97230 }, { - "epoch": 1.05, - "learning_rate": 0.00014231692287734317, - "loss": 0.0088, + "epoch": 0.49, + "learning_rate": 0.00022641175313176362, + "loss": 0.0161, "step": 97240 }, { - "epoch": 1.05, - "learning_rate": 0.00014230070701174027, - "loss": 0.0124, + "epoch": 0.49, + "learning_rate": 0.0002264041854387496, + "loss": 0.0166, "step": 97250 }, { - "epoch": 1.05, - "learning_rate": 0.00014228449114613739, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.0002263966177457356, + "loss": 0.0162, "step": 97260 }, { - "epoch": 1.05, - "learning_rate": 0.00014226827528053445, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.0002263890500527216, + "loss": 0.0173, "step": 97270 }, { - "epoch": 1.05, - "learning_rate": 0.00014225205941493157, - "loss": 0.0088, + "epoch": 0.49, + "learning_rate": 0.00022638148235970757, + "loss": 0.0171, "step": 97280 }, { - "epoch": 1.05, - "learning_rate": 0.00014223584354932864, - "loss": 0.0134, + "epoch": 0.49, + "learning_rate": 0.00022637391466669358, + "loss": 0.0161, "step": 97290 }, { - "epoch": 1.05, - "learning_rate": 0.00014221962768372576, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.00022636634697367956, + "loss": 0.0176, "step": 97300 }, { - "epoch": 1.05, - "learning_rate": 0.00014220341181812285, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022635877928066554, + "loss": 0.0161, "step": 97310 }, { - "epoch": 1.05, - "learning_rate": 0.00014218719595251994, - "loss": 0.0118, + "epoch": 0.49, + "learning_rate": 0.00022635121158765155, + "loss": 0.0192, "step": 97320 }, { - "epoch": 1.05, - "learning_rate": 0.00014217098008691704, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.00022634364389463753, + "loss": 0.016, "step": 97330 }, { - "epoch": 1.05, - "learning_rate": 0.00014215476422131413, - "loss": 0.0082, + "epoch": 0.49, + "learning_rate": 0.0002263360762016235, + "loss": 0.0149, "step": 97340 }, { - "epoch": 1.05, - "learning_rate": 0.00014213854835571122, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022632850850860952, + "loss": 0.0205, "step": 97350 }, { - "epoch": 1.05, - "learning_rate": 0.00014212233249010831, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.0002263209408155955, + "loss": 0.0146, "step": 97360 }, { - "epoch": 1.05, - "learning_rate": 0.0001421061166245054, - "loss": 0.0095, + "epoch": 0.49, + "learning_rate": 0.00022631337312258148, + "loss": 0.0188, "step": 97370 }, { - "epoch": 1.05, - "learning_rate": 0.0001420899007589025, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.00022630580542956746, + "loss": 0.0165, "step": 97380 }, { - "epoch": 1.05, - "learning_rate": 0.0001420736848932996, - "loss": 0.0118, + "epoch": 0.49, + "learning_rate": 0.00022629823773655347, + "loss": 0.0168, "step": 97390 }, { - "epoch": 1.05, - "learning_rate": 0.00014205746902769668, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.00022629067004353945, + "loss": 0.0132, "step": 97400 }, { - "epoch": 1.05, - "learning_rate": 0.00014204125316209378, - "loss": 0.0089, + "epoch": 0.49, + "learning_rate": 0.0002262831023505254, + "loss": 0.0175, "step": 97410 }, { - "epoch": 1.05, - "learning_rate": 0.00014202503729649087, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.0002262755346575114, + "loss": 0.0175, "step": 97420 }, { - "epoch": 1.05, - "learning_rate": 0.00014200882143088796, - "loss": 0.0132, + "epoch": 0.49, + "learning_rate": 0.0002262679669644974, + "loss": 0.0176, "step": 97430 }, { - "epoch": 1.05, - "learning_rate": 0.00014199260556528506, - "loss": 0.0132, + "epoch": 0.49, + "learning_rate": 0.00022626039927148338, + "loss": 0.0171, "step": 97440 }, { - "epoch": 1.05, - "learning_rate": 0.00014197638969968215, - "loss": 0.0127, + "epoch": 0.49, + "learning_rate": 0.00022625283157846936, + "loss": 0.0173, "step": 97450 }, { - "epoch": 1.05, - "learning_rate": 0.00014196017383407927, - "loss": 0.0116, + "epoch": 0.49, + "learning_rate": 0.00022624526388545537, + "loss": 0.0154, "step": 97460 }, { - "epoch": 1.05, - "learning_rate": 0.00014194395796847633, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.00022623769619244135, + "loss": 0.0131, "step": 97470 }, { - "epoch": 1.05, - "learning_rate": 0.00014192774210287345, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022623012849942733, + "loss": 0.0161, "step": 97480 }, { - "epoch": 1.05, - "learning_rate": 0.00014191152623727052, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.00022622256080641334, + "loss": 0.0154, "step": 97490 }, { - "epoch": 1.05, - "learning_rate": 0.00014189531037166764, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022621499311339932, + "loss": 0.0146, "step": 97500 }, { - "epoch": 1.05, - "learning_rate": 0.0001418790945060647, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.0002262074254203853, + "loss": 0.0161, "step": 97510 }, { - "epoch": 1.05, - "learning_rate": 0.00014186287864046182, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.0002261998577273713, + "loss": 0.0156, "step": 97520 }, { - "epoch": 1.05, - "learning_rate": 0.00014184666277485892, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.0002261922900343573, + "loss": 0.0162, "step": 97530 }, { - "epoch": 1.05, - "learning_rate": 0.000141830446909256, - "loss": 0.0118, + "epoch": 0.49, + "learning_rate": 0.00022618472234134328, + "loss": 0.0156, "step": 97540 }, { - "epoch": 1.05, - "learning_rate": 0.0001418142310436531, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022617715464832928, + "loss": 0.0154, "step": 97550 }, { - "epoch": 1.05, - "learning_rate": 0.0001417980151780502, - "loss": 0.0091, + "epoch": 0.49, + "learning_rate": 0.00022616958695531527, + "loss": 0.0147, "step": 97560 }, { - "epoch": 1.05, - "learning_rate": 0.0001417817993124473, - "loss": 0.0097, + "epoch": 0.49, + "learning_rate": 0.00022616201926230125, + "loss": 0.0186, "step": 97570 }, { - "epoch": 1.05, - "learning_rate": 0.00014176558344684438, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022615445156928726, + "loss": 0.0147, "step": 97580 }, { - "epoch": 1.05, - "learning_rate": 0.00014174936758124147, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022614688387627324, + "loss": 0.0153, "step": 97590 }, { - "epoch": 1.06, - "learning_rate": 0.00014173315171563857, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.00022613931618325922, + "loss": 0.0165, "step": 97600 }, { - "epoch": 1.06, - "learning_rate": 0.00014171693585003566, - "loss": 0.0116, + "epoch": 0.49, + "learning_rate": 0.0002261317484902452, + "loss": 0.0112, "step": 97610 }, { - "epoch": 1.06, - "learning_rate": 0.00014170071998443275, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.0002261241807972312, + "loss": 0.014, "step": 97620 }, { - "epoch": 1.06, - "learning_rate": 0.00014168450411882985, - "loss": 0.0082, + "epoch": 0.49, + "learning_rate": 0.0002261166131042172, + "loss": 0.015, "step": 97630 }, { - "epoch": 1.06, - "learning_rate": 0.00014166828825322694, - "loss": 0.0118, + "epoch": 0.49, + "learning_rate": 0.00022610904541120317, + "loss": 0.0125, "step": 97640 }, { - "epoch": 1.06, - "learning_rate": 0.00014165207238762403, - "loss": 0.008, + "epoch": 0.49, + "learning_rate": 0.00022610147771818918, + "loss": 0.0181, "step": 97650 }, { - "epoch": 1.06, - "learning_rate": 0.00014163585652202112, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.00022609391002517516, + "loss": 0.0149, "step": 97660 }, { - "epoch": 1.06, - "learning_rate": 0.00014161964065641822, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.00022608634233216114, + "loss": 0.0154, "step": 97670 }, { - "epoch": 1.06, - "learning_rate": 0.00014160342479081534, - "loss": 0.0128, + "epoch": 0.49, + "learning_rate": 0.00022607877463914715, + "loss": 0.0148, "step": 97680 }, { - "epoch": 1.06, - "learning_rate": 0.0001415872089252124, - "loss": 0.0089, + "epoch": 0.49, + "learning_rate": 0.00022607120694613313, + "loss": 0.0171, "step": 97690 }, { - "epoch": 1.06, - "learning_rate": 0.00014157099305960952, - "loss": 0.0109, + "epoch": 0.49, + "learning_rate": 0.00022606363925311911, + "loss": 0.0166, "step": 97700 }, { - "epoch": 1.06, - "learning_rate": 0.0001415547771940066, - "loss": 0.0095, + "epoch": 0.49, + "learning_rate": 0.00022605607156010512, + "loss": 0.0154, "step": 97710 }, { - "epoch": 1.06, - "learning_rate": 0.0001415385613284037, - "loss": 0.0093, + "epoch": 0.49, + "learning_rate": 0.0002260485038670911, + "loss": 0.0138, "step": 97720 }, { - "epoch": 1.06, - "learning_rate": 0.00014152234546280077, - "loss": 0.012, + "epoch": 0.49, + "learning_rate": 0.00022604093617407709, + "loss": 0.0142, "step": 97730 }, { - "epoch": 1.06, - "learning_rate": 0.0001415061295971979, - "loss": 0.0119, + "epoch": 0.49, + "learning_rate": 0.0002260333684810631, + "loss": 0.0158, "step": 97740 }, { - "epoch": 1.06, - "learning_rate": 0.00014148991373159499, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.00022602580078804908, + "loss": 0.0166, "step": 97750 }, { - "epoch": 1.06, - "learning_rate": 0.00014147369786599208, - "loss": 0.0091, + "epoch": 0.49, + "learning_rate": 0.00022601823309503506, + "loss": 0.0156, "step": 97760 }, { - "epoch": 1.06, - "learning_rate": 0.00014145748200038917, - "loss": 0.0078, + "epoch": 0.49, + "learning_rate": 0.00022601066540202104, + "loss": 0.0197, "step": 97770 }, { - "epoch": 1.06, - "learning_rate": 0.00014144126613478626, - "loss": 0.0089, + "epoch": 0.49, + "learning_rate": 0.00022600309770900705, + "loss": 0.0141, "step": 97780 }, { - "epoch": 1.06, - "learning_rate": 0.00014142505026918336, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022599553001599303, + "loss": 0.0131, "step": 97790 }, { - "epoch": 1.06, - "learning_rate": 0.00014140883440358045, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.000225987962322979, + "loss": 0.0169, "step": 97800 }, { - "epoch": 1.06, - "learning_rate": 0.00014139261853797754, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.00022598039462996502, + "loss": 0.0127, "step": 97810 }, { - "epoch": 1.06, - "learning_rate": 0.00014137640267237463, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.000225972826936951, + "loss": 0.0176, "step": 97820 }, { - "epoch": 1.06, - "learning_rate": 0.00014136018680677175, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.00022596525924393698, + "loss": 0.0144, "step": 97830 }, { - "epoch": 1.06, - "learning_rate": 0.00014134397094116882, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.000225957691550923, + "loss": 0.0178, "step": 97840 }, { - "epoch": 1.06, - "learning_rate": 0.00014132775507556594, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.00022595012385790897, + "loss": 0.0165, "step": 97850 }, { - "epoch": 1.06, - "learning_rate": 0.000141311539209963, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022594255616489495, + "loss": 0.0182, "step": 97860 }, { - "epoch": 1.06, - "learning_rate": 0.00014129532334436013, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.00022593498847188096, + "loss": 0.0152, "step": 97870 }, { - "epoch": 1.06, - "learning_rate": 0.0001412791074787572, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022592742077886694, + "loss": 0.0165, "step": 97880 }, { - "epoch": 1.06, - "learning_rate": 0.0001412628916131543, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.00022591985308585292, + "loss": 0.0179, "step": 97890 }, { - "epoch": 1.06, - "learning_rate": 0.0001412466757475514, - "loss": 0.0124, + "epoch": 0.49, + "learning_rate": 0.00022591228539283893, + "loss": 0.0192, "step": 97900 }, { - "epoch": 1.06, - "learning_rate": 0.0001412304598819485, - "loss": 0.0074, + "epoch": 0.49, + "learning_rate": 0.00022590471769982491, + "loss": 0.0176, "step": 97910 }, { - "epoch": 1.06, - "learning_rate": 0.0001412142440163456, - "loss": 0.0093, + "epoch": 0.49, + "learning_rate": 0.0002258971500068109, + "loss": 0.0158, "step": 97920 }, { - "epoch": 1.06, - "learning_rate": 0.00014119802815074268, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.00022588958231379688, + "loss": 0.0187, "step": 97930 }, { - "epoch": 1.06, - "learning_rate": 0.00014118181228513977, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022588201462078289, + "loss": 0.0178, "step": 97940 }, { - "epoch": 1.06, - "learning_rate": 0.00014116559641953687, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.00022587444692776887, + "loss": 0.02, "step": 97950 }, { - "epoch": 1.06, - "learning_rate": 0.00014114938055393396, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.00022586687923475485, + "loss": 0.0153, "step": 97960 }, { - "epoch": 1.06, - "learning_rate": 0.00014113316468833105, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.00022585931154174086, + "loss": 0.0165, "step": 97970 }, { - "epoch": 1.06, - "learning_rate": 0.00014111694882272815, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.00022585174384872684, + "loss": 0.0226, "step": 97980 }, { - "epoch": 1.06, - "learning_rate": 0.00014110073295712524, - "loss": 0.0099, + "epoch": 0.49, + "learning_rate": 0.00022584417615571282, + "loss": 0.016, "step": 97990 }, { - "epoch": 1.06, - "learning_rate": 0.00014108451709152233, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022583660846269883, + "loss": 0.0241, "step": 98000 }, { - "epoch": 1.06, - "eval_cer": 0.9215616786273294, - "eval_loss": 0.008956007659435272, - "eval_runtime": 121.1479, - "eval_samples_per_second": 16.509, - "eval_steps_per_second": 4.127, + "epoch": 0.49, + "eval_cer": 0.9144799598644162, + "eval_loss": 0.011652790941298008, + "eval_runtime": 116.7303, + "eval_samples_per_second": 17.134, + "eval_steps_per_second": 4.283, "step": 98000 }, { - "epoch": 1.06, - "learning_rate": 0.00014106830122591942, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.0002258290407696848, + "loss": 0.0164, "step": 98010 }, { - "epoch": 1.06, - "learning_rate": 0.00014105208536031652, - "loss": 0.0076, + "epoch": 0.49, + "learning_rate": 0.0002258214730766708, + "loss": 0.0178, "step": 98020 }, { - "epoch": 1.06, - "learning_rate": 0.0001410358694947136, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.0002258139053836568, + "loss": 0.0155, "step": 98030 }, { - "epoch": 1.06, - "learning_rate": 0.0001410196536291107, - "loss": 0.0089, + "epoch": 0.49, + "learning_rate": 0.00022580633769064278, + "loss": 0.0136, "step": 98040 }, { - "epoch": 1.06, - "learning_rate": 0.00014100343776350782, - "loss": 0.0126, + "epoch": 0.49, + "learning_rate": 0.00022579876999762876, + "loss": 0.016, "step": 98050 }, { - "epoch": 1.06, - "learning_rate": 0.0001409872218979049, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022579120230461477, + "loss": 0.0171, "step": 98060 }, { - "epoch": 1.06, - "learning_rate": 0.000140971006032302, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022578363461160075, + "loss": 0.0166, "step": 98070 }, { - "epoch": 1.06, - "learning_rate": 0.00014095479016669907, - "loss": 0.0099, + "epoch": 0.49, + "learning_rate": 0.00022577606691858673, + "loss": 0.0158, "step": 98080 }, { - "epoch": 1.06, - "learning_rate": 0.0001409385743010962, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.00022576849922557272, + "loss": 0.0232, "step": 98090 }, { - "epoch": 1.06, - "learning_rate": 0.00014092235843549326, - "loss": 0.009, + "epoch": 0.49, + "learning_rate": 0.00022576093153255872, + "loss": 0.0201, "step": 98100 }, { - "epoch": 1.06, - "learning_rate": 0.00014090614256989038, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.0002257533638395447, + "loss": 0.0174, "step": 98110 }, { - "epoch": 1.06, - "learning_rate": 0.00014088992670428747, - "loss": 0.0098, + "epoch": 0.5, + "learning_rate": 0.0002257457961465307, + "loss": 0.0155, "step": 98120 }, { - "epoch": 1.06, - "learning_rate": 0.00014087371083868456, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.0002257382284535167, + "loss": 0.0171, "step": 98130 }, { - "epoch": 1.06, - "learning_rate": 0.00014085749497308166, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022573066076050268, + "loss": 0.0146, "step": 98140 }, { - "epoch": 1.06, - "learning_rate": 0.00014084127910747875, - "loss": 0.0082, + "epoch": 0.5, + "learning_rate": 0.00022572309306748866, + "loss": 0.019, "step": 98150 }, { - "epoch": 1.06, - "learning_rate": 0.00014082506324187584, - "loss": 0.0133, + "epoch": 0.5, + "learning_rate": 0.00022571552537447467, + "loss": 0.0157, "step": 98160 }, { - "epoch": 1.06, - "learning_rate": 0.00014080884737627293, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.00022570795768146065, + "loss": 0.0203, "step": 98170 }, { - "epoch": 1.06, - "learning_rate": 0.00014079263151067003, - "loss": 0.0114, + "epoch": 0.5, + "learning_rate": 0.00022570038998844663, + "loss": 0.0153, "step": 98180 }, { - "epoch": 1.06, - "learning_rate": 0.00014077641564506712, - "loss": 0.0087, + "epoch": 0.5, + "learning_rate": 0.00022569282229543264, + "loss": 0.0159, "step": 98190 }, { - "epoch": 1.06, - "learning_rate": 0.0001407601997794642, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.00022568525460241862, + "loss": 0.0148, "step": 98200 }, { - "epoch": 1.06, - "learning_rate": 0.0001407439839138613, - "loss": 0.0127, + "epoch": 0.5, + "learning_rate": 0.0002256776869094046, + "loss": 0.0161, "step": 98210 }, { - "epoch": 1.06, - "learning_rate": 0.0001407277680482584, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.0002256701192163906, + "loss": 0.0164, "step": 98220 }, { - "epoch": 1.06, - "learning_rate": 0.0001407115521826555, - "loss": 0.0089, + "epoch": 0.5, + "learning_rate": 0.0002256625515233766, + "loss": 0.0165, "step": 98230 }, { - "epoch": 1.06, - "learning_rate": 0.00014069533631705258, - "loss": 0.0084, + "epoch": 0.5, + "learning_rate": 0.00022565498383036257, + "loss": 0.014, "step": 98240 }, { - "epoch": 1.06, - "learning_rate": 0.00014067912045144968, - "loss": 0.0085, + "epoch": 0.5, + "learning_rate": 0.00022564741613734858, + "loss": 0.0178, "step": 98250 }, { - "epoch": 1.06, - "learning_rate": 0.00014066290458584677, - "loss": 0.0092, + "epoch": 0.5, + "learning_rate": 0.00022563984844433456, + "loss": 0.0131, "step": 98260 }, { - "epoch": 1.06, - "learning_rate": 0.0001406466887202439, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.00022563228075132055, + "loss": 0.0209, "step": 98270 }, { - "epoch": 1.06, - "learning_rate": 0.00014063047285464095, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.00022562471305830653, + "loss": 0.0115, "step": 98280 }, { - "epoch": 1.06, - "learning_rate": 0.00014061425698903807, - "loss": 0.0086, + "epoch": 0.5, + "learning_rate": 0.00022561714536529253, + "loss": 0.0183, "step": 98290 }, { - "epoch": 1.06, - "learning_rate": 0.00014059804112343514, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.00022560957767227852, + "loss": 0.0143, "step": 98300 }, { - "epoch": 1.06, - "learning_rate": 0.00014058182525783226, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.0002256020099792645, + "loss": 0.015, "step": 98310 }, { - "epoch": 1.06, - "learning_rate": 0.00014056560939222933, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.0002255944422862505, + "loss": 0.0122, "step": 98320 }, { - "epoch": 1.06, - "learning_rate": 0.00014054939352662645, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.0002255868745932365, + "loss": 0.0149, "step": 98330 }, { - "epoch": 1.06, - "learning_rate": 0.00014053317766102354, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.00022557930690022247, + "loss": 0.0157, "step": 98340 }, { - "epoch": 1.06, - "learning_rate": 0.00014051696179542063, - "loss": 0.0148, + "epoch": 0.5, + "learning_rate": 0.00022557173920720848, + "loss": 0.0168, "step": 98350 }, { - "epoch": 1.06, - "learning_rate": 0.00014050074592981772, - "loss": 0.0129, + "epoch": 0.5, + "learning_rate": 0.00022556417151419446, + "loss": 0.0139, "step": 98360 }, { - "epoch": 1.06, - "learning_rate": 0.00014048453006421482, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.00022555660382118044, + "loss": 0.0133, "step": 98370 }, { - "epoch": 1.06, - "learning_rate": 0.0001404683141986119, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022554903612816645, + "loss": 0.0243, "step": 98380 }, { - "epoch": 1.06, - "learning_rate": 0.000140452098333009, - "loss": 0.0129, + "epoch": 0.5, + "learning_rate": 0.00022554146843515243, + "loss": 0.0139, "step": 98390 }, { - "epoch": 1.06, - "learning_rate": 0.0001404358824674061, - "loss": 0.0128, + "epoch": 0.5, + "learning_rate": 0.0002255339007421384, + "loss": 0.0148, "step": 98400 }, { - "epoch": 1.06, - "learning_rate": 0.0001404196666018032, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.00022552633304912442, + "loss": 0.0178, "step": 98410 }, { - "epoch": 1.06, - "learning_rate": 0.00014040345073620028, - "loss": 0.0147, + "epoch": 0.5, + "learning_rate": 0.0002255187653561104, + "loss": 0.015, "step": 98420 }, { - "epoch": 1.06, - "learning_rate": 0.00014038723487059737, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022551119766309638, + "loss": 0.0176, "step": 98430 }, { - "epoch": 1.06, - "learning_rate": 0.00014037101900499447, - "loss": 0.0148, + "epoch": 0.5, + "learning_rate": 0.00022550362997008237, + "loss": 0.0164, "step": 98440 }, { - "epoch": 1.06, - "learning_rate": 0.00014035480313939156, - "loss": 0.014, + "epoch": 0.5, + "learning_rate": 0.00022549606227706837, + "loss": 0.0171, "step": 98450 }, { - "epoch": 1.06, - "learning_rate": 0.00014033858727378865, - "loss": 0.0088, + "epoch": 0.5, + "learning_rate": 0.00022548849458405436, + "loss": 0.013, "step": 98460 }, { - "epoch": 1.06, - "learning_rate": 0.00014032237140818577, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.00022548092689104034, + "loss": 0.0157, "step": 98470 }, { - "epoch": 1.06, - "learning_rate": 0.00014030615554258284, - "loss": 0.0095, + "epoch": 0.5, + "learning_rate": 0.00022547335919802635, + "loss": 0.0169, "step": 98480 }, { - "epoch": 1.06, - "learning_rate": 0.00014028993967697996, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.00022546579150501233, + "loss": 0.0159, "step": 98490 }, { - "epoch": 1.06, - "learning_rate": 0.00014027372381137702, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.0002254582238119983, + "loss": 0.0276, "step": 98500 }, { - "epoch": 1.06, - "learning_rate": 0.00014025750794577414, - "loss": 0.009, + "epoch": 0.5, + "learning_rate": 0.00022545065611898432, + "loss": 0.0217, "step": 98510 }, { - "epoch": 1.07, - "learning_rate": 0.0001402412920801712, - "loss": 0.0086, + "epoch": 0.5, + "learning_rate": 0.0002254430884259703, + "loss": 0.0157, "step": 98520 }, { - "epoch": 1.07, - "learning_rate": 0.00014022507621456833, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.00022543552073295628, + "loss": 0.0147, "step": 98530 }, { - "epoch": 1.07, - "learning_rate": 0.00014020886034896542, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.0002254279530399423, + "loss": 0.0137, "step": 98540 }, { - "epoch": 1.07, - "learning_rate": 0.0001401926444833625, - "loss": 0.0132, + "epoch": 0.5, + "learning_rate": 0.00022542038534692827, + "loss": 0.0151, "step": 98550 }, { - "epoch": 1.07, - "learning_rate": 0.0001401764286177596, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.00022541281765391425, + "loss": 0.0161, "step": 98560 }, { - "epoch": 1.07, - "learning_rate": 0.0001401602127521567, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.00022540524996090026, + "loss": 0.0158, "step": 98570 }, { - "epoch": 1.07, - "learning_rate": 0.0001401439968865538, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.00022539768226788624, + "loss": 0.0195, "step": 98580 }, { - "epoch": 1.07, - "learning_rate": 0.00014012778102095088, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.00022539011457487222, + "loss": 0.0179, "step": 98590 }, { - "epoch": 1.07, - "learning_rate": 0.00014011156515534798, - "loss": 0.013, + "epoch": 0.5, + "learning_rate": 0.0002253825468818582, + "loss": 0.0153, "step": 98600 }, { - "epoch": 1.07, - "learning_rate": 0.00014009534928974507, - "loss": 0.0132, + "epoch": 0.5, + "learning_rate": 0.0002253749791888442, + "loss": 0.0187, "step": 98610 }, { - "epoch": 1.07, - "learning_rate": 0.0001400791334241422, - "loss": 0.0089, + "epoch": 0.5, + "learning_rate": 0.0002253674114958302, + "loss": 0.0156, "step": 98620 }, { - "epoch": 1.07, - "learning_rate": 0.00014006291755853925, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022535984380281618, + "loss": 0.0126, "step": 98630 }, { - "epoch": 1.07, - "learning_rate": 0.00014004670169293637, - "loss": 0.0114, + "epoch": 0.5, + "learning_rate": 0.00022535227610980218, + "loss": 0.0159, "step": 98640 }, { - "epoch": 1.07, - "learning_rate": 0.00014003048582733344, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022534470841678817, + "loss": 0.0154, "step": 98650 }, { - "epoch": 1.07, - "learning_rate": 0.00014001426996173056, - "loss": 0.0095, + "epoch": 0.5, + "learning_rate": 0.00022533714072377415, + "loss": 0.0157, "step": 98660 }, { - "epoch": 1.07, - "learning_rate": 0.00013999805409612763, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.0002253295730307601, + "loss": 0.0134, "step": 98670 }, { - "epoch": 1.07, - "learning_rate": 0.00013998183823052475, - "loss": 0.0126, + "epoch": 0.5, + "learning_rate": 0.0002253220053377461, + "loss": 0.017, "step": 98680 }, { - "epoch": 1.07, - "learning_rate": 0.00013996562236492184, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.0002253144376447321, + "loss": 0.014, "step": 98690 }, { - "epoch": 1.07, - "learning_rate": 0.00013994940649931893, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.00022530686995171807, + "loss": 0.0188, "step": 98700 }, { - "epoch": 1.07, - "learning_rate": 0.00013993319063371602, - "loss": 0.0117, + "epoch": 0.5, + "learning_rate": 0.00022529930225870408, + "loss": 0.0153, "step": 98710 }, { - "epoch": 1.07, - "learning_rate": 0.00013991697476811312, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022529173456569006, + "loss": 0.0156, "step": 98720 }, { - "epoch": 1.07, - "learning_rate": 0.0001399007589025102, - "loss": 0.0137, + "epoch": 0.5, + "learning_rate": 0.00022528416687267604, + "loss": 0.0142, "step": 98730 }, { - "epoch": 1.07, - "learning_rate": 0.0001398845430369073, - "loss": 0.0122, + "epoch": 0.5, + "learning_rate": 0.00022527659917966205, + "loss": 0.0156, "step": 98740 }, { - "epoch": 1.07, - "learning_rate": 0.0001398683271713044, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.00022526903148664803, + "loss": 0.0203, "step": 98750 }, { - "epoch": 1.07, - "learning_rate": 0.0001398521113057015, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.00022526146379363402, + "loss": 0.014, "step": 98760 }, { - "epoch": 1.07, - "learning_rate": 0.00013983589544009858, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.00022525389610062002, + "loss": 0.0125, "step": 98770 }, { - "epoch": 1.07, - "learning_rate": 0.00013981967957449567, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.000225246328407606, + "loss": 0.0155, "step": 98780 }, { - "epoch": 1.07, - "learning_rate": 0.00013980346370889277, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.000225238760714592, + "loss": 0.0176, "step": 98790 }, { - "epoch": 1.07, - "learning_rate": 0.00013978724784328986, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.000225231193021578, + "loss": 0.0164, "step": 98800 }, { - "epoch": 1.07, - "learning_rate": 0.00013977103197768695, - "loss": 0.0126, + "epoch": 0.5, + "learning_rate": 0.00022522362532856398, + "loss": 0.0132, "step": 98810 }, { - "epoch": 1.07, - "learning_rate": 0.00013975481611208404, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022521605763554996, + "loss": 0.0171, "step": 98820 }, { - "epoch": 1.07, - "learning_rate": 0.00013973860024648114, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.00022520848994253594, + "loss": 0.0187, "step": 98830 }, { - "epoch": 1.07, - "learning_rate": 0.00013972238438087826, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.00022520092224952195, + "loss": 0.0168, "step": 98840 }, { - "epoch": 1.07, - "learning_rate": 0.00013970616851527532, - "loss": 0.0119, + "epoch": 0.5, + "learning_rate": 0.00022519335455650793, + "loss": 0.0166, "step": 98850 }, { - "epoch": 1.07, - "learning_rate": 0.00013968995264967244, - "loss": 0.0095, + "epoch": 0.5, + "learning_rate": 0.0002251857868634939, + "loss": 0.0135, "step": 98860 }, { - "epoch": 1.07, - "learning_rate": 0.0001396737367840695, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022517821917047992, + "loss": 0.0213, "step": 98870 }, { - "epoch": 1.07, - "learning_rate": 0.00013965752091846663, - "loss": 0.0098, + "epoch": 0.5, + "learning_rate": 0.0002251706514774659, + "loss": 0.0151, "step": 98880 }, { - "epoch": 1.07, - "learning_rate": 0.0001396413050528637, - "loss": 0.0114, + "epoch": 0.5, + "learning_rate": 0.00022516308378445188, + "loss": 0.0165, "step": 98890 }, { - "epoch": 1.07, - "learning_rate": 0.0001396250891872608, - "loss": 0.0101, + "epoch": 0.5, + "learning_rate": 0.0002251555160914379, + "loss": 0.0156, "step": 98900 }, { - "epoch": 1.07, - "learning_rate": 0.0001396088733216579, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022514794839842387, + "loss": 0.0125, "step": 98910 }, { - "epoch": 1.07, - "learning_rate": 0.000139592657456055, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022514038070540985, + "loss": 0.0159, "step": 98920 }, { - "epoch": 1.07, - "learning_rate": 0.0001395764415904521, - "loss": 0.0106, + "epoch": 0.5, + "learning_rate": 0.00022513281301239586, + "loss": 0.0143, "step": 98930 }, { - "epoch": 1.07, - "learning_rate": 0.00013956022572484918, - "loss": 0.0116, + "epoch": 0.5, + "learning_rate": 0.00022512524531938184, + "loss": 0.0142, "step": 98940 }, { - "epoch": 1.07, - "learning_rate": 0.00013954400985924628, - "loss": 0.0136, + "epoch": 0.5, + "learning_rate": 0.00022511767762636783, + "loss": 0.0143, "step": 98950 }, { - "epoch": 1.07, - "learning_rate": 0.00013952779399364337, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022511010993335383, + "loss": 0.0153, "step": 98960 }, { - "epoch": 1.07, - "learning_rate": 0.00013951157812804046, - "loss": 0.0142, + "epoch": 0.5, + "learning_rate": 0.00022510254224033982, + "loss": 0.0134, "step": 98970 }, { - "epoch": 1.07, - "learning_rate": 0.00013949536226243756, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.0002250949745473258, + "loss": 0.0167, "step": 98980 }, { - "epoch": 1.07, - "learning_rate": 0.00013947914639683465, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022508740685431178, + "loss": 0.0195, "step": 98990 }, { - "epoch": 1.07, - "learning_rate": 0.00013946293053123174, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.0002250798391612978, + "loss": 0.0132, "step": 99000 }, { - "epoch": 1.07, - "eval_cer": 0.9215460437741146, - "eval_loss": 0.008673109114170074, - "eval_runtime": 121.2918, - "eval_samples_per_second": 16.489, - "eval_steps_per_second": 4.122, + "epoch": 0.5, + "eval_cer": 0.9144857822411687, + "eval_loss": 0.011587457731366158, + "eval_runtime": 116.7415, + "eval_samples_per_second": 17.132, + "eval_steps_per_second": 4.283, "step": 99000 }, { - "epoch": 1.07, - "learning_rate": 0.00013944671466562883, - "loss": 0.0079, + "epoch": 0.5, + "learning_rate": 0.00022507227146828377, + "loss": 0.0159, "step": 99010 }, { - "epoch": 1.07, - "learning_rate": 0.00013943049880002593, - "loss": 0.009, + "epoch": 0.5, + "learning_rate": 0.00022506470377526975, + "loss": 0.0158, "step": 99020 }, { - "epoch": 1.07, - "learning_rate": 0.00013941428293442302, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022505713608225576, + "loss": 0.0154, "step": 99030 }, { - "epoch": 1.07, - "learning_rate": 0.0001393980670688201, - "loss": 0.0092, + "epoch": 0.5, + "learning_rate": 0.00022504956838924174, + "loss": 0.0127, "step": 99040 }, { - "epoch": 1.07, - "learning_rate": 0.0001393818512032172, - "loss": 0.0087, + "epoch": 0.5, + "learning_rate": 0.00022504200069622772, + "loss": 0.0199, "step": 99050 }, { - "epoch": 1.07, - "learning_rate": 0.00013936563533761432, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.00022503443300321373, + "loss": 0.0172, "step": 99060 }, { - "epoch": 1.07, - "learning_rate": 0.0001393494194720114, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.0002250268653101997, + "loss": 0.0162, "step": 99070 }, { - "epoch": 1.07, - "learning_rate": 0.0001393332036064085, - "loss": 0.0113, + "epoch": 0.5, + "learning_rate": 0.0002250192976171857, + "loss": 0.0187, "step": 99080 }, { - "epoch": 1.07, - "learning_rate": 0.00013931698774080558, - "loss": 0.008, + "epoch": 0.5, + "learning_rate": 0.0002250117299241717, + "loss": 0.0157, "step": 99090 }, { - "epoch": 1.07, - "learning_rate": 0.0001393007718752027, - "loss": 0.0114, + "epoch": 0.5, + "learning_rate": 0.00022500416223115768, + "loss": 0.014, "step": 99100 }, { - "epoch": 1.07, - "learning_rate": 0.00013928455600959976, - "loss": 0.0119, + "epoch": 0.5, + "learning_rate": 0.00022499659453814366, + "loss": 0.0151, "step": 99110 }, { - "epoch": 1.07, - "learning_rate": 0.00013926834014399688, - "loss": 0.0135, + "epoch": 0.5, + "learning_rate": 0.00022498902684512967, + "loss": 0.013, "step": 99120 }, { - "epoch": 1.07, - "learning_rate": 0.00013925212427839397, - "loss": 0.0117, + "epoch": 0.5, + "learning_rate": 0.00022498145915211565, + "loss": 0.0151, "step": 99130 }, { - "epoch": 1.07, - "learning_rate": 0.00013923590841279107, - "loss": 0.0127, + "epoch": 0.5, + "learning_rate": 0.00022497389145910164, + "loss": 0.0135, "step": 99140 }, { - "epoch": 1.07, - "learning_rate": 0.00013921969254718816, - "loss": 0.011, + "epoch": 0.5, + "learning_rate": 0.00022496632376608764, + "loss": 0.0234, "step": 99150 }, { - "epoch": 1.07, - "learning_rate": 0.00013920347668158525, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.00022495875607307363, + "loss": 0.013, "step": 99160 }, { - "epoch": 1.07, - "learning_rate": 0.00013918726081598234, - "loss": 0.0095, + "epoch": 0.5, + "learning_rate": 0.0002249511883800596, + "loss": 0.0175, "step": 99170 }, { - "epoch": 1.07, - "learning_rate": 0.00013917104495037944, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.0002249436206870456, + "loss": 0.0171, "step": 99180 }, { - "epoch": 1.07, - "learning_rate": 0.00013915482908477653, - "loss": 0.011, + "epoch": 0.5, + "learning_rate": 0.0002249360529940316, + "loss": 0.0166, "step": 99190 }, { - "epoch": 1.07, - "learning_rate": 0.00013913861321917362, - "loss": 0.0133, + "epoch": 0.5, + "learning_rate": 0.00022492848530101758, + "loss": 0.0174, "step": 99200 }, { - "epoch": 1.07, - "learning_rate": 0.00013912239735357072, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.00022492091760800356, + "loss": 0.0122, "step": 99210 }, { - "epoch": 1.07, - "learning_rate": 0.0001391061814879678, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.00022491334991498957, + "loss": 0.0156, "step": 99220 }, { - "epoch": 1.07, - "learning_rate": 0.0001390899656223649, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.00022490578222197555, + "loss": 0.0146, "step": 99230 }, { - "epoch": 1.07, - "learning_rate": 0.000139073749756762, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.00022489821452896153, + "loss": 0.0159, "step": 99240 }, { - "epoch": 1.07, - "learning_rate": 0.00013905753389115909, - "loss": 0.0133, + "epoch": 0.5, + "learning_rate": 0.00022489064683594754, + "loss": 0.0176, "step": 99250 }, { - "epoch": 1.07, - "learning_rate": 0.00013904131802555618, - "loss": 0.0084, + "epoch": 0.5, + "learning_rate": 0.00022488307914293352, + "loss": 0.0172, "step": 99260 }, { - "epoch": 1.07, - "learning_rate": 0.0001390251021599533, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.0002248755114499195, + "loss": 0.0116, "step": 99270 }, { - "epoch": 1.07, - "learning_rate": 0.0001390088862943504, - "loss": 0.011, + "epoch": 0.5, + "learning_rate": 0.0002248679437569055, + "loss": 0.0152, "step": 99280 }, { - "epoch": 1.07, - "learning_rate": 0.00013899267042874748, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.0002248603760638915, + "loss": 0.0368, "step": 99290 }, { - "epoch": 1.07, - "learning_rate": 0.00013897645456314458, - "loss": 0.0092, + "epoch": 0.5, + "learning_rate": 0.00022485280837087747, + "loss": 0.0209, "step": 99300 }, { - "epoch": 1.07, - "learning_rate": 0.00013896023869754167, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.00022484524067786348, + "loss": 0.0144, "step": 99310 }, { - "epoch": 1.07, - "learning_rate": 0.00013894402283193876, - "loss": 0.011, + "epoch": 0.5, + "learning_rate": 0.00022483767298484946, + "loss": 0.019, "step": 99320 }, { - "epoch": 1.07, - "learning_rate": 0.00013892780696633586, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.00022483010529183545, + "loss": 0.0153, "step": 99330 }, { - "epoch": 1.07, - "learning_rate": 0.00013891159110073295, - "loss": 0.0117, + "epoch": 0.5, + "learning_rate": 0.00022482253759882143, + "loss": 0.0179, "step": 99340 }, { - "epoch": 1.07, - "learning_rate": 0.00013889537523513004, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022481496990580744, + "loss": 0.0215, "step": 99350 }, { - "epoch": 1.07, - "learning_rate": 0.00013887915936952713, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022480740221279342, + "loss": 0.0174, "step": 99360 }, { - "epoch": 1.07, - "learning_rate": 0.00013886294350392423, - "loss": 0.0098, + "epoch": 0.5, + "learning_rate": 0.0002247998345197794, + "loss": 0.0178, "step": 99370 }, { - "epoch": 1.07, - "learning_rate": 0.00013884672763832132, - "loss": 0.0157, + "epoch": 0.5, + "learning_rate": 0.0002247922668267654, + "loss": 0.0148, "step": 99380 }, { - "epoch": 1.07, - "learning_rate": 0.0001388305117727184, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.0002247846991337514, + "loss": 0.0166, "step": 99390 }, { - "epoch": 1.07, - "learning_rate": 0.0001388142959071155, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022477713144073737, + "loss": 0.015, "step": 99400 }, { - "epoch": 1.07, - "learning_rate": 0.0001387980800415126, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022476956374772338, + "loss": 0.0157, "step": 99410 }, { - "epoch": 1.07, - "learning_rate": 0.0001387818641759097, - "loss": 0.0133, + "epoch": 0.5, + "learning_rate": 0.00022476199605470936, + "loss": 0.0192, "step": 99420 }, { - "epoch": 1.07, - "learning_rate": 0.0001387656483103068, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.00022475442836169534, + "loss": 0.0247, "step": 99430 }, { - "epoch": 1.07, - "learning_rate": 0.00013874943244470388, + "epoch": 0.5, + "learning_rate": 0.00022474686066868135, "loss": 0.0166, "step": 99440 }, { - "epoch": 1.08, - "learning_rate": 0.000138733216579101, - "loss": 0.0092, + "epoch": 0.5, + "learning_rate": 0.00022473929297566733, + "loss": 0.0193, "step": 99450 }, { - "epoch": 1.08, - "learning_rate": 0.00013871700071349806, - "loss": 0.0116, + "epoch": 0.5, + "learning_rate": 0.0002247317252826533, + "loss": 0.0129, "step": 99460 }, { - "epoch": 1.08, - "learning_rate": 0.00013870078484789518, - "loss": 0.0127, + "epoch": 0.5, + "learning_rate": 0.00022472415758963932, + "loss": 0.0173, "step": 99470 }, { - "epoch": 1.08, - "learning_rate": 0.00013868456898229227, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.0002247165898966253, + "loss": 0.015, "step": 99480 }, { - "epoch": 1.08, - "learning_rate": 0.00013866835311668937, - "loss": 0.0121, + "epoch": 0.5, + "learning_rate": 0.00022470902220361128, + "loss": 0.0155, "step": 99490 }, { - "epoch": 1.08, - "learning_rate": 0.00013865213725108646, - "loss": 0.0101, + "epoch": 0.5, + "learning_rate": 0.00022470145451059727, + "loss": 0.0151, "step": 99500 }, { - "epoch": 1.08, - "learning_rate": 0.00013863592138548355, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022469388681758327, + "loss": 0.0148, "step": 99510 }, { - "epoch": 1.08, - "learning_rate": 0.00013861970551988064, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022468631912456926, + "loss": 0.0152, "step": 99520 }, { - "epoch": 1.08, - "learning_rate": 0.00013860348965427774, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.00022467875143155524, + "loss": 0.0137, "step": 99530 }, { - "epoch": 1.08, - "learning_rate": 0.00013858727378867483, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022467118373854125, + "loss": 0.0168, "step": 99540 }, { - "epoch": 1.08, - "learning_rate": 0.00013857105792307192, - "loss": 0.0106, + "epoch": 0.5, + "learning_rate": 0.00022466361604552723, + "loss": 0.0198, "step": 99550 }, { - "epoch": 1.08, - "learning_rate": 0.00013855484205746902, - "loss": 0.0127, + "epoch": 0.5, + "learning_rate": 0.0002246560483525132, + "loss": 0.0177, "step": 99560 }, { - "epoch": 1.08, - "learning_rate": 0.0001385386261918661, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.00022464848065949922, + "loss": 0.0186, "step": 99570 }, { - "epoch": 1.08, - "learning_rate": 0.0001385224103262632, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.0002246409129664852, + "loss": 0.0164, "step": 99580 }, { - "epoch": 1.08, - "learning_rate": 0.0001385061944606603, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.00022463334527347118, + "loss": 0.0136, "step": 99590 }, { - "epoch": 1.08, - "learning_rate": 0.0001384899785950574, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.0002246257775804572, + "loss": 0.0159, "step": 99600 }, { - "epoch": 1.08, - "learning_rate": 0.00013847376272945448, - "loss": 0.0126, + "epoch": 0.5, + "learning_rate": 0.00022461820988744317, + "loss": 0.0155, "step": 99610 }, { - "epoch": 1.08, - "learning_rate": 0.00013845754686385157, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022461064219442915, + "loss": 0.0147, "step": 99620 }, { - "epoch": 1.08, - "learning_rate": 0.0001384413309982487, - "loss": 0.007, + "epoch": 0.5, + "learning_rate": 0.00022460307450141516, + "loss": 0.024, "step": 99630 }, { - "epoch": 1.08, - "learning_rate": 0.00013842511513264576, - "loss": 0.0092, + "epoch": 0.5, + "learning_rate": 0.00022459550680840114, + "loss": 0.0168, "step": 99640 }, { - "epoch": 1.08, - "learning_rate": 0.00013840889926704288, - "loss": 0.0087, + "epoch": 0.5, + "learning_rate": 0.00022458793911538712, + "loss": 0.0164, "step": 99650 }, { - "epoch": 1.08, - "learning_rate": 0.00013839268340143994, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.00022458037142237313, + "loss": 0.0136, "step": 99660 }, { - "epoch": 1.08, - "learning_rate": 0.00013837646753583706, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.0002245728037293591, + "loss": 0.0141, "step": 99670 }, { - "epoch": 1.08, - "learning_rate": 0.00013836025167023413, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.0002245652360363451, + "loss": 0.0173, "step": 99680 }, { - "epoch": 1.08, - "learning_rate": 0.00013834403580463125, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.00022455766834333108, + "loss": 0.0183, "step": 99690 }, { - "epoch": 1.08, - "learning_rate": 0.00013832781993902834, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.00022455010065031708, + "loss": 0.0212, "step": 99700 }, { - "epoch": 1.08, - "learning_rate": 0.00013831160407342543, - "loss": 0.0082, + "epoch": 0.5, + "learning_rate": 0.00022454253295730307, + "loss": 0.0146, "step": 99710 }, { - "epoch": 1.08, - "learning_rate": 0.00013829538820782253, - "loss": 0.0116, + "epoch": 0.5, + "learning_rate": 0.00022453496526428905, + "loss": 0.0161, "step": 99720 }, { - "epoch": 1.08, - "learning_rate": 0.00013827917234221962, - "loss": 0.0122, + "epoch": 0.5, + "learning_rate": 0.00022452739757127506, + "loss": 0.0134, "step": 99730 }, { - "epoch": 1.08, - "learning_rate": 0.0001382629564766167, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.00022451982987826104, + "loss": 0.0173, "step": 99740 }, { - "epoch": 1.08, - "learning_rate": 0.0001382467406110138, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.00022451226218524702, + "loss": 0.0166, "step": 99750 }, { - "epoch": 1.08, - "learning_rate": 0.0001382305247454109, - "loss": 0.0089, + "epoch": 0.5, + "learning_rate": 0.00022450469449223303, + "loss": 0.0138, "step": 99760 }, { - "epoch": 1.08, - "learning_rate": 0.000138214308879808, - "loss": 0.011, + "epoch": 0.5, + "learning_rate": 0.000224497126799219, + "loss": 0.0198, "step": 99770 }, { - "epoch": 1.08, - "learning_rate": 0.00013819809301420508, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.000224489559106205, + "loss": 0.0162, "step": 99780 }, { - "epoch": 1.08, - "learning_rate": 0.00013818187714860218, - "loss": 0.0082, + "epoch": 0.5, + "learning_rate": 0.000224481991413191, + "loss": 0.0143, "step": 99790 }, { - "epoch": 1.08, - "learning_rate": 0.00013816566128299927, - "loss": 0.0121, + "epoch": 0.5, + "learning_rate": 0.00022447442372017698, + "loss": 0.0166, "step": 99800 }, { - "epoch": 1.08, - "learning_rate": 0.00013814944541739636, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.00022446685602716296, + "loss": 0.014, "step": 99810 }, { - "epoch": 1.08, - "learning_rate": 0.00013813322955179345, - "loss": 0.013, + "epoch": 0.5, + "learning_rate": 0.00022445928833414897, + "loss": 0.0141, "step": 99820 }, { - "epoch": 1.08, - "learning_rate": 0.00013811701368619055, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.00022445172064113495, + "loss": 0.0152, "step": 99830 }, { - "epoch": 1.08, - "learning_rate": 0.00013810079782058764, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.00022444415294812093, + "loss": 0.0156, "step": 99840 }, { - "epoch": 1.08, - "learning_rate": 0.00013808458195498476, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022443658525510691, + "loss": 0.0165, "step": 99850 }, { - "epoch": 1.08, - "learning_rate": 0.00013806836608938182, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022442901756209292, + "loss": 0.0169, "step": 99860 }, { - "epoch": 1.08, - "learning_rate": 0.00013805215022377894, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.0002244214498690789, + "loss": 0.0164, "step": 99870 }, { - "epoch": 1.08, - "learning_rate": 0.000138035934358176, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.00022441388217606489, + "loss": 0.0172, "step": 99880 }, { - "epoch": 1.08, - "learning_rate": 0.00013801971849257313, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.0002244063144830509, + "loss": 0.0153, "step": 99890 }, { - "epoch": 1.08, - "learning_rate": 0.0001380035026269702, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.00022439874679003688, + "loss": 0.018, "step": 99900 }, { - "epoch": 1.08, - "learning_rate": 0.00013798728676136732, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022439117909702286, + "loss": 0.0136, "step": 99910 }, { - "epoch": 1.08, - "learning_rate": 0.0001379710708957644, - "loss": 0.0153, + "epoch": 0.5, + "learning_rate": 0.00022438361140400887, + "loss": 0.0163, "step": 99920 }, { - "epoch": 1.08, - "learning_rate": 0.0001379548550301615, - "loss": 0.0086, + "epoch": 0.5, + "learning_rate": 0.00022437604371099482, + "loss": 0.0155, "step": 99930 }, { - "epoch": 1.08, - "learning_rate": 0.0001379386391645586, - "loss": 0.011, + "epoch": 0.5, + "learning_rate": 0.0002243684760179808, + "loss": 0.0164, "step": 99940 }, { - "epoch": 1.08, - "learning_rate": 0.0001379224232989557, - "loss": 0.0124, + "epoch": 0.5, + "learning_rate": 0.00022436090832496678, + "loss": 0.013, "step": 99950 }, { - "epoch": 1.08, - "learning_rate": 0.00013790620743335278, - "loss": 0.011, + "epoch": 0.5, + "learning_rate": 0.0002243533406319528, + "loss": 0.0189, "step": 99960 }, { - "epoch": 1.08, - "learning_rate": 0.00013788999156774987, - "loss": 0.0117, + "epoch": 0.5, + "learning_rate": 0.00022434577293893877, + "loss": 0.0168, "step": 99970 }, { - "epoch": 1.08, - "learning_rate": 0.00013787377570214696, - "loss": 0.013, + "epoch": 0.5, + "learning_rate": 0.00022433820524592475, + "loss": 0.0188, "step": 99980 }, { - "epoch": 1.08, - "learning_rate": 0.00013785755983654406, - "loss": 0.0116, + "epoch": 0.5, + "learning_rate": 0.00022433063755291076, + "loss": 0.0171, "step": 99990 }, { - "epoch": 1.08, - "learning_rate": 0.00013784134397094118, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.00022432306985989674, + "loss": 0.0151, "step": 100000 }, { - "epoch": 1.08, - "eval_cer": 0.921535620538638, - "eval_loss": 0.008387841284275055, - "eval_runtime": 121.0639, - "eval_samples_per_second": 16.52, - "eval_steps_per_second": 4.13, + "epoch": 0.5, + "eval_cer": 0.9145051901636767, + "eval_loss": 0.011643487960100174, + "eval_runtime": 116.6776, + "eval_samples_per_second": 17.141, + "eval_steps_per_second": 4.285, "step": 100000 }, { - "epoch": 1.08, - "learning_rate": 0.00013782512810533824, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.00022431550216688273, + "loss": 0.0137, "step": 100010 }, { - "epoch": 1.08, - "learning_rate": 0.00013780891223973536, - "loss": 0.0095, + "epoch": 0.5, + "learning_rate": 0.00022430793447386873, + "loss": 0.0181, "step": 100020 }, { - "epoch": 1.08, - "learning_rate": 0.00013779269637413243, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022430036678085472, + "loss": 0.0136, "step": 100030 }, { - "epoch": 1.08, - "learning_rate": 0.00013777648050852955, - "loss": 0.0137, + "epoch": 0.5, + "learning_rate": 0.0002242927990878407, + "loss": 0.0213, "step": 100040 }, { - "epoch": 1.08, - "learning_rate": 0.00013776026464292661, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.0002242852313948267, + "loss": 0.0172, "step": 100050 }, { - "epoch": 1.08, - "learning_rate": 0.00013774404877732373, - "loss": 0.0116, + "epoch": 0.5, + "learning_rate": 0.0002242776637018127, + "loss": 0.0217, "step": 100060 }, { - "epoch": 1.08, - "learning_rate": 0.00013772783291172083, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.00022427009600879867, + "loss": 0.0161, "step": 100070 }, { - "epoch": 1.08, - "learning_rate": 0.00013771161704611792, - "loss": 0.0114, + "epoch": 0.5, + "learning_rate": 0.00022426252831578465, + "loss": 0.0185, "step": 100080 }, { - "epoch": 1.08, - "learning_rate": 0.000137695401180515, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.00022425496062277066, + "loss": 0.0164, "step": 100090 }, { - "epoch": 1.08, - "learning_rate": 0.0001376791853149121, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.00022424739292975664, + "loss": 0.0131, "step": 100100 }, { - "epoch": 1.08, - "learning_rate": 0.0001376629694493092, - "loss": 0.0119, + "epoch": 0.51, + "learning_rate": 0.00022423982523674262, + "loss": 0.0179, "step": 100110 }, { - "epoch": 1.08, - "learning_rate": 0.0001376467535837063, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.00022423225754372863, + "loss": 0.0163, "step": 100120 }, { - "epoch": 1.08, - "learning_rate": 0.00013763053771810338, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.0002242246898507146, + "loss": 0.0154, "step": 100130 }, { - "epoch": 1.08, - "learning_rate": 0.00013761432185250048, - "loss": 0.009, + "epoch": 0.51, + "learning_rate": 0.0002242171221577006, + "loss": 0.0144, "step": 100140 }, { - "epoch": 1.08, - "learning_rate": 0.00013759810598689757, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.0002242095544646866, + "loss": 0.0158, "step": 100150 }, { - "epoch": 1.08, - "learning_rate": 0.00013758189012129466, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.00022420198677167258, + "loss": 0.0171, "step": 100160 }, { - "epoch": 1.08, - "learning_rate": 0.00013756567425569175, - "loss": 0.0091, + "epoch": 0.51, + "learning_rate": 0.00022419441907865856, + "loss": 0.0147, "step": 100170 }, { - "epoch": 1.08, - "learning_rate": 0.00013754945839008885, - "loss": 0.0082, + "epoch": 0.51, + "learning_rate": 0.00022418685138564457, + "loss": 0.0154, "step": 100180 }, { - "epoch": 1.08, - "learning_rate": 0.00013753324252448594, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022417928369263055, + "loss": 0.017, "step": 100190 }, { - "epoch": 1.08, - "learning_rate": 0.00013751702665888303, - "loss": 0.0104, + "epoch": 0.51, + "learning_rate": 0.00022417171599961654, + "loss": 0.014, "step": 100200 }, { - "epoch": 1.08, - "learning_rate": 0.00013750081079328013, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.00022416414830660254, + "loss": 0.0143, "step": 100210 }, { - "epoch": 1.08, - "learning_rate": 0.00013748459492767725, - "loss": 0.0119, + "epoch": 0.51, + "learning_rate": 0.00022415658061358853, + "loss": 0.0157, "step": 100220 }, { - "epoch": 1.08, - "learning_rate": 0.0001374683790620743, - "loss": 0.0091, + "epoch": 0.51, + "learning_rate": 0.0002241490129205745, + "loss": 0.0151, "step": 100230 }, { - "epoch": 1.08, - "learning_rate": 0.00013745216319647143, - "loss": 0.0128, + "epoch": 0.51, + "learning_rate": 0.0002241414452275605, + "loss": 0.016, "step": 100240 }, { - "epoch": 1.08, - "learning_rate": 0.0001374359473308685, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.0002241338775345465, + "loss": 0.0186, "step": 100250 }, { - "epoch": 1.08, - "learning_rate": 0.00013741973146526562, - "loss": 0.012, + "epoch": 0.51, + "learning_rate": 0.00022412630984153248, + "loss": 0.015, "step": 100260 }, { - "epoch": 1.08, - "learning_rate": 0.00013740351559966268, - "loss": 0.0116, + "epoch": 0.51, + "learning_rate": 0.00022411874214851846, + "loss": 0.0182, "step": 100270 }, { - "epoch": 1.08, - "learning_rate": 0.0001373872997340598, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.00022411117445550447, + "loss": 0.0151, "step": 100280 }, { - "epoch": 1.08, - "learning_rate": 0.0001373710838684569, - "loss": 0.0132, + "epoch": 0.51, + "learning_rate": 0.00022410360676249045, + "loss": 0.0149, "step": 100290 }, { - "epoch": 1.08, - "learning_rate": 0.000137354868002854, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.00022409603906947643, + "loss": 0.0164, "step": 100300 }, { - "epoch": 1.08, - "learning_rate": 0.00013733865213725108, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.00022408847137646244, + "loss": 0.0151, "step": 100310 }, { - "epoch": 1.08, - "learning_rate": 0.00013732243627164817, - "loss": 0.0119, + "epoch": 0.51, + "learning_rate": 0.00022408090368344842, + "loss": 0.0162, "step": 100320 }, { - "epoch": 1.08, - "learning_rate": 0.00013730622040604527, - "loss": 0.0083, + "epoch": 0.51, + "learning_rate": 0.0002240733359904344, + "loss": 0.0181, "step": 100330 }, { - "epoch": 1.08, - "learning_rate": 0.00013729000454044236, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.0002240657682974204, + "loss": 0.0162, "step": 100340 }, { - "epoch": 1.08, - "learning_rate": 0.00013727378867483945, - "loss": 0.0116, + "epoch": 0.51, + "learning_rate": 0.0002240582006044064, + "loss": 0.0133, "step": 100350 }, { - "epoch": 1.08, - "learning_rate": 0.00013725757280923654, - "loss": 0.0088, + "epoch": 0.51, + "learning_rate": 0.00022405063291139237, + "loss": 0.0144, "step": 100360 }, { - "epoch": 1.09, - "learning_rate": 0.00013724135694363364, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022404306521837838, + "loss": 0.0195, "step": 100370 }, { - "epoch": 1.09, - "learning_rate": 0.00013722514107803073, - "loss": 0.0095, + "epoch": 0.51, + "learning_rate": 0.00022403549752536436, + "loss": 0.0173, "step": 100380 }, { - "epoch": 1.09, - "learning_rate": 0.00013720892521242782, - "loss": 0.0089, + "epoch": 0.51, + "learning_rate": 0.00022402792983235035, + "loss": 0.0145, "step": 100390 }, { - "epoch": 1.09, - "learning_rate": 0.00013719270934682491, - "loss": 0.0087, + "epoch": 0.51, + "learning_rate": 0.00022402036213933633, + "loss": 0.0156, "step": 100400 }, { - "epoch": 1.09, - "learning_rate": 0.000137176493481222, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.00022401279444632234, + "loss": 0.0224, "step": 100410 }, { - "epoch": 1.09, - "learning_rate": 0.0001371602776156191, - "loss": 0.0121, + "epoch": 0.51, + "learning_rate": 0.00022400522675330832, + "loss": 0.019, "step": 100420 }, { - "epoch": 1.09, - "learning_rate": 0.0001371440617500162, - "loss": 0.008, + "epoch": 0.51, + "learning_rate": 0.0002239976590602943, + "loss": 0.0199, "step": 100430 }, { - "epoch": 1.09, - "learning_rate": 0.0001371278458844133, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.0002239900913672803, + "loss": 0.0168, "step": 100440 }, { - "epoch": 1.09, - "learning_rate": 0.00013711163001881038, - "loss": 0.0126, + "epoch": 0.51, + "learning_rate": 0.0002239825236742663, + "loss": 0.016, "step": 100450 }, { - "epoch": 1.09, - "learning_rate": 0.0001370954141532075, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.00022397495598125227, + "loss": 0.0193, "step": 100460 }, { - "epoch": 1.09, - "learning_rate": 0.00013707919828760456, - "loss": 0.0103, + "epoch": 0.51, + "learning_rate": 0.00022396738828823828, + "loss": 0.0125, "step": 100470 }, { - "epoch": 1.09, - "learning_rate": 0.00013706298242200168, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.00022395982059522426, + "loss": 0.0158, "step": 100480 }, { - "epoch": 1.09, - "learning_rate": 0.00013704676655639878, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.00022395225290221024, + "loss": 0.016, "step": 100490 }, { - "epoch": 1.09, - "learning_rate": 0.00013703055069079587, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.00022394468520919625, + "loss": 0.016, "step": 100500 }, { - "epoch": 1.09, - "learning_rate": 0.00013701433482519296, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.00022393711751618223, + "loss": 0.0171, "step": 100510 }, { - "epoch": 1.09, - "learning_rate": 0.00013699811895959005, - "loss": 0.0104, + "epoch": 0.51, + "learning_rate": 0.0002239295498231682, + "loss": 0.016, "step": 100520 }, { - "epoch": 1.09, - "learning_rate": 0.00013698190309398715, - "loss": 0.0089, + "epoch": 0.51, + "learning_rate": 0.00022392198213015422, + "loss": 0.0196, "step": 100530 }, { - "epoch": 1.09, - "learning_rate": 0.00013696568722838424, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.0002239144144371402, + "loss": 0.0155, "step": 100540 }, { - "epoch": 1.09, - "learning_rate": 0.00013694947136278133, - "loss": 0.0089, + "epoch": 0.51, + "learning_rate": 0.00022390684674412618, + "loss": 0.0164, "step": 100550 }, { - "epoch": 1.09, - "learning_rate": 0.00013693325549717843, - "loss": 0.0116, + "epoch": 0.51, + "learning_rate": 0.0002238992790511122, + "loss": 0.0164, "step": 100560 }, { - "epoch": 1.09, - "learning_rate": 0.00013691703963157552, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022389171135809817, + "loss": 0.018, "step": 100570 }, { - "epoch": 1.09, - "learning_rate": 0.0001369008237659726, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022388414366508416, + "loss": 0.0132, "step": 100580 }, { - "epoch": 1.09, - "learning_rate": 0.0001368846079003697, - "loss": 0.0128, + "epoch": 0.51, + "learning_rate": 0.00022387657597207014, + "loss": 0.0154, "step": 100590 }, { - "epoch": 1.09, - "learning_rate": 0.0001368683920347668, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022386900827905615, + "loss": 0.0143, "step": 100600 }, { - "epoch": 1.09, - "learning_rate": 0.0001368521761691639, - "loss": 0.0082, + "epoch": 0.51, + "learning_rate": 0.00022386144058604213, + "loss": 0.0159, "step": 100610 }, { - "epoch": 1.09, - "learning_rate": 0.00013683596030356098, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.0002238538728930281, + "loss": 0.0119, "step": 100620 }, { - "epoch": 1.09, - "learning_rate": 0.00013681974443795807, - "loss": 0.0095, + "epoch": 0.51, + "learning_rate": 0.00022384630520001412, + "loss": 0.0146, "step": 100630 }, { - "epoch": 1.09, - "learning_rate": 0.0001368035285723552, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.0002238387375070001, + "loss": 0.0145, "step": 100640 }, { - "epoch": 1.09, - "learning_rate": 0.00013678731270675226, - "loss": 0.0126, + "epoch": 0.51, + "learning_rate": 0.00022383116981398608, + "loss": 0.0137, "step": 100650 }, { - "epoch": 1.09, - "learning_rate": 0.00013677109684114938, - "loss": 0.0084, + "epoch": 0.51, + "learning_rate": 0.0002238236021209721, + "loss": 0.016, "step": 100660 }, { - "epoch": 1.09, - "learning_rate": 0.00013675488097554645, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022381603442795807, + "loss": 0.0168, "step": 100670 }, { - "epoch": 1.09, - "learning_rate": 0.00013673866510994357, - "loss": 0.0137, + "epoch": 0.51, + "learning_rate": 0.00022380846673494405, + "loss": 0.0135, "step": 100680 }, { - "epoch": 1.09, - "learning_rate": 0.00013672244924434063, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.00022380089904193006, + "loss": 0.0151, "step": 100690 }, { - "epoch": 1.09, - "learning_rate": 0.00013670623337873775, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.00022379333134891604, + "loss": 0.018, "step": 100700 }, { - "epoch": 1.09, - "learning_rate": 0.00013669001751313484, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.00022378576365590202, + "loss": 0.018, "step": 100710 }, { - "epoch": 1.09, - "learning_rate": 0.00013667380164753194, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.00022377819596288803, + "loss": 0.0127, "step": 100720 }, { - "epoch": 1.09, - "learning_rate": 0.00013665758578192903, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.000223770628269874, + "loss": 0.0173, "step": 100730 }, { - "epoch": 1.09, - "learning_rate": 0.00013664136991632612, - "loss": 0.0078, + "epoch": 0.51, + "learning_rate": 0.00022376306057686, + "loss": 0.0169, "step": 100740 }, { - "epoch": 1.09, - "learning_rate": 0.00013662515405072321, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.00022375549288384598, + "loss": 0.0149, "step": 100750 }, { - "epoch": 1.09, - "learning_rate": 0.0001366089381851203, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022374792519083198, + "loss": 0.0138, "step": 100760 }, { - "epoch": 1.09, - "learning_rate": 0.0001365927223195174, - "loss": 0.0087, + "epoch": 0.51, + "learning_rate": 0.00022374035749781797, + "loss": 0.0162, "step": 100770 }, { - "epoch": 1.09, - "learning_rate": 0.0001365765064539145, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022373278980480395, + "loss": 0.0126, "step": 100780 }, { - "epoch": 1.09, - "learning_rate": 0.0001365602905883116, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.00022372522211178996, + "loss": 0.0143, "step": 100790 }, { - "epoch": 1.09, - "learning_rate": 0.00013654407472270868, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022371765441877594, + "loss": 0.018, "step": 100800 }, { - "epoch": 1.09, - "learning_rate": 0.0001365278588571058, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022371008672576192, + "loss": 0.0144, "step": 100810 }, { - "epoch": 1.09, - "learning_rate": 0.00013651164299150286, - "loss": 0.0123, + "epoch": 0.51, + "learning_rate": 0.00022370251903274793, + "loss": 0.0145, "step": 100820 }, { - "epoch": 1.09, - "learning_rate": 0.00013649542712589998, - "loss": 0.0088, + "epoch": 0.51, + "learning_rate": 0.0002236949513397339, + "loss": 0.0171, "step": 100830 }, { - "epoch": 1.09, - "learning_rate": 0.00013647921126029705, - "loss": 0.0127, + "epoch": 0.51, + "learning_rate": 0.0002236873836467199, + "loss": 0.0142, "step": 100840 }, { - "epoch": 1.09, - "learning_rate": 0.00013646299539469417, - "loss": 0.0088, + "epoch": 0.51, + "learning_rate": 0.0002236798159537059, + "loss": 0.0141, "step": 100850 }, { - "epoch": 1.09, - "learning_rate": 0.00013644677952909126, - "loss": 0.0083, + "epoch": 0.51, + "learning_rate": 0.00022367224826069188, + "loss": 0.0159, "step": 100860 }, { - "epoch": 1.09, - "learning_rate": 0.00013643056366348835, - "loss": 0.0104, + "epoch": 0.51, + "learning_rate": 0.00022366468056767786, + "loss": 0.0126, "step": 100870 }, { - "epoch": 1.09, - "learning_rate": 0.00013641434779788545, - "loss": 0.0095, + "epoch": 0.51, + "learning_rate": 0.00022365711287466387, + "loss": 0.0148, "step": 100880 }, { - "epoch": 1.09, - "learning_rate": 0.00013639813193228254, - "loss": 0.0152, + "epoch": 0.51, + "learning_rate": 0.00022364954518164985, + "loss": 0.0176, "step": 100890 }, { - "epoch": 1.09, - "learning_rate": 0.00013638191606667963, - "loss": 0.0117, + "epoch": 0.51, + "learning_rate": 0.00022364197748863583, + "loss": 0.0147, "step": 100900 }, { - "epoch": 1.09, - "learning_rate": 0.00013636570020107673, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.00022363440979562181, + "loss": 0.0138, "step": 100910 }, { - "epoch": 1.09, - "learning_rate": 0.00013634948433547382, - "loss": 0.008, + "epoch": 0.51, + "learning_rate": 0.00022362684210260782, + "loss": 0.013, "step": 100920 }, { - "epoch": 1.09, - "learning_rate": 0.0001363332684698709, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.0002236192744095938, + "loss": 0.0135, "step": 100930 }, { - "epoch": 1.09, - "learning_rate": 0.000136317052604268, - "loss": 0.0095, + "epoch": 0.51, + "learning_rate": 0.00022361170671657979, + "loss": 0.025, "step": 100940 }, { - "epoch": 1.09, - "learning_rate": 0.0001363008367386651, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.0002236041390235658, + "loss": 0.0175, "step": 100950 }, { - "epoch": 1.09, - "learning_rate": 0.0001362846208730622, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.00022359657133055178, + "loss": 0.0153, "step": 100960 }, { - "epoch": 1.09, - "learning_rate": 0.00013626840500745928, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.00022358900363753776, + "loss": 0.0167, "step": 100970 }, { - "epoch": 1.09, - "learning_rate": 0.00013625218914185637, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.00022358143594452377, + "loss": 0.0173, "step": 100980 }, { - "epoch": 1.09, - "learning_rate": 0.00013623597327625347, - "loss": 0.0148, + "epoch": 0.51, + "learning_rate": 0.00022357386825150975, + "loss": 0.016, "step": 100990 }, { - "epoch": 1.09, - "learning_rate": 0.00013621975741065056, - "loss": 0.009, + "epoch": 0.51, + "learning_rate": 0.00022356630055849573, + "loss": 0.0195, "step": 101000 }, { - "epoch": 1.09, - "eval_cer": 0.9215312775238562, - "eval_loss": 0.008509015664458275, - "eval_runtime": 121.1391, - "eval_samples_per_second": 16.51, - "eval_steps_per_second": 4.127, + "epoch": 0.51, + "eval_cer": 0.9145022789753005, + "eval_loss": 0.011683492921292782, + "eval_runtime": 116.7876, + "eval_samples_per_second": 17.125, + "eval_steps_per_second": 4.281, "step": 101000 }, { - "epoch": 1.09, - "learning_rate": 0.00013620354154504768, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.00022355873286548174, + "loss": 0.0174, "step": 101010 }, { - "epoch": 1.09, - "learning_rate": 0.00013618732567944475, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.00022355116517246772, + "loss": 0.0147, "step": 101020 }, { - "epoch": 1.09, - "learning_rate": 0.00013617110981384187, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.0002235435974794537, + "loss": 0.0156, "step": 101030 }, { - "epoch": 1.09, - "learning_rate": 0.00013615489394823893, - "loss": 0.0121, + "epoch": 0.51, + "learning_rate": 0.0002235360297864397, + "loss": 0.0193, "step": 101040 }, { - "epoch": 1.09, - "learning_rate": 0.00013613867808263605, - "loss": 0.0088, + "epoch": 0.51, + "learning_rate": 0.0002235284620934257, + "loss": 0.0137, "step": 101050 }, { - "epoch": 1.09, - "learning_rate": 0.00013612246221703312, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.00022352089440041167, + "loss": 0.0148, "step": 101060 }, { - "epoch": 1.09, - "learning_rate": 0.00013610624635143024, - "loss": 0.0131, + "epoch": 0.51, + "learning_rate": 0.00022351332670739765, + "loss": 0.0113, "step": 101070 }, { - "epoch": 1.09, - "learning_rate": 0.00013609003048582733, - "loss": 0.0091, + "epoch": 0.51, + "learning_rate": 0.00022350575901438366, + "loss": 0.0157, "step": 101080 }, { - "epoch": 1.09, - "learning_rate": 0.00013607381462022442, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.00022349819132136964, + "loss": 0.0162, "step": 101090 }, { - "epoch": 1.09, - "learning_rate": 0.00013605759875462151, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022349062362835562, + "loss": 0.0157, "step": 101100 }, { - "epoch": 1.09, - "learning_rate": 0.0001360413828890186, - "loss": 0.0116, + "epoch": 0.51, + "learning_rate": 0.00022348305593534163, + "loss": 0.0161, "step": 101110 }, { - "epoch": 1.09, - "learning_rate": 0.0001360251670234157, - "loss": 0.0081, + "epoch": 0.51, + "learning_rate": 0.00022347548824232761, + "loss": 0.0133, "step": 101120 }, { - "epoch": 1.09, - "learning_rate": 0.0001360089511578128, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.0002234679205493136, + "loss": 0.0164, "step": 101130 }, { - "epoch": 1.09, - "learning_rate": 0.00013599273529220989, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.0002234603528562996, + "loss": 0.0149, "step": 101140 }, { - "epoch": 1.09, - "learning_rate": 0.00013597651942660698, - "loss": 0.0122, + "epoch": 0.51, + "learning_rate": 0.00022345278516328559, + "loss": 0.0146, "step": 101150 }, { - "epoch": 1.09, - "learning_rate": 0.00013596030356100407, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022344521747027157, + "loss": 0.0147, "step": 101160 }, { - "epoch": 1.09, - "learning_rate": 0.00013594408769540116, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022343764977725758, + "loss": 0.0145, "step": 101170 }, { - "epoch": 1.09, - "learning_rate": 0.00013592787182979826, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.00022343008208424353, + "loss": 0.0172, "step": 101180 }, { - "epoch": 1.09, - "learning_rate": 0.00013591165596419535, - "loss": 0.0125, + "epoch": 0.51, + "learning_rate": 0.0002234225143912295, + "loss": 0.0138, "step": 101190 }, { - "epoch": 1.09, - "learning_rate": 0.00013589544009859244, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.0002234149466982155, + "loss": 0.0153, "step": 101200 }, { - "epoch": 1.09, - "learning_rate": 0.00013587922423298954, - "loss": 0.0084, + "epoch": 0.51, + "learning_rate": 0.0002234073790052015, + "loss": 0.0155, "step": 101210 }, { - "epoch": 1.09, - "learning_rate": 0.00013586300836738663, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022339981131218748, + "loss": 0.0124, "step": 101220 }, { - "epoch": 1.09, - "learning_rate": 0.00013584679250178375, - "loss": 0.0146, + "epoch": 0.51, + "learning_rate": 0.00022339224361917346, + "loss": 0.0125, "step": 101230 }, { - "epoch": 1.09, - "learning_rate": 0.0001358305766361808, - "loss": 0.01, + "epoch": 0.51, + "learning_rate": 0.00022338467592615947, + "loss": 0.0152, "step": 101240 }, { - "epoch": 1.09, - "learning_rate": 0.00013581436077057793, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022337710823314545, + "loss": 0.0146, "step": 101250 }, { - "epoch": 1.09, - "learning_rate": 0.000135798144904975, - "loss": 0.0125, + "epoch": 0.51, + "learning_rate": 0.00022336954054013144, + "loss": 0.0158, "step": 101260 }, { - "epoch": 1.09, - "learning_rate": 0.00013578192903937212, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.00022336197284711744, + "loss": 0.0157, "step": 101270 }, { - "epoch": 1.09, - "learning_rate": 0.00013576571317376918, - "loss": 0.0079, + "epoch": 0.51, + "learning_rate": 0.00022335440515410343, + "loss": 0.0123, "step": 101280 }, { - "epoch": 1.09, - "learning_rate": 0.0001357494973081663, - "loss": 0.012, + "epoch": 0.51, + "learning_rate": 0.0002233468374610894, + "loss": 0.0158, "step": 101290 }, { - "epoch": 1.1, - "learning_rate": 0.0001357332814425634, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.0002233392697680754, + "loss": 0.0153, "step": 101300 }, { - "epoch": 1.1, - "learning_rate": 0.0001357170655769605, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.0002233317020750614, + "loss": 0.0169, "step": 101310 }, { - "epoch": 1.1, - "learning_rate": 0.00013570084971135758, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022332413438204738, + "loss": 0.0219, "step": 101320 }, { - "epoch": 1.1, - "learning_rate": 0.00013568463384575468, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.00022331656668903336, + "loss": 0.0145, "step": 101330 }, { - "epoch": 1.1, - "learning_rate": 0.00013566841798015177, - "loss": 0.0104, + "epoch": 0.51, + "learning_rate": 0.00022330899899601937, + "loss": 0.0162, "step": 101340 }, { - "epoch": 1.1, - "learning_rate": 0.00013565220211454886, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.00022330143130300535, + "loss": 0.0124, "step": 101350 }, { - "epoch": 1.1, - "learning_rate": 0.00013563598624894595, - "loss": 0.0134, + "epoch": 0.51, + "learning_rate": 0.00022329386360999133, + "loss": 0.0125, "step": 101360 }, { - "epoch": 1.1, - "learning_rate": 0.00013561977038334305, - "loss": 0.0116, + "epoch": 0.51, + "learning_rate": 0.00022328629591697734, + "loss": 0.0153, "step": 101370 }, { - "epoch": 1.1, - "learning_rate": 0.00013560355451774014, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.00022327872822396332, + "loss": 0.0144, "step": 101380 }, { - "epoch": 1.1, - "learning_rate": 0.00013558733865213723, - "loss": 0.0084, + "epoch": 0.51, + "learning_rate": 0.0002232711605309493, + "loss": 0.0207, "step": 101390 }, { - "epoch": 1.1, - "learning_rate": 0.00013557112278653432, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.0002232635928379353, + "loss": 0.0154, "step": 101400 }, { - "epoch": 1.1, - "learning_rate": 0.00013555490692093142, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.0002232560251449213, + "loss": 0.0133, "step": 101410 }, { - "epoch": 1.1, - "learning_rate": 0.0001355386910553285, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022324845745190727, + "loss": 0.0153, "step": 101420 }, { - "epoch": 1.1, - "learning_rate": 0.0001355224751897256, - "loss": 0.0105, + "epoch": 0.51, + "learning_rate": 0.00022324088975889328, + "loss": 0.0181, "step": 101430 }, { - "epoch": 1.1, - "learning_rate": 0.00013550625932412272, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.00022323332206587926, + "loss": 0.0198, "step": 101440 }, { - "epoch": 1.1, - "learning_rate": 0.00013549004345851982, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022322575437286525, + "loss": 0.0147, "step": 101450 }, { - "epoch": 1.1, - "learning_rate": 0.0001354738275929169, - "loss": 0.0105, + "epoch": 0.51, + "learning_rate": 0.00022321818667985125, + "loss": 0.0171, "step": 101460 }, { - "epoch": 1.1, - "learning_rate": 0.000135457611727314, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.00022321061898683724, + "loss": 0.0182, "step": 101470 }, { - "epoch": 1.1, - "learning_rate": 0.0001354413958617111, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022320305129382322, + "loss": 0.0147, "step": 101480 }, { - "epoch": 1.1, - "learning_rate": 0.00013542517999610819, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.0002231954836008092, + "loss": 0.0152, "step": 101490 }, { - "epoch": 1.1, - "learning_rate": 0.00013540896413050528, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.0002231879159077952, + "loss": 0.0168, "step": 101500 }, { - "epoch": 1.1, - "learning_rate": 0.00013539274826490237, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.0002231803482147812, + "loss": 0.0165, "step": 101510 }, { - "epoch": 1.1, - "learning_rate": 0.00013537653239929946, - "loss": 0.0085, + "epoch": 0.51, + "learning_rate": 0.00022317278052176717, + "loss": 0.0142, "step": 101520 }, { - "epoch": 1.1, - "learning_rate": 0.00013536031653369656, - "loss": 0.0122, + "epoch": 0.51, + "learning_rate": 0.00022316521282875318, + "loss": 0.0134, "step": 101530 }, { - "epoch": 1.1, - "learning_rate": 0.00013534410066809365, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022315764513573916, + "loss": 0.0169, "step": 101540 }, { - "epoch": 1.1, - "learning_rate": 0.00013532788480249074, - "loss": 0.0105, + "epoch": 0.51, + "learning_rate": 0.00022315007744272514, + "loss": 0.0154, "step": 101550 }, { - "epoch": 1.1, - "learning_rate": 0.00013531166893688784, - "loss": 0.0123, + "epoch": 0.51, + "learning_rate": 0.00022314250974971115, + "loss": 0.0188, "step": 101560 }, { - "epoch": 1.1, - "learning_rate": 0.00013529545307128493, - "loss": 0.0091, + "epoch": 0.51, + "learning_rate": 0.00022313494205669713, + "loss": 0.0159, "step": 101570 }, { - "epoch": 1.1, - "learning_rate": 0.00013527923720568202, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.0002231273743636831, + "loss": 0.0193, "step": 101580 }, { - "epoch": 1.1, - "learning_rate": 0.0001352630213400791, - "loss": 0.01, + "epoch": 0.51, + "learning_rate": 0.00022311980667066912, + "loss": 0.0147, "step": 101590 }, { - "epoch": 1.1, - "learning_rate": 0.00013524680547447623, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.0002231122389776551, + "loss": 0.0205, "step": 101600 }, { - "epoch": 1.1, - "learning_rate": 0.0001352305896088733, - "loss": 0.0117, + "epoch": 0.51, + "learning_rate": 0.00022310467128464108, + "loss": 0.0143, "step": 101610 }, { - "epoch": 1.1, - "learning_rate": 0.00013521437374327042, - "loss": 0.0119, + "epoch": 0.51, + "learning_rate": 0.0002230971035916271, + "loss": 0.0144, "step": 101620 }, { - "epoch": 1.1, - "learning_rate": 0.00013519815787766748, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.00022308953589861307, + "loss": 0.0148, "step": 101630 }, { - "epoch": 1.1, - "learning_rate": 0.0001351819420120646, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.00022308196820559906, + "loss": 0.0162, "step": 101640 }, { - "epoch": 1.1, - "learning_rate": 0.0001351657261464617, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022307440051258504, + "loss": 0.018, "step": 101650 }, { - "epoch": 1.1, - "learning_rate": 0.0001351495102808588, - "loss": 0.0095, + "epoch": 0.51, + "learning_rate": 0.00022306683281957105, + "loss": 0.0131, "step": 101660 }, { - "epoch": 1.1, - "learning_rate": 0.00013513329441525588, - "loss": 0.0088, + "epoch": 0.51, + "learning_rate": 0.00022305926512655703, + "loss": 0.0148, "step": 101670 }, { - "epoch": 1.1, - "learning_rate": 0.00013511707854965298, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.000223051697433543, + "loss": 0.015, "step": 101680 }, { - "epoch": 1.1, - "learning_rate": 0.00013510086268405007, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.00022304412974052902, + "loss": 0.0176, "step": 101690 }, { - "epoch": 1.1, - "learning_rate": 0.00013508464681844716, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.000223036562047515, + "loss": 0.0174, "step": 101700 }, { - "epoch": 1.1, - "learning_rate": 0.00013506843095284425, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.00022302899435450098, + "loss": 0.0174, "step": 101710 }, { - "epoch": 1.1, - "learning_rate": 0.00013505221508724135, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.000223021426661487, + "loss": 0.0142, "step": 101720 }, { - "epoch": 1.1, - "learning_rate": 0.00013503599922163844, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.00022301385896847297, + "loss": 0.0143, "step": 101730 }, { - "epoch": 1.1, - "learning_rate": 0.00013501978335603553, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.00022300629127545895, + "loss": 0.0193, "step": 101740 }, { - "epoch": 1.1, - "learning_rate": 0.00013500356749043262, - "loss": 0.0125, + "epoch": 0.51, + "learning_rate": 0.00022299872358244496, + "loss": 0.0144, "step": 101750 }, { - "epoch": 1.1, - "learning_rate": 0.00013498735162482972, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.00022299115588943094, + "loss": 0.016, "step": 101760 }, { - "epoch": 1.1, - "learning_rate": 0.0001349711357592268, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.00022298358819641692, + "loss": 0.0147, "step": 101770 }, { - "epoch": 1.1, - "learning_rate": 0.0001349549198936239, - "loss": 0.0092, + "epoch": 0.51, + "learning_rate": 0.00022297602050340293, + "loss": 0.0142, "step": 101780 }, { - "epoch": 1.1, - "learning_rate": 0.000134938704028021, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.0002229684528103889, + "loss": 0.0119, "step": 101790 }, { - "epoch": 1.1, - "learning_rate": 0.00013492248816241812, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.0002229608851173749, + "loss": 0.0143, "step": 101800 }, { - "epoch": 1.1, - "learning_rate": 0.00013490627229681518, - "loss": 0.0089, + "epoch": 0.51, + "learning_rate": 0.00022295331742436088, + "loss": 0.0134, "step": 101810 }, { - "epoch": 1.1, - "learning_rate": 0.0001348900564312123, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.00022294574973134688, + "loss": 0.0136, "step": 101820 }, { - "epoch": 1.1, - "learning_rate": 0.00013487384056560937, - "loss": 0.0116, + "epoch": 0.51, + "learning_rate": 0.00022293818203833287, + "loss": 0.0145, "step": 101830 }, { - "epoch": 1.1, - "learning_rate": 0.00013485762470000649, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.00022293061434531885, + "loss": 0.0158, "step": 101840 }, { - "epoch": 1.1, - "learning_rate": 0.00013484140883440355, - "loss": 0.0127, + "epoch": 0.51, + "learning_rate": 0.00022292304665230486, + "loss": 0.0152, "step": 101850 }, { - "epoch": 1.1, - "learning_rate": 0.00013482519296880067, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.00022291547895929084, + "loss": 0.0188, "step": 101860 }, { - "epoch": 1.1, - "learning_rate": 0.00013480897710319776, - "loss": 0.0088, + "epoch": 0.51, + "learning_rate": 0.00022290791126627682, + "loss": 0.0135, "step": 101870 }, { - "epoch": 1.1, - "learning_rate": 0.00013479276123759486, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022290034357326283, + "loss": 0.0136, "step": 101880 }, { - "epoch": 1.1, - "learning_rate": 0.00013477654537199195, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.0002228927758802488, + "loss": 0.0166, "step": 101890 }, { - "epoch": 1.1, - "learning_rate": 0.00013476032950638904, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.0002228852081872348, + "loss": 0.016, "step": 101900 }, { - "epoch": 1.1, - "learning_rate": 0.00013474411364078614, - "loss": 0.0137, + "epoch": 0.51, + "learning_rate": 0.0002228776404942208, + "loss": 0.0161, "step": 101910 }, { - "epoch": 1.1, - "learning_rate": 0.00013472789777518323, - "loss": 0.0133, + "epoch": 0.51, + "learning_rate": 0.00022287007280120678, + "loss": 0.0154, "step": 101920 }, { - "epoch": 1.1, - "learning_rate": 0.00013471168190958032, - "loss": 0.0084, + "epoch": 0.51, + "learning_rate": 0.00022286250510819276, + "loss": 0.0179, "step": 101930 }, { - "epoch": 1.1, - "learning_rate": 0.00013469546604397741, - "loss": 0.0119, + "epoch": 0.51, + "learning_rate": 0.00022285493741517877, + "loss": 0.0133, "step": 101940 }, { - "epoch": 1.1, - "learning_rate": 0.0001346792501783745, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.00022284736972216475, + "loss": 0.0145, "step": 101950 }, { - "epoch": 1.1, - "learning_rate": 0.0001346630343127716, - "loss": 0.0084, + "epoch": 0.51, + "learning_rate": 0.00022283980202915073, + "loss": 0.0141, "step": 101960 }, { - "epoch": 1.1, - "learning_rate": 0.0001346468184471687, - "loss": 0.0083, + "epoch": 0.51, + "learning_rate": 0.00022283223433613671, + "loss": 0.0124, "step": 101970 }, { - "epoch": 1.1, - "learning_rate": 0.00013463060258156578, - "loss": 0.0089, + "epoch": 0.51, + "learning_rate": 0.00022282466664312272, + "loss": 0.0195, "step": 101980 }, { - "epoch": 1.1, - "learning_rate": 0.00013461438671596288, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.0002228170989501087, + "loss": 0.0167, "step": 101990 }, { - "epoch": 1.1, - "learning_rate": 0.00013459817085035997, - "loss": 0.0085, + "epoch": 0.51, + "learning_rate": 0.00022280953125709469, + "loss": 0.0192, "step": 102000 }, { - "epoch": 1.1, - "eval_cer": 0.921579050686457, - "eval_loss": 0.008401263505220413, - "eval_runtime": 121.0675, - "eval_samples_per_second": 16.52, - "eval_steps_per_second": 4.13, + "epoch": 0.51, + "eval_cer": 0.9145119829365546, + "eval_loss": 0.01138813141733408, + "eval_runtime": 116.604, + "eval_samples_per_second": 17.152, + "eval_steps_per_second": 4.288, "step": 102000 }, { - "epoch": 1.1, - "learning_rate": 0.00013458195498475706, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.0002228019635640807, + "loss": 0.0137, "step": 102010 }, { - "epoch": 1.1, - "learning_rate": 0.00013456573911915418, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022279439587106668, + "loss": 0.0162, "step": 102020 }, { - "epoch": 1.1, - "learning_rate": 0.00013454952325355125, - "loss": 0.0119, + "epoch": 0.51, + "learning_rate": 0.00022278682817805266, + "loss": 0.0133, "step": 102030 }, { - "epoch": 1.1, - "learning_rate": 0.00013453330738794837, - "loss": 0.0092, + "epoch": 0.51, + "learning_rate": 0.00022277926048503867, + "loss": 0.0145, "step": 102040 }, { - "epoch": 1.1, - "learning_rate": 0.00013451709152234543, - "loss": 0.0091, + "epoch": 0.51, + "learning_rate": 0.00022277169279202465, + "loss": 0.0159, "step": 102050 }, { - "epoch": 1.1, - "learning_rate": 0.00013450087565674255, - "loss": 0.0131, + "epoch": 0.51, + "learning_rate": 0.00022276412509901063, + "loss": 0.0133, "step": 102060 }, { - "epoch": 1.1, - "learning_rate": 0.00013448465979113962, - "loss": 0.0104, + "epoch": 0.51, + "learning_rate": 0.00022275655740599664, + "loss": 0.0162, "step": 102070 }, { - "epoch": 1.1, - "learning_rate": 0.00013446844392553674, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.00022274898971298262, + "loss": 0.0128, "step": 102080 }, { - "epoch": 1.1, - "learning_rate": 0.00013445222805993383, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.0002227414220199686, + "loss": 0.0179, "step": 102090 }, { - "epoch": 1.1, - "learning_rate": 0.00013443601219433092, - "loss": 0.0114, + "epoch": 0.52, + "learning_rate": 0.0002227338543269546, + "loss": 0.015, "step": 102100 }, { - "epoch": 1.1, - "learning_rate": 0.00013441979632872802, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.0002227262866339406, + "loss": 0.0145, "step": 102110 }, { - "epoch": 1.1, - "learning_rate": 0.0001344035804631251, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022271871894092657, + "loss": 0.0146, "step": 102120 }, { - "epoch": 1.1, - "learning_rate": 0.0001343873645975222, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022271115124791258, + "loss": 0.0182, "step": 102130 }, { - "epoch": 1.1, - "learning_rate": 0.0001343711487319193, - "loss": 0.0088, + "epoch": 0.52, + "learning_rate": 0.00022270358355489856, + "loss": 0.0148, "step": 102140 }, { - "epoch": 1.1, - "learning_rate": 0.0001343549328663164, - "loss": 0.0104, + "epoch": 0.52, + "learning_rate": 0.00022269601586188454, + "loss": 0.0123, "step": 102150 }, { - "epoch": 1.1, - "learning_rate": 0.00013433871700071348, - "loss": 0.0088, + "epoch": 0.52, + "learning_rate": 0.00022268844816887052, + "loss": 0.0175, "step": 102160 }, { - "epoch": 1.1, - "learning_rate": 0.0001343225011351106, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.00022268088047585653, + "loss": 0.0134, "step": 102170 }, { - "epoch": 1.1, - "learning_rate": 0.00013430628526950767, - "loss": 0.008, + "epoch": 0.52, + "learning_rate": 0.00022267331278284251, + "loss": 0.016, "step": 102180 }, { - "epoch": 1.1, - "learning_rate": 0.0001342900694039048, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.0002226657450898285, + "loss": 0.014, "step": 102190 }, { - "epoch": 1.1, - "learning_rate": 0.00013427385353830185, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.0002226581773968145, + "loss": 0.0111, "step": 102200 }, { - "epoch": 1.1, - "learning_rate": 0.00013425763767269897, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022265060970380049, + "loss": 0.0173, "step": 102210 }, { - "epoch": 1.11, - "learning_rate": 0.00013424142180709604, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022264304201078647, + "loss": 0.017, "step": 102220 }, { - "epoch": 1.11, - "learning_rate": 0.00013422520594149316, - "loss": 0.0138, + "epoch": 0.52, + "learning_rate": 0.00022263547431777248, + "loss": 0.0149, "step": 102230 }, { - "epoch": 1.11, - "learning_rate": 0.00013420899007589025, - "loss": 0.01, + "epoch": 0.52, + "learning_rate": 0.00022262790662475846, + "loss": 0.0152, "step": 102240 }, { - "epoch": 1.11, - "learning_rate": 0.00013419277421028734, - "loss": 0.0147, + "epoch": 0.52, + "learning_rate": 0.00022262033893174444, + "loss": 0.0172, "step": 102250 }, { - "epoch": 1.11, - "learning_rate": 0.00013417655834468444, - "loss": 0.0104, + "epoch": 0.52, + "learning_rate": 0.00022261277123873045, + "loss": 0.0135, "step": 102260 }, { - "epoch": 1.11, - "learning_rate": 0.00013416034247908153, - "loss": 0.01, + "epoch": 0.52, + "learning_rate": 0.00022260520354571643, + "loss": 0.0133, "step": 102270 }, { - "epoch": 1.11, - "learning_rate": 0.00013414412661347862, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.0002225976358527024, + "loss": 0.0167, "step": 102280 }, { - "epoch": 1.11, - "learning_rate": 0.00013412791074787571, - "loss": 0.0114, + "epoch": 0.52, + "learning_rate": 0.00022259006815968842, + "loss": 0.0186, "step": 102290 }, { - "epoch": 1.11, - "learning_rate": 0.0001341116948822728, - "loss": 0.0122, + "epoch": 0.52, + "learning_rate": 0.0002225825004666744, + "loss": 0.0169, "step": 102300 }, { - "epoch": 1.11, - "learning_rate": 0.0001340954790166699, - "loss": 0.0108, + "epoch": 0.52, + "learning_rate": 0.00022257493277366038, + "loss": 0.0156, "step": 102310 }, { - "epoch": 1.11, - "learning_rate": 0.000134079263151067, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022256736508064636, + "loss": 0.0163, "step": 102320 }, { - "epoch": 1.11, - "learning_rate": 0.00013406304728546408, - "loss": 0.01, + "epoch": 0.52, + "learning_rate": 0.00022255979738763237, + "loss": 0.0146, "step": 102330 }, { - "epoch": 1.11, - "learning_rate": 0.00013404683141986118, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022255222969461835, + "loss": 0.0174, "step": 102340 }, { - "epoch": 1.11, - "learning_rate": 0.00013403061555425827, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022254466200160433, + "loss": 0.0162, "step": 102350 }, { - "epoch": 1.11, - "learning_rate": 0.00013401439968865536, - "loss": 0.0124, + "epoch": 0.52, + "learning_rate": 0.00022253709430859034, + "loss": 0.0138, "step": 102360 }, { - "epoch": 1.11, - "learning_rate": 0.00013399818382305246, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.00022252952661557632, + "loss": 0.0161, "step": 102370 }, { - "epoch": 1.11, - "learning_rate": 0.00013398196795744955, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.0002225219589225623, + "loss": 0.0181, "step": 102380 }, { - "epoch": 1.11, - "learning_rate": 0.00013396575209184667, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022251439122954831, + "loss": 0.0213, "step": 102390 }, { - "epoch": 1.11, - "learning_rate": 0.00013394953622624373, - "loss": 0.0145, + "epoch": 0.52, + "learning_rate": 0.0002225068235365343, + "loss": 0.0141, "step": 102400 }, { - "epoch": 1.11, - "learning_rate": 0.00013393332036064085, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.00022249925584352028, + "loss": 0.0218, "step": 102410 }, { - "epoch": 1.11, - "learning_rate": 0.00013391710449503792, - "loss": 0.012, + "epoch": 0.52, + "learning_rate": 0.00022249168815050629, + "loss": 0.0169, "step": 102420 }, { - "epoch": 1.11, - "learning_rate": 0.00013390088862943504, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022248412045749227, + "loss": 0.0152, "step": 102430 }, { - "epoch": 1.11, - "learning_rate": 0.0001338846727638321, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022247655276447822, + "loss": 0.0142, "step": 102440 }, { - "epoch": 1.11, - "learning_rate": 0.00013386845689822922, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.0002224689850714642, + "loss": 0.0187, "step": 102450 }, { - "epoch": 1.11, - "learning_rate": 0.00013385224103262632, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.0002224614173784502, + "loss": 0.0159, "step": 102460 }, { - "epoch": 1.11, - "learning_rate": 0.0001338360251670234, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.0002224538496854362, + "loss": 0.0148, "step": 102470 }, { - "epoch": 1.11, - "learning_rate": 0.0001338198093014205, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.00022244628199242217, + "loss": 0.0145, "step": 102480 }, { - "epoch": 1.11, - "learning_rate": 0.0001338035934358176, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.00022243871429940818, + "loss": 0.014, "step": 102490 }, { - "epoch": 1.11, - "learning_rate": 0.0001337873775702147, - "loss": 0.0132, + "epoch": 0.52, + "learning_rate": 0.00022243114660639416, + "loss": 0.0149, "step": 102500 }, { - "epoch": 1.11, - "learning_rate": 0.00013377116170461178, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.00022242357891338015, + "loss": 0.0132, "step": 102510 }, { - "epoch": 1.11, - "learning_rate": 0.00013375494583900887, - "loss": 0.0123, + "epoch": 0.52, + "learning_rate": 0.00022241601122036615, + "loss": 0.0168, "step": 102520 }, { - "epoch": 1.11, - "learning_rate": 0.00013373872997340597, - "loss": 0.0084, + "epoch": 0.52, + "learning_rate": 0.00022240844352735214, + "loss": 0.0139, "step": 102530 }, { - "epoch": 1.11, - "learning_rate": 0.00013372251410780306, - "loss": 0.008, + "epoch": 0.52, + "learning_rate": 0.00022240087583433812, + "loss": 0.0145, "step": 102540 }, { - "epoch": 1.11, - "learning_rate": 0.00013370629824220015, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.0002223933081413241, + "loss": 0.0173, "step": 102550 }, { - "epoch": 1.11, - "learning_rate": 0.00013369008237659725, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.0002223857404483101, + "loss": 0.0205, "step": 102560 }, { - "epoch": 1.11, - "learning_rate": 0.00013367386651099434, - "loss": 0.0115, + "epoch": 0.52, + "learning_rate": 0.0002223781727552961, + "loss": 0.0146, "step": 102570 }, { - "epoch": 1.11, - "learning_rate": 0.00013365765064539143, - "loss": 0.0121, + "epoch": 0.52, + "learning_rate": 0.00022237060506228207, + "loss": 0.0136, "step": 102580 }, { - "epoch": 1.11, - "learning_rate": 0.00013364143477978852, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.00022236303736926808, + "loss": 0.0149, "step": 102590 }, { - "epoch": 1.11, - "learning_rate": 0.00013362521891418562, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022235546967625406, + "loss": 0.0143, "step": 102600 }, { - "epoch": 1.11, - "learning_rate": 0.00013360900304858274, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022234790198324004, + "loss": 0.0159, "step": 102610 }, { - "epoch": 1.11, - "learning_rate": 0.0001335927871829798, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.00022234033429022605, + "loss": 0.0169, "step": 102620 }, { - "epoch": 1.11, - "learning_rate": 0.00013357657131737692, - "loss": 0.0113, + "epoch": 0.52, + "learning_rate": 0.00022233276659721203, + "loss": 0.0129, "step": 102630 }, { - "epoch": 1.11, - "learning_rate": 0.000133560355451774, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.000222325198904198, + "loss": 0.0146, "step": 102640 }, { - "epoch": 1.11, - "learning_rate": 0.0001335441395861711, - "loss": 0.0116, + "epoch": 0.52, + "learning_rate": 0.00022231763121118402, + "loss": 0.0179, "step": 102650 }, { - "epoch": 1.11, - "learning_rate": 0.0001335279237205682, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.00022231006351817, + "loss": 0.0157, "step": 102660 }, { - "epoch": 1.11, - "learning_rate": 0.0001335117078549653, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022230249582515598, + "loss": 0.0201, "step": 102670 }, { - "epoch": 1.11, - "learning_rate": 0.00013349549198936239, - "loss": 0.0084, + "epoch": 0.52, + "learning_rate": 0.000222294928132142, + "loss": 0.0174, "step": 102680 }, { - "epoch": 1.11, - "learning_rate": 0.00013347927612375948, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022228736043912797, + "loss": 0.0153, "step": 102690 }, { - "epoch": 1.11, - "learning_rate": 0.00013346306025815657, - "loss": 0.0122, + "epoch": 0.52, + "learning_rate": 0.00022227979274611396, + "loss": 0.0131, "step": 102700 }, { - "epoch": 1.11, - "learning_rate": 0.00013344684439255366, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.00022227222505309994, + "loss": 0.0157, "step": 102710 }, { - "epoch": 1.11, - "learning_rate": 0.00013343062852695076, - "loss": 0.0121, + "epoch": 0.52, + "learning_rate": 0.00022226465736008595, + "loss": 0.0172, "step": 102720 }, { - "epoch": 1.11, - "learning_rate": 0.00013341441266134785, - "loss": 0.0124, + "epoch": 0.52, + "learning_rate": 0.00022225708966707193, + "loss": 0.0176, "step": 102730 }, { - "epoch": 1.11, - "learning_rate": 0.00013339819679574494, - "loss": 0.0132, + "epoch": 0.52, + "learning_rate": 0.0002222495219740579, + "loss": 0.0145, "step": 102740 }, { - "epoch": 1.11, - "learning_rate": 0.00013338198093014203, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022224195428104392, + "loss": 0.0181, "step": 102750 }, { - "epoch": 1.11, - "learning_rate": 0.00013336576506453913, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.0002222343865880299, + "loss": 0.0167, "step": 102760 }, { - "epoch": 1.11, - "learning_rate": 0.00013334954919893622, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022222681889501588, + "loss": 0.0166, "step": 102770 }, { - "epoch": 1.11, - "learning_rate": 0.0001333333333333333, - "loss": 0.0134, + "epoch": 0.52, + "learning_rate": 0.0002222192512020019, + "loss": 0.0138, "step": 102780 }, { - "epoch": 1.11, - "learning_rate": 0.0001333171174677304, - "loss": 0.0084, + "epoch": 0.52, + "learning_rate": 0.00022221168350898787, + "loss": 0.0157, "step": 102790 }, { - "epoch": 1.11, - "learning_rate": 0.0001333009016021275, - "loss": 0.0118, + "epoch": 0.52, + "learning_rate": 0.00022220411581597385, + "loss": 0.0216, "step": 102800 }, { - "epoch": 1.11, - "learning_rate": 0.00013328468573652462, - "loss": 0.0088, + "epoch": 0.52, + "learning_rate": 0.00022219654812295986, + "loss": 0.0148, "step": 102810 }, { - "epoch": 1.11, - "learning_rate": 0.00013326846987092168, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022218898042994584, + "loss": 0.0175, "step": 102820 }, { - "epoch": 1.11, - "learning_rate": 0.0001332522540053188, - "loss": 0.0113, + "epoch": 0.52, + "learning_rate": 0.00022218141273693182, + "loss": 0.0178, "step": 102830 }, { - "epoch": 1.11, - "learning_rate": 0.00013323603813971587, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022217384504391783, + "loss": 0.0176, "step": 102840 }, { - "epoch": 1.11, - "learning_rate": 0.000133219822274113, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.0002221662773509038, + "loss": 0.0142, "step": 102850 }, { - "epoch": 1.11, - "learning_rate": 0.00013320360640851008, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.0002221587096578898, + "loss": 0.0157, "step": 102860 }, { - "epoch": 1.11, - "learning_rate": 0.00013318739054290717, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022215114196487578, + "loss": 0.0124, "step": 102870 }, { - "epoch": 1.11, - "learning_rate": 0.00013317117467730427, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022214357427186178, + "loss": 0.0156, "step": 102880 }, { - "epoch": 1.11, - "learning_rate": 0.00013315495881170136, - "loss": 0.0115, + "epoch": 0.52, + "learning_rate": 0.00022213600657884777, + "loss": 0.0133, "step": 102890 }, { - "epoch": 1.11, - "learning_rate": 0.00013313874294609845, - "loss": 0.0116, + "epoch": 0.52, + "learning_rate": 0.00022212843888583375, + "loss": 0.0142, "step": 102900 }, { - "epoch": 1.11, - "learning_rate": 0.00013312252708049555, - "loss": 0.012, + "epoch": 0.52, + "learning_rate": 0.00022212087119281976, + "loss": 0.018, "step": 102910 }, { - "epoch": 1.11, - "learning_rate": 0.00013310631121489264, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022211330349980574, + "loss": 0.016, "step": 102920 }, { - "epoch": 1.11, - "learning_rate": 0.00013309009534928973, - "loss": 0.0126, + "epoch": 0.52, + "learning_rate": 0.00022210573580679172, + "loss": 0.0134, "step": 102930 }, { - "epoch": 1.11, - "learning_rate": 0.00013307387948368682, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022209816811377773, + "loss": 0.0178, "step": 102940 }, { - "epoch": 1.11, - "learning_rate": 0.00013305766361808392, - "loss": 0.0118, + "epoch": 0.52, + "learning_rate": 0.0002220906004207637, + "loss": 0.0167, "step": 102950 }, { - "epoch": 1.11, - "learning_rate": 0.00013304144775248104, - "loss": 0.0104, + "epoch": 0.52, + "learning_rate": 0.0002220830327277497, + "loss": 0.0121, "step": 102960 }, { - "epoch": 1.11, - "learning_rate": 0.0001330252318868781, - "loss": 0.0122, + "epoch": 0.52, + "learning_rate": 0.0002220754650347357, + "loss": 0.0166, "step": 102970 }, { - "epoch": 1.11, - "learning_rate": 0.00013300901602127522, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022206789734172168, + "loss": 0.0175, "step": 102980 }, { - "epoch": 1.11, - "learning_rate": 0.0001329928001556723, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022206032964870766, + "loss": 0.0172, "step": 102990 }, { - "epoch": 1.11, - "learning_rate": 0.0001329765842900694, - "loss": 0.0123, + "epoch": 0.52, + "learning_rate": 0.00022205276195569367, + "loss": 0.0146, "step": 103000 }, { - "epoch": 1.11, - "eval_cer": 0.921526065906118, - "eval_loss": 0.008482340723276138, - "eval_runtime": 121.2993, - "eval_samples_per_second": 16.488, - "eval_steps_per_second": 4.122, + "epoch": 0.52, + "eval_cer": 0.9144828710527925, + "eval_loss": 0.011572513729333878, + "eval_runtime": 116.71, + "eval_samples_per_second": 17.136, + "eval_steps_per_second": 4.284, "step": 103000 }, { - "epoch": 1.11, - "learning_rate": 0.00013296036842446647, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.00022204519426267965, + "loss": 0.0157, "step": 103010 }, { - "epoch": 1.11, - "learning_rate": 0.0001329441525588636, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.00022203762656966563, + "loss": 0.0173, "step": 103020 }, { - "epoch": 1.11, - "learning_rate": 0.00013292793669326069, - "loss": 0.011, + "epoch": 0.52, + "learning_rate": 0.00022203005887665164, + "loss": 0.0147, "step": 103030 }, { - "epoch": 1.11, - "learning_rate": 0.00013291172082765778, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022202249118363762, + "loss": 0.0159, "step": 103040 }, { - "epoch": 1.11, - "learning_rate": 0.00013289550496205487, - "loss": 0.012, + "epoch": 0.52, + "learning_rate": 0.0002220149234906236, + "loss": 0.0166, "step": 103050 }, { - "epoch": 1.11, - "learning_rate": 0.00013287928909645196, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022200735579760959, + "loss": 0.0133, "step": 103060 }, { - "epoch": 1.11, - "learning_rate": 0.00013286307323084906, - "loss": 0.0084, + "epoch": 0.52, + "learning_rate": 0.0002219997881045956, + "loss": 0.019, "step": 103070 }, { - "epoch": 1.11, - "learning_rate": 0.00013284685736524615, - "loss": 0.0081, + "epoch": 0.52, + "learning_rate": 0.00022199222041158158, + "loss": 0.0156, "step": 103080 }, { - "epoch": 1.11, - "learning_rate": 0.00013283064149964324, - "loss": 0.0119, + "epoch": 0.52, + "learning_rate": 0.00022198465271856756, + "loss": 0.0138, "step": 103090 }, { - "epoch": 1.11, - "learning_rate": 0.00013281442563404033, - "loss": 0.0123, + "epoch": 0.52, + "learning_rate": 0.00022197708502555357, + "loss": 0.0165, "step": 103100 }, { - "epoch": 1.11, - "learning_rate": 0.00013279820976843743, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.00022196951733253955, + "loss": 0.0155, "step": 103110 }, { - "epoch": 1.11, - "learning_rate": 0.00013278199390283452, - "loss": 0.0124, + "epoch": 0.52, + "learning_rate": 0.00022196194963952553, + "loss": 0.0132, "step": 103120 }, { - "epoch": 1.11, - "learning_rate": 0.0001327657780372316, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022195438194651154, + "loss": 0.014, "step": 103130 }, { - "epoch": 1.11, - "learning_rate": 0.0001327495621716287, - "loss": 0.0104, + "epoch": 0.52, + "learning_rate": 0.00022194681425349752, + "loss": 0.0137, "step": 103140 }, { - "epoch": 1.12, - "learning_rate": 0.0001327333463060258, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.0002219392465604835, + "loss": 0.0151, "step": 103150 }, { - "epoch": 1.12, - "learning_rate": 0.0001327171304404229, - "loss": 0.0119, + "epoch": 0.52, + "learning_rate": 0.0002219316788674695, + "loss": 0.0145, "step": 103160 }, { - "epoch": 1.12, - "learning_rate": 0.00013270091457481998, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.0002219241111744555, + "loss": 0.0143, "step": 103170 }, { - "epoch": 1.12, - "learning_rate": 0.0001326846987092171, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.00022191654348144147, + "loss": 0.0154, "step": 103180 }, { - "epoch": 1.12, - "learning_rate": 0.00013266848284361417, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022190897578842748, + "loss": 0.0135, "step": 103190 }, { - "epoch": 1.12, - "learning_rate": 0.0001326522669780113, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022190140809541346, + "loss": 0.0154, "step": 103200 }, { - "epoch": 1.12, - "learning_rate": 0.00013263605111240835, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.00022189384040239944, + "loss": 0.0154, "step": 103210 }, { - "epoch": 1.12, - "learning_rate": 0.00013261983524680547, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.00022188627270938542, + "loss": 0.0158, "step": 103220 }, { - "epoch": 1.12, - "learning_rate": 0.00013260361938120254, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.00022187870501637143, + "loss": 0.0153, "step": 103230 }, { - "epoch": 1.12, - "learning_rate": 0.00013258740351559966, - "loss": 0.0104, + "epoch": 0.52, + "learning_rate": 0.00022187113732335741, + "loss": 0.0149, "step": 103240 }, { - "epoch": 1.12, - "learning_rate": 0.00013257118764999675, - "loss": 0.0119, + "epoch": 0.52, + "learning_rate": 0.0002218635696303434, + "loss": 0.0184, "step": 103250 }, { - "epoch": 1.12, - "learning_rate": 0.00013255497178439385, - "loss": 0.0128, + "epoch": 0.52, + "learning_rate": 0.0002218560019373294, + "loss": 0.0157, "step": 103260 }, { - "epoch": 1.12, - "learning_rate": 0.00013253875591879094, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.00022184843424431539, + "loss": 0.016, "step": 103270 }, { - "epoch": 1.12, - "learning_rate": 0.00013252254005318803, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022184086655130137, + "loss": 0.0157, "step": 103280 }, { - "epoch": 1.12, - "learning_rate": 0.00013250632418758512, - "loss": 0.0129, + "epoch": 0.52, + "learning_rate": 0.00022183329885828738, + "loss": 0.0153, "step": 103290 }, { - "epoch": 1.12, - "learning_rate": 0.00013249010832198222, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022182573116527336, + "loss": 0.0168, "step": 103300 }, { - "epoch": 1.12, - "learning_rate": 0.0001324738924563793, - "loss": 0.0114, + "epoch": 0.52, + "learning_rate": 0.00022181816347225934, + "loss": 0.0129, "step": 103310 }, { - "epoch": 1.12, - "learning_rate": 0.0001324576765907764, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022181059577924535, + "loss": 0.0168, "step": 103320 }, { - "epoch": 1.12, - "learning_rate": 0.0001324414607251735, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.00022180302808623133, + "loss": 0.0216, "step": 103330 }, { - "epoch": 1.12, - "learning_rate": 0.0001324252448595706, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.0002217954603932173, + "loss": 0.0155, "step": 103340 }, { - "epoch": 1.12, - "learning_rate": 0.00013240902899396768, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022178789270020332, + "loss": 0.0165, "step": 103350 }, { - "epoch": 1.12, - "learning_rate": 0.00013239281312836477, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.0002217803250071893, + "loss": 0.0133, "step": 103360 }, { - "epoch": 1.12, - "learning_rate": 0.00013237659726276187, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022177275731417528, + "loss": 0.0164, "step": 103370 }, { - "epoch": 1.12, - "learning_rate": 0.00013236038139715896, - "loss": 0.01, + "epoch": 0.52, + "learning_rate": 0.00022176518962116126, + "loss": 0.0176, "step": 103380 }, { - "epoch": 1.12, - "learning_rate": 0.00013234416553155605, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022175762192814727, + "loss": 0.0157, "step": 103390 }, { - "epoch": 1.12, - "learning_rate": 0.00013232794966595317, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022175005423513325, + "loss": 0.0166, "step": 103400 }, { - "epoch": 1.12, - "learning_rate": 0.00013231173380035024, - "loss": 0.0127, + "epoch": 0.52, + "learning_rate": 0.00022174248654211923, + "loss": 0.0134, "step": 103410 }, { - "epoch": 1.12, - "learning_rate": 0.00013229551793474736, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.00022173491884910524, + "loss": 0.0163, "step": 103420 }, { - "epoch": 1.12, - "learning_rate": 0.00013227930206914442, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022172735115609122, + "loss": 0.019, "step": 103430 }, { - "epoch": 1.12, - "learning_rate": 0.00013226308620354154, - "loss": 0.0148, + "epoch": 0.52, + "learning_rate": 0.0002217197834630772, + "loss": 0.0143, "step": 103440 }, { - "epoch": 1.12, - "learning_rate": 0.0001322468703379386, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.00022171221577006321, + "loss": 0.0175, "step": 103450 }, { - "epoch": 1.12, - "learning_rate": 0.00013223065447233573, - "loss": 0.0141, + "epoch": 0.52, + "learning_rate": 0.0002217046480770492, + "loss": 0.03, "step": 103460 }, { - "epoch": 1.12, - "learning_rate": 0.00013221443860673282, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.00022169708038403518, + "loss": 0.0142, "step": 103470 }, { - "epoch": 1.12, - "learning_rate": 0.0001321982227411299, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022168951269102119, + "loss": 0.0197, "step": 103480 }, { - "epoch": 1.12, - "learning_rate": 0.000132182006875527, - "loss": 0.0118, + "epoch": 0.52, + "learning_rate": 0.00022168194499800717, + "loss": 0.015, "step": 103490 }, { - "epoch": 1.12, - "learning_rate": 0.0001321657910099241, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.00022167437730499315, + "loss": 0.0146, "step": 103500 }, { - "epoch": 1.12, - "learning_rate": 0.0001321495751443212, - "loss": 0.0129, + "epoch": 0.52, + "learning_rate": 0.00022166680961197916, + "loss": 0.0138, "step": 103510 }, { - "epoch": 1.12, - "learning_rate": 0.00013213335927871828, - "loss": 0.0125, + "epoch": 0.52, + "learning_rate": 0.00022165924191896514, + "loss": 0.0151, "step": 103520 }, { - "epoch": 1.12, - "learning_rate": 0.00013211714341311538, - "loss": 0.0136, + "epoch": 0.52, + "learning_rate": 0.00022165167422595112, + "loss": 0.018, "step": 103530 }, { - "epoch": 1.12, - "learning_rate": 0.00013210092754751247, - "loss": 0.0127, + "epoch": 0.52, + "learning_rate": 0.00022164410653293713, + "loss": 0.0167, "step": 103540 }, { - "epoch": 1.12, - "learning_rate": 0.00013208471168190956, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.0002216365388399231, + "loss": 0.0158, "step": 103550 }, { - "epoch": 1.12, - "learning_rate": 0.00013206849581630666, - "loss": 0.01, + "epoch": 0.52, + "learning_rate": 0.0002216289711469091, + "loss": 0.0211, "step": 103560 }, { - "epoch": 1.12, - "learning_rate": 0.00013205227995070375, - "loss": 0.0129, + "epoch": 0.52, + "learning_rate": 0.00022162140345389507, + "loss": 0.0145, "step": 103570 }, { - "epoch": 1.12, - "learning_rate": 0.00013203606408510084, - "loss": 0.0123, + "epoch": 0.52, + "learning_rate": 0.00022161383576088108, + "loss": 0.0159, "step": 103580 }, { - "epoch": 1.12, - "learning_rate": 0.00013201984821949796, - "loss": 0.0104, + "epoch": 0.52, + "learning_rate": 0.00022160626806786706, + "loss": 0.0139, "step": 103590 }, { - "epoch": 1.12, - "learning_rate": 0.00013200363235389503, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022159870037485304, + "loss": 0.0145, "step": 103600 }, { - "epoch": 1.12, - "learning_rate": 0.00013198741648829215, - "loss": 0.0122, + "epoch": 0.52, + "learning_rate": 0.00022159113268183905, + "loss": 0.0156, "step": 103610 }, { - "epoch": 1.12, - "learning_rate": 0.00013197120062268924, - "loss": 0.0077, + "epoch": 0.52, + "learning_rate": 0.00022158356498882503, + "loss": 0.0138, "step": 103620 }, { - "epoch": 1.12, - "learning_rate": 0.00013195498475708633, - "loss": 0.0142, + "epoch": 0.52, + "learning_rate": 0.00022157599729581102, + "loss": 0.02, "step": 103630 }, { - "epoch": 1.12, - "learning_rate": 0.00013193876889148342, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.00022156842960279702, + "loss": 0.0142, "step": 103640 }, { - "epoch": 1.12, - "learning_rate": 0.00013192255302588052, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.000221560861909783, + "loss": 0.0153, "step": 103650 }, { - "epoch": 1.12, - "learning_rate": 0.0001319063371602776, - "loss": 0.0137, + "epoch": 0.52, + "learning_rate": 0.000221553294216769, + "loss": 0.0156, "step": 103660 }, { - "epoch": 1.12, - "learning_rate": 0.0001318901212946747, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.000221545726523755, + "loss": 0.0158, "step": 103670 }, { - "epoch": 1.12, - "learning_rate": 0.0001318739054290718, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022153815883074098, + "loss": 0.0144, "step": 103680 }, { - "epoch": 1.12, - "learning_rate": 0.0001318576895634689, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022153059113772696, + "loss": 0.0126, "step": 103690 }, { - "epoch": 1.12, - "learning_rate": 0.00013184147369786598, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.0002215230234447129, + "loss": 0.0229, "step": 103700 }, { - "epoch": 1.12, - "learning_rate": 0.00013182525783226307, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.00022151545575169892, + "loss": 0.016, "step": 103710 }, { - "epoch": 1.12, - "learning_rate": 0.00013180904196666017, - "loss": 0.0132, + "epoch": 0.52, + "learning_rate": 0.0002215078880586849, + "loss": 0.0139, "step": 103720 }, { - "epoch": 1.12, - "learning_rate": 0.00013179282610105726, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022150032036567088, + "loss": 0.0166, "step": 103730 }, { - "epoch": 1.12, - "learning_rate": 0.00013177661023545435, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.0002214927526726569, + "loss": 0.0151, "step": 103740 }, { - "epoch": 1.12, - "learning_rate": 0.00013176039436985144, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022148518497964287, + "loss": 0.0144, "step": 103750 }, { - "epoch": 1.12, - "learning_rate": 0.00013174417850424854, - "loss": 0.0115, + "epoch": 0.52, + "learning_rate": 0.00022147761728662886, + "loss": 0.0166, "step": 103760 }, { - "epoch": 1.12, - "learning_rate": 0.00013172796263864566, - "loss": 0.0122, + "epoch": 0.52, + "learning_rate": 0.00022147004959361484, + "loss": 0.0164, "step": 103770 }, { - "epoch": 1.12, - "learning_rate": 0.00013171174677304272, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.00022146248190060085, + "loss": 0.0161, "step": 103780 }, { - "epoch": 1.12, - "learning_rate": 0.00013169553090743984, - "loss": 0.0086, + "epoch": 0.52, + "learning_rate": 0.00022145491420758683, + "loss": 0.0156, "step": 103790 }, { - "epoch": 1.12, - "learning_rate": 0.0001316793150418369, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.0002214473465145728, + "loss": 0.0187, "step": 103800 }, { - "epoch": 1.12, - "learning_rate": 0.00013166309917623403, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022143977882155882, + "loss": 0.0165, "step": 103810 }, { - "epoch": 1.12, - "learning_rate": 0.00013164688331063112, - "loss": 0.0078, + "epoch": 0.52, + "learning_rate": 0.0002214322111285448, + "loss": 0.0166, "step": 103820 }, { - "epoch": 1.12, - "learning_rate": 0.0001316306674450282, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.00022142464343553078, + "loss": 0.015, "step": 103830 }, { - "epoch": 1.12, - "learning_rate": 0.0001316144515794253, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.0002214170757425168, + "loss": 0.0156, "step": 103840 }, { - "epoch": 1.12, - "learning_rate": 0.0001315982357138224, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022140950804950277, + "loss": 0.0167, "step": 103850 }, { - "epoch": 1.12, - "learning_rate": 0.0001315820198482195, - "loss": 0.0114, + "epoch": 0.52, + "learning_rate": 0.00022140194035648875, + "loss": 0.0155, "step": 103860 }, { - "epoch": 1.12, - "learning_rate": 0.00013156580398261658, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022139437266347476, + "loss": 0.0147, "step": 103870 }, { - "epoch": 1.12, - "learning_rate": 0.00013154958811701368, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.00022138680497046074, + "loss": 0.0185, "step": 103880 }, { - "epoch": 1.12, - "learning_rate": 0.00013153337225141077, - "loss": 0.0112, + "epoch": 0.52, + "learning_rate": 0.00022137923727744672, + "loss": 0.0142, "step": 103890 }, { - "epoch": 1.12, - "learning_rate": 0.00013151715638580786, - "loss": 0.0115, + "epoch": 0.52, + "learning_rate": 0.00022137166958443273, + "loss": 0.0156, "step": 103900 }, { - "epoch": 1.12, - "learning_rate": 0.00013150094052020496, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.0002213641018914187, + "loss": 0.0155, "step": 103910 }, { - "epoch": 1.12, - "learning_rate": 0.00013148472465460205, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.0002213565341984047, + "loss": 0.0129, "step": 103920 }, { - "epoch": 1.12, - "learning_rate": 0.00013146850878899914, - "loss": 0.0123, + "epoch": 0.52, + "learning_rate": 0.0002213489665053907, + "loss": 0.0154, "step": 103930 }, { - "epoch": 1.12, - "learning_rate": 0.00013145229292339623, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022134139881237668, + "loss": 0.0125, "step": 103940 }, { - "epoch": 1.12, - "learning_rate": 0.00013143607705779333, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.00022133383111936267, + "loss": 0.0165, "step": 103950 }, { - "epoch": 1.12, - "learning_rate": 0.00013141986119219042, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.00022132626342634865, + "loss": 0.0142, "step": 103960 }, { - "epoch": 1.12, - "learning_rate": 0.00013140364532658754, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022131869573333466, + "loss": 0.0153, "step": 103970 }, { - "epoch": 1.12, - "learning_rate": 0.0001313874294609846, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022131112804032064, + "loss": 0.0166, "step": 103980 }, { - "epoch": 1.12, - "learning_rate": 0.00013137121359538172, - "loss": 0.0108, + "epoch": 0.52, + "learning_rate": 0.00022130356034730662, + "loss": 0.0114, "step": 103990 }, { - "epoch": 1.12, - "learning_rate": 0.0001313549977297788, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022129599265429263, + "loss": 0.0178, "step": 104000 }, { - "epoch": 1.12, - "eval_cer": 0.9215208542883797, - "eval_loss": 0.008366812020540237, - "eval_runtime": 121.4656, - "eval_samples_per_second": 16.466, - "eval_steps_per_second": 4.116, + "epoch": 0.52, + "eval_cer": 0.9145071309559275, + "eval_loss": 0.01152227446436882, + "eval_runtime": 116.6853, + "eval_samples_per_second": 17.14, + "eval_steps_per_second": 4.285, "step": 104000 }, { - "epoch": 1.12, - "learning_rate": 0.0001313387818641759, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.0002212884249612786, + "loss": 0.017, "step": 104010 }, { - "epoch": 1.12, - "learning_rate": 0.00013132256599857298, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.0002212808572682646, + "loss": 0.0172, "step": 104020 }, { - "epoch": 1.12, - "learning_rate": 0.0001313063501329701, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.0002212732895752506, + "loss": 0.017, "step": 104030 }, { - "epoch": 1.12, - "learning_rate": 0.0001312901342673672, - "loss": 0.012, + "epoch": 0.52, + "learning_rate": 0.00022126572188223658, + "loss": 0.0133, "step": 104040 }, { - "epoch": 1.12, - "learning_rate": 0.00013127391840176428, - "loss": 0.0161, + "epoch": 0.52, + "learning_rate": 0.00022125815418922256, + "loss": 0.0159, "step": 104050 }, { - "epoch": 1.12, - "learning_rate": 0.00013125770253616137, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022125058649620857, + "loss": 0.0134, "step": 104060 }, { - "epoch": 1.13, - "learning_rate": 0.00013124148667055847, - "loss": 0.0086, + "epoch": 0.53, + "learning_rate": 0.00022124301880319455, + "loss": 0.0152, "step": 104070 }, { - "epoch": 1.13, - "learning_rate": 0.00013122527080495556, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00022123545111018053, + "loss": 0.0161, "step": 104080 }, { - "epoch": 1.13, - "learning_rate": 0.00013120905493935265, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00022122788341716654, + "loss": 0.0185, "step": 104090 }, { - "epoch": 1.13, - "learning_rate": 0.00013119283907374974, - "loss": 0.0121, + "epoch": 0.53, + "learning_rate": 0.00022122031572415252, + "loss": 0.0135, "step": 104100 }, { - "epoch": 1.13, - "learning_rate": 0.00013117662320814684, - "loss": 0.0119, + "epoch": 0.53, + "learning_rate": 0.0002212127480311385, + "loss": 0.0162, "step": 104110 }, { - "epoch": 1.13, - "learning_rate": 0.00013116040734254393, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.0002212051803381245, + "loss": 0.0162, "step": 104120 }, { - "epoch": 1.13, - "learning_rate": 0.00013114419147694102, - "loss": 0.012, + "epoch": 0.53, + "learning_rate": 0.0002211976126451105, + "loss": 0.0143, "step": 104130 }, { - "epoch": 1.13, - "learning_rate": 0.00013112797561133812, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022119004495209648, + "loss": 0.0179, "step": 104140 }, { - "epoch": 1.13, - "learning_rate": 0.0001311117597457352, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00022118247725908246, + "loss": 0.0159, "step": 104150 }, { - "epoch": 1.13, - "learning_rate": 0.0001310955438801323, - "loss": 0.0144, + "epoch": 0.53, + "learning_rate": 0.00022117490956606847, + "loss": 0.0132, "step": 104160 }, { - "epoch": 1.13, - "learning_rate": 0.0001310793280145294, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.00022116734187305445, + "loss": 0.0149, "step": 104170 }, { - "epoch": 1.13, - "learning_rate": 0.00013106311214892649, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022115977418004043, + "loss": 0.0153, "step": 104180 }, { - "epoch": 1.13, - "learning_rate": 0.0001310468962833236, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.00022115220648702644, + "loss": 0.0149, "step": 104190 }, { - "epoch": 1.13, - "learning_rate": 0.00013103068041772067, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.00022114463879401242, + "loss": 0.0133, "step": 104200 }, { - "epoch": 1.13, - "learning_rate": 0.0001310144645521178, - "loss": 0.0079, + "epoch": 0.53, + "learning_rate": 0.0002211370711009984, + "loss": 0.0234, "step": 104210 }, { - "epoch": 1.13, - "learning_rate": 0.00013099824868651486, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.0002211295034079844, + "loss": 0.015, "step": 104220 }, { - "epoch": 1.13, - "learning_rate": 0.00013098203282091198, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.0002211219357149704, + "loss": 0.019, "step": 104230 }, { - "epoch": 1.13, - "learning_rate": 0.00013096581695530904, - "loss": 0.0078, + "epoch": 0.53, + "learning_rate": 0.00022111436802195637, + "loss": 0.0151, "step": 104240 }, { - "epoch": 1.13, - "learning_rate": 0.00013094960108970616, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00022110680032894238, + "loss": 0.0173, "step": 104250 }, { - "epoch": 1.13, - "learning_rate": 0.00013093338522410326, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.00022109923263592836, + "loss": 0.0144, "step": 104260 }, { - "epoch": 1.13, - "learning_rate": 0.00013091716935850035, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022109166494291434, + "loss": 0.0125, "step": 104270 }, { - "epoch": 1.13, - "learning_rate": 0.00013090095349289744, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.00022108409724990033, + "loss": 0.0159, "step": 104280 }, { - "epoch": 1.13, - "learning_rate": 0.00013088473762729453, - "loss": 0.0082, + "epoch": 0.53, + "learning_rate": 0.00022107652955688633, + "loss": 0.0124, "step": 104290 }, { - "epoch": 1.13, - "learning_rate": 0.00013086852176169163, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.00022106896186387232, + "loss": 0.0134, "step": 104300 }, { - "epoch": 1.13, - "learning_rate": 0.00013085230589608872, - "loss": 0.0076, + "epoch": 0.53, + "learning_rate": 0.0002210613941708583, + "loss": 0.0159, "step": 104310 }, { - "epoch": 1.13, - "learning_rate": 0.0001308360900304858, - "loss": 0.0107, + "epoch": 0.53, + "learning_rate": 0.0002210538264778443, + "loss": 0.0167, "step": 104320 }, { - "epoch": 1.13, - "learning_rate": 0.0001308198741648829, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.0002210462587848303, + "loss": 0.0154, "step": 104330 }, { - "epoch": 1.13, - "learning_rate": 0.00013080365829928002, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.00022103869109181627, + "loss": 0.0148, "step": 104340 }, { - "epoch": 1.13, - "learning_rate": 0.0001307874424336771, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00022103112339880228, + "loss": 0.0202, "step": 104350 }, { - "epoch": 1.13, - "learning_rate": 0.0001307712265680742, - "loss": 0.0115, + "epoch": 0.53, + "learning_rate": 0.00022102355570578826, + "loss": 0.0176, "step": 104360 }, { - "epoch": 1.13, - "learning_rate": 0.00013075501070247128, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.00022101598801277424, + "loss": 0.0138, "step": 104370 }, { - "epoch": 1.13, - "learning_rate": 0.0001307387948368684, - "loss": 0.0113, + "epoch": 0.53, + "learning_rate": 0.00022100842031976025, + "loss": 0.0135, "step": 104380 }, { - "epoch": 1.13, - "learning_rate": 0.00013072257897126546, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.00022100085262674623, + "loss": 0.0159, "step": 104390 }, { - "epoch": 1.13, - "learning_rate": 0.00013070636310566258, - "loss": 0.0128, + "epoch": 0.53, + "learning_rate": 0.0002209932849337322, + "loss": 0.0148, "step": 104400 }, { - "epoch": 1.13, - "learning_rate": 0.00013069014724005967, - "loss": 0.008, + "epoch": 0.53, + "learning_rate": 0.00022098571724071822, + "loss": 0.0152, "step": 104410 }, { - "epoch": 1.13, - "learning_rate": 0.00013067393137445677, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.0002209781495477042, + "loss": 0.0187, "step": 104420 }, { - "epoch": 1.13, - "learning_rate": 0.00013065771550885386, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.00022097058185469018, + "loss": 0.0153, "step": 104430 }, { - "epoch": 1.13, - "learning_rate": 0.00013064149964325095, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.0002209630141616762, + "loss": 0.0169, "step": 104440 }, { - "epoch": 1.13, - "learning_rate": 0.00013062528377764804, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022095544646866217, + "loss": 0.0155, "step": 104450 }, { - "epoch": 1.13, - "learning_rate": 0.00013060906791204514, - "loss": 0.0107, + "epoch": 0.53, + "learning_rate": 0.00022094787877564815, + "loss": 0.0154, "step": 104460 }, { - "epoch": 1.13, - "learning_rate": 0.00013059285204644223, - "loss": 0.0121, + "epoch": 0.53, + "learning_rate": 0.00022094031108263414, + "loss": 0.0214, "step": 104470 }, { - "epoch": 1.13, - "learning_rate": 0.00013057663618083932, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00022093274338962014, + "loss": 0.0166, "step": 104480 }, { - "epoch": 1.13, - "learning_rate": 0.00013056042031523642, - "loss": 0.0132, + "epoch": 0.53, + "learning_rate": 0.00022092517569660613, + "loss": 0.0166, "step": 104490 }, { - "epoch": 1.13, - "learning_rate": 0.0001305442044496335, - "loss": 0.0114, + "epoch": 0.53, + "learning_rate": 0.0002209176080035921, + "loss": 0.0129, "step": 104500 }, { - "epoch": 1.13, - "learning_rate": 0.0001305279885840306, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.00022091004031057812, + "loss": 0.0147, "step": 104510 }, { - "epoch": 1.13, - "learning_rate": 0.0001305117727184277, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.0002209024726175641, + "loss": 0.0187, "step": 104520 }, { - "epoch": 1.13, - "learning_rate": 0.0001304955568528248, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00022089490492455008, + "loss": 0.0137, "step": 104530 }, { - "epoch": 1.13, - "learning_rate": 0.00013047934098722188, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.0002208873372315361, + "loss": 0.0161, "step": 104540 }, { - "epoch": 1.13, - "learning_rate": 0.00013046312512161897, - "loss": 0.0129, + "epoch": 0.53, + "learning_rate": 0.00022087976953852207, + "loss": 0.0167, "step": 104550 }, { - "epoch": 1.13, - "learning_rate": 0.0001304469092560161, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.00022087220184550805, + "loss": 0.0148, "step": 104560 }, { - "epoch": 1.13, - "learning_rate": 0.00013043069339041316, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.00022086463415249406, + "loss": 0.0161, "step": 104570 }, { - "epoch": 1.13, - "learning_rate": 0.00013041447752481028, - "loss": 0.0114, + "epoch": 0.53, + "learning_rate": 0.00022085706645948004, + "loss": 0.0145, "step": 104580 }, { - "epoch": 1.13, - "learning_rate": 0.00013039826165920734, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00022084949876646602, + "loss": 0.0169, "step": 104590 }, { - "epoch": 1.13, - "learning_rate": 0.00013038204579360446, - "loss": 0.0125, + "epoch": 0.53, + "learning_rate": 0.00022084193107345203, + "loss": 0.0157, "step": 104600 }, { - "epoch": 1.13, - "learning_rate": 0.00013036582992800153, - "loss": 0.0105, + "epoch": 0.53, + "learning_rate": 0.000220834363380438, + "loss": 0.015, "step": 104610 }, { - "epoch": 1.13, - "learning_rate": 0.00013034961406239865, - "loss": 0.0135, + "epoch": 0.53, + "learning_rate": 0.000220826795687424, + "loss": 0.0147, "step": 104620 }, { - "epoch": 1.13, - "learning_rate": 0.00013033339819679574, - "loss": 0.0107, + "epoch": 0.53, + "learning_rate": 0.00022081922799440997, + "loss": 0.0168, "step": 104630 }, { - "epoch": 1.13, - "learning_rate": 0.00013031718233119283, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022081166030139598, + "loss": 0.0171, "step": 104640 }, { - "epoch": 1.13, - "learning_rate": 0.00013030096646558993, - "loss": 0.0124, + "epoch": 0.53, + "learning_rate": 0.00022080409260838196, + "loss": 0.0161, "step": 104650 }, { - "epoch": 1.13, - "learning_rate": 0.00013028475059998702, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00022079652491536795, + "loss": 0.0175, "step": 104660 }, { - "epoch": 1.13, - "learning_rate": 0.0001302685347343841, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.00022078895722235395, + "loss": 0.0151, "step": 104670 }, { - "epoch": 1.13, - "learning_rate": 0.0001302523188687812, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00022078138952933994, + "loss": 0.0162, "step": 104680 }, { - "epoch": 1.13, - "learning_rate": 0.0001302361030031783, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022077382183632592, + "loss": 0.0147, "step": 104690 }, { - "epoch": 1.13, - "learning_rate": 0.0001302198871375754, - "loss": 0.0099, + "epoch": 0.53, + "learning_rate": 0.00022076625414331193, + "loss": 0.0147, "step": 104700 }, { - "epoch": 1.13, - "learning_rate": 0.00013020367127197248, - "loss": 0.012, + "epoch": 0.53, + "learning_rate": 0.0002207586864502979, + "loss": 0.0165, "step": 104710 }, { - "epoch": 1.13, - "learning_rate": 0.00013018745540636958, - "loss": 0.0083, + "epoch": 0.53, + "learning_rate": 0.0002207511187572839, + "loss": 0.0146, "step": 104720 }, { - "epoch": 1.13, - "learning_rate": 0.00013017123954076667, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.0002207435510642699, + "loss": 0.019, "step": 104730 }, { - "epoch": 1.13, - "learning_rate": 0.00013015502367516376, - "loss": 0.0143, + "epoch": 0.53, + "learning_rate": 0.00022073598337125588, + "loss": 0.0171, "step": 104740 }, { - "epoch": 1.13, - "learning_rate": 0.00013013880780956085, - "loss": 0.0118, + "epoch": 0.53, + "learning_rate": 0.00022072841567824186, + "loss": 0.0163, "step": 104750 }, { - "epoch": 1.13, - "learning_rate": 0.00013012259194395795, - "loss": 0.012, + "epoch": 0.53, + "learning_rate": 0.00022072084798522787, + "loss": 0.0176, "step": 104760 }, { - "epoch": 1.13, - "learning_rate": 0.00013010637607835504, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022071328029221385, + "loss": 0.012, "step": 104770 }, { - "epoch": 1.13, - "learning_rate": 0.00013009016021275216, + "epoch": 0.53, + "learning_rate": 0.00022070571259919983, "loss": 0.013, "step": 104780 }, { - "epoch": 1.13, - "learning_rate": 0.00013007394434714923, - "loss": 0.0131, + "epoch": 0.53, + "learning_rate": 0.0002206981449061858, + "loss": 0.0134, "step": 104790 }, { - "epoch": 1.13, - "learning_rate": 0.00013005772848154634, - "loss": 0.0115, + "epoch": 0.53, + "learning_rate": 0.00022069057721317182, + "loss": 0.0151, "step": 104800 }, { - "epoch": 1.13, - "learning_rate": 0.0001300415126159434, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.0002206830095201578, + "loss": 0.0211, "step": 104810 }, { - "epoch": 1.13, - "learning_rate": 0.00013002529675034053, - "loss": 0.012, + "epoch": 0.53, + "learning_rate": 0.00022067544182714378, + "loss": 0.0153, "step": 104820 }, { - "epoch": 1.13, - "learning_rate": 0.00013000908088473762, - "loss": 0.012, + "epoch": 0.53, + "learning_rate": 0.0002206678741341298, + "loss": 0.0186, "step": 104830 }, { - "epoch": 1.13, - "learning_rate": 0.00012999286501913472, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022066030644111577, + "loss": 0.0161, "step": 104840 }, { - "epoch": 1.13, - "learning_rate": 0.0001299766491535318, - "loss": 0.0133, + "epoch": 0.53, + "learning_rate": 0.00022065273874810176, + "loss": 0.0184, "step": 104850 }, { - "epoch": 1.13, - "learning_rate": 0.0001299604332879289, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.00022064517105508776, + "loss": 0.0146, "step": 104860 }, { - "epoch": 1.13, - "learning_rate": 0.000129944217422326, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.00022063760336207375, + "loss": 0.0152, "step": 104870 }, { - "epoch": 1.13, - "learning_rate": 0.0001299280015567231, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022063003566905973, + "loss": 0.0127, "step": 104880 }, { - "epoch": 1.13, - "learning_rate": 0.00012991178569112018, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022062246797604574, + "loss": 0.0163, "step": 104890 }, { - "epoch": 1.13, - "learning_rate": 0.00012989556982551727, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022061490028303172, + "loss": 0.015, "step": 104900 }, { - "epoch": 1.13, - "learning_rate": 0.00012987935395991437, - "loss": 0.0114, + "epoch": 0.53, + "learning_rate": 0.0002206073325900177, + "loss": 0.0136, "step": 104910 }, { - "epoch": 1.13, - "learning_rate": 0.00012986313809431146, - "loss": 0.0099, + "epoch": 0.53, + "learning_rate": 0.0002205997648970037, + "loss": 0.0136, "step": 104920 }, { - "epoch": 1.13, - "learning_rate": 0.00012984692222870855, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.0002205921972039897, + "loss": 0.0199, "step": 104930 }, { - "epoch": 1.13, - "learning_rate": 0.00012983070636310564, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00022058462951097567, + "loss": 0.0151, "step": 104940 }, { - "epoch": 1.13, - "learning_rate": 0.00012981449049750274, - "loss": 0.0078, + "epoch": 0.53, + "learning_rate": 0.00022057706181796165, + "loss": 0.0161, "step": 104950 }, { - "epoch": 1.13, - "learning_rate": 0.00012979827463189983, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022056949412494763, + "loss": 0.0142, "step": 104960 }, { - "epoch": 1.13, - "learning_rate": 0.00012978205876629692, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00022056192643193361, + "loss": 0.013, "step": 104970 }, { - "epoch": 1.13, - "learning_rate": 0.00012976584290069404, - "loss": 0.0119, + "epoch": 0.53, + "learning_rate": 0.0002205543587389196, + "loss": 0.0197, "step": 104980 }, { - "epoch": 1.13, - "learning_rate": 0.0001297496270350911, - "loss": 0.0115, + "epoch": 0.53, + "learning_rate": 0.0002205467910459056, + "loss": 0.0173, "step": 104990 }, { - "epoch": 1.14, - "learning_rate": 0.00012973341116948823, - "loss": 0.0076, + "epoch": 0.53, + "learning_rate": 0.00022053922335289159, + "loss": 0.018, "step": 105000 }, { - "epoch": 1.14, - "eval_cer": 0.9215278031120306, - "eval_loss": 0.008072057738900185, - "eval_runtime": 121.1811, - "eval_samples_per_second": 16.504, - "eval_steps_per_second": 4.126, + "epoch": 0.53, + "eval_cer": 0.9144848118450433, + "eval_loss": 0.011399283073842525, + "eval_runtime": 116.6482, + "eval_samples_per_second": 17.146, + "eval_steps_per_second": 4.286, "step": 105000 }, { - "epoch": 1.14, - "learning_rate": 0.0001297171953038853, - "loss": 0.0099, + "epoch": 0.53, + "learning_rate": 0.00022053165565987757, + "loss": 0.0184, "step": 105010 }, { - "epoch": 1.14, - "learning_rate": 0.0001297009794382824, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00022052408796686355, + "loss": 0.0154, "step": 105020 }, { - "epoch": 1.14, - "learning_rate": 0.0001296847635726795, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.00022051652027384956, + "loss": 0.015, "step": 105030 }, { - "epoch": 1.14, - "learning_rate": 0.0001296685477070766, - "loss": 0.0082, + "epoch": 0.53, + "learning_rate": 0.00022050895258083554, + "loss": 0.0146, "step": 105040 }, { - "epoch": 1.14, - "learning_rate": 0.0001296523318414737, - "loss": 0.013, + "epoch": 0.53, + "learning_rate": 0.00022050138488782152, + "loss": 0.016, "step": 105050 }, { - "epoch": 1.14, - "learning_rate": 0.00012963611597587078, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.00022049381719480753, + "loss": 0.0169, "step": 105060 }, { - "epoch": 1.14, - "learning_rate": 0.00012961990011026788, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.0002204862495017935, + "loss": 0.0165, "step": 105070 }, { - "epoch": 1.14, - "learning_rate": 0.00012960368424466497, - "loss": 0.0113, + "epoch": 0.53, + "learning_rate": 0.0002204786818087795, + "loss": 0.0157, "step": 105080 }, { - "epoch": 1.14, - "learning_rate": 0.00012958746837906206, - "loss": 0.0119, + "epoch": 0.53, + "learning_rate": 0.0002204711141157655, + "loss": 0.0145, "step": 105090 }, { - "epoch": 1.14, - "learning_rate": 0.00012957125251345915, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00022046354642275148, + "loss": 0.0233, "step": 105100 }, { - "epoch": 1.14, - "learning_rate": 0.00012955503664785625, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00022045597872973746, + "loss": 0.0156, "step": 105110 }, { - "epoch": 1.14, - "learning_rate": 0.00012953882078225334, - "loss": 0.0122, + "epoch": 0.53, + "learning_rate": 0.00022044841103672347, + "loss": 0.0163, "step": 105120 }, { - "epoch": 1.14, - "learning_rate": 0.00012952260491665046, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00022044084334370945, + "loss": 0.0163, "step": 105130 }, { - "epoch": 1.14, - "learning_rate": 0.00012950638905104753, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00022043327565069543, + "loss": 0.0185, "step": 105140 }, { - "epoch": 1.14, - "learning_rate": 0.00012949017318544465, - "loss": 0.0083, + "epoch": 0.53, + "learning_rate": 0.00022042570795768144, + "loss": 0.0161, "step": 105150 }, { - "epoch": 1.14, - "learning_rate": 0.0001294739573198417, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022041814026466742, + "loss": 0.0168, "step": 105160 }, { - "epoch": 1.14, - "learning_rate": 0.00012945774145423883, - "loss": 0.0116, + "epoch": 0.53, + "learning_rate": 0.0002204105725716534, + "loss": 0.0132, "step": 105170 }, { - "epoch": 1.14, - "learning_rate": 0.0001294415255886359, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.0002204030048786394, + "loss": 0.0138, "step": 105180 }, { - "epoch": 1.14, - "learning_rate": 0.00012942530972303302, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.0002203954371856254, + "loss": 0.016, "step": 105190 }, { - "epoch": 1.14, - "learning_rate": 0.0001294090938574301, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00022038786949261138, + "loss": 0.0129, "step": 105200 }, { - "epoch": 1.14, - "learning_rate": 0.0001293928779918272, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.00022038030179959736, + "loss": 0.018, "step": 105210 }, { - "epoch": 1.14, - "learning_rate": 0.0001293766621262243, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00022037273410658337, + "loss": 0.0156, "step": 105220 }, { - "epoch": 1.14, - "learning_rate": 0.0001293604462606214, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022036516641356935, + "loss": 0.0149, "step": 105230 }, { - "epoch": 1.14, - "learning_rate": 0.00012934423039501848, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022035759872055533, + "loss": 0.0129, "step": 105240 }, { - "epoch": 1.14, - "learning_rate": 0.00012932801452941557, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.00022035003102754134, + "loss": 0.0138, "step": 105250 }, { - "epoch": 1.14, - "learning_rate": 0.00012931179866381267, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.00022034246333452732, + "loss": 0.0151, "step": 105260 }, { - "epoch": 1.14, - "learning_rate": 0.00012929558279820976, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.0002203348956415133, + "loss": 0.0154, "step": 105270 }, { - "epoch": 1.14, - "learning_rate": 0.00012927936693260685, - "loss": 0.0081, + "epoch": 0.53, + "learning_rate": 0.0002203273279484993, + "loss": 0.0162, "step": 105280 }, { - "epoch": 1.14, - "learning_rate": 0.00012926315106700394, - "loss": 0.0105, + "epoch": 0.53, + "learning_rate": 0.0002203197602554853, + "loss": 0.0158, "step": 105290 }, { - "epoch": 1.14, - "learning_rate": 0.00012924693520140104, - "loss": 0.0118, + "epoch": 0.53, + "learning_rate": 0.00022031219256247127, + "loss": 0.0155, "step": 105300 }, { - "epoch": 1.14, - "learning_rate": 0.00012923071933579813, - "loss": 0.0079, + "epoch": 0.53, + "learning_rate": 0.00022030462486945728, + "loss": 0.0169, "step": 105310 }, { - "epoch": 1.14, - "learning_rate": 0.00012921450347019522, - "loss": 0.0124, + "epoch": 0.53, + "learning_rate": 0.00022029705717644326, + "loss": 0.0149, "step": 105320 }, { - "epoch": 1.14, - "learning_rate": 0.00012919828760459231, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.00022028948948342924, + "loss": 0.017, "step": 105330 }, { - "epoch": 1.14, - "learning_rate": 0.0001291820717389894, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022028192179041525, + "loss": 0.016, "step": 105340 }, { - "epoch": 1.14, - "learning_rate": 0.00012916585587338653, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00022027435409740123, + "loss": 0.0195, "step": 105350 }, { - "epoch": 1.14, - "learning_rate": 0.0001291496400077836, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.00022026678640438722, + "loss": 0.0163, "step": 105360 }, { - "epoch": 1.14, - "learning_rate": 0.0001291334241421807, - "loss": 0.0113, + "epoch": 0.53, + "learning_rate": 0.0002202592187113732, + "loss": 0.0194, "step": 105370 }, { - "epoch": 1.14, - "learning_rate": 0.00012911720827657778, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.0002202516510183592, + "loss": 0.0134, "step": 105380 }, { - "epoch": 1.14, - "learning_rate": 0.0001291009924109749, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.0002202440833253452, + "loss": 0.0166, "step": 105390 }, { - "epoch": 1.14, - "learning_rate": 0.00012908477654537196, - "loss": 0.0115, + "epoch": 0.53, + "learning_rate": 0.00022023651563233117, + "loss": 0.0136, "step": 105400 }, { - "epoch": 1.14, - "learning_rate": 0.00012906856067976908, - "loss": 0.0129, + "epoch": 0.53, + "learning_rate": 0.00022022894793931718, + "loss": 0.0141, "step": 105410 }, { - "epoch": 1.14, - "learning_rate": 0.00012905234481416618, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00022022138024630316, + "loss": 0.0151, "step": 105420 }, { - "epoch": 1.14, - "learning_rate": 0.00012903612894856327, - "loss": 0.011, + "epoch": 0.53, + "learning_rate": 0.00022021381255328914, + "loss": 0.0143, "step": 105430 }, { - "epoch": 1.14, - "learning_rate": 0.00012901991308296036, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.00022020624486027515, + "loss": 0.0155, "step": 105440 }, { - "epoch": 1.14, - "learning_rate": 0.00012900369721735745, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00022019867716726113, + "loss": 0.0214, "step": 105450 }, { - "epoch": 1.14, - "learning_rate": 0.00012898748135175455, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.0002201911094742471, + "loss": 0.015, "step": 105460 }, { - "epoch": 1.14, - "learning_rate": 0.00012897126548615164, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00022018354178123312, + "loss": 0.0156, "step": 105470 }, { - "epoch": 1.14, - "learning_rate": 0.00012895504962054873, - "loss": 0.0084, + "epoch": 0.53, + "learning_rate": 0.0002201759740882191, + "loss": 0.0166, "step": 105480 }, { - "epoch": 1.14, - "learning_rate": 0.00012893883375494583, - "loss": 0.0113, + "epoch": 0.53, + "learning_rate": 0.00022016840639520508, + "loss": 0.0133, "step": 105490 }, { - "epoch": 1.14, - "learning_rate": 0.00012892261788934292, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.0002201608387021911, + "loss": 0.0131, "step": 105500 }, { - "epoch": 1.14, - "learning_rate": 0.00012890640202374, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00022015327100917707, + "loss": 0.0165, "step": 105510 }, { - "epoch": 1.14, - "learning_rate": 0.0001288901861581371, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022014570331616305, + "loss": 0.0157, "step": 105520 }, { - "epoch": 1.14, - "learning_rate": 0.0001288739702925342, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00022013813562314904, + "loss": 0.0125, "step": 105530 }, { - "epoch": 1.14, - "learning_rate": 0.0001288577544269313, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022013056793013504, + "loss": 0.0153, "step": 105540 }, { - "epoch": 1.14, - "learning_rate": 0.00012884153856132838, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.00022012300023712103, + "loss": 0.0188, "step": 105550 }, { - "epoch": 1.14, - "learning_rate": 0.00012882532269572547, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.000220115432544107, + "loss": 0.0133, "step": 105560 }, { - "epoch": 1.14, - "learning_rate": 0.0001288091068301226, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022010786485109302, + "loss": 0.0173, "step": 105570 }, { - "epoch": 1.14, - "learning_rate": 0.00012879289096451966, - "loss": 0.0079, + "epoch": 0.53, + "learning_rate": 0.000220100297158079, + "loss": 0.0149, "step": 105580 }, { - "epoch": 1.14, - "learning_rate": 0.00012877667509891678, - "loss": 0.0076, + "epoch": 0.53, + "learning_rate": 0.00022009272946506498, + "loss": 0.0133, "step": 105590 }, { - "epoch": 1.14, - "learning_rate": 0.00012876045923331385, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.000220085161772051, + "loss": 0.0187, "step": 105600 }, { - "epoch": 1.14, - "learning_rate": 0.00012874424336771097, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022007759407903697, + "loss": 0.0186, "step": 105610 }, { - "epoch": 1.14, - "learning_rate": 0.00012872802750210803, - "loss": 0.0078, + "epoch": 0.53, + "learning_rate": 0.00022007002638602295, + "loss": 0.0146, "step": 105620 }, { - "epoch": 1.14, - "learning_rate": 0.00012871181163650515, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00022006245869300896, + "loss": 0.0139, "step": 105630 }, { - "epoch": 1.14, - "learning_rate": 0.00012869559577090224, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.00022005489099999494, + "loss": 0.0125, "step": 105640 }, { - "epoch": 1.14, - "learning_rate": 0.00012867937990529934, - "loss": 0.0084, + "epoch": 0.53, + "learning_rate": 0.00022004732330698092, + "loss": 0.0139, "step": 105650 }, { - "epoch": 1.14, - "learning_rate": 0.00012866316403969643, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00022003975561396693, + "loss": 0.0158, "step": 105660 }, { - "epoch": 1.14, - "learning_rate": 0.00012864694817409352, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.0002200321879209529, + "loss": 0.0153, "step": 105670 }, { - "epoch": 1.14, - "learning_rate": 0.00012863073230849061, - "loss": 0.0108, + "epoch": 0.53, + "learning_rate": 0.0002200246202279389, + "loss": 0.0165, "step": 105680 }, { - "epoch": 1.14, - "learning_rate": 0.0001286145164428877, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022001705253492487, + "loss": 0.0164, "step": 105690 }, { - "epoch": 1.14, - "learning_rate": 0.0001285983005772848, - "loss": 0.0075, + "epoch": 0.53, + "learning_rate": 0.00022000948484191088, + "loss": 0.0159, "step": 105700 }, { - "epoch": 1.14, - "learning_rate": 0.0001285820847116819, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022000191714889686, + "loss": 0.0166, "step": 105710 }, { - "epoch": 1.14, - "learning_rate": 0.00012856586884607899, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.00021999434945588285, + "loss": 0.0141, "step": 105720 }, { - "epoch": 1.14, - "learning_rate": 0.00012854965298047608, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.00021998678176286885, + "loss": 0.0182, "step": 105730 }, { - "epoch": 1.14, - "learning_rate": 0.0001285334371148732, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00021997921406985484, + "loss": 0.0159, "step": 105740 }, { - "epoch": 1.14, - "learning_rate": 0.00012851722124927026, - "loss": 0.0108, + "epoch": 0.53, + "learning_rate": 0.00021997164637684082, + "loss": 0.0157, "step": 105750 }, { - "epoch": 1.14, - "learning_rate": 0.00012850100538366738, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00021996407868382683, + "loss": 0.0137, "step": 105760 }, { - "epoch": 1.14, - "learning_rate": 0.00012848478951806445, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.0002199565109908128, + "loss": 0.0157, "step": 105770 }, { - "epoch": 1.14, - "learning_rate": 0.00012846857365246157, - "loss": 0.0129, + "epoch": 0.53, + "learning_rate": 0.0002199489432977988, + "loss": 0.0184, "step": 105780 }, { - "epoch": 1.14, - "learning_rate": 0.00012845235778685866, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.0002199413756047848, + "loss": 0.015, "step": 105790 }, { - "epoch": 1.14, - "learning_rate": 0.00012843614192125575, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.00021993380791177078, + "loss": 0.0133, "step": 105800 }, { - "epoch": 1.14, - "learning_rate": 0.00012841992605565285, - "loss": 0.0114, + "epoch": 0.53, + "learning_rate": 0.00021992624021875676, + "loss": 0.021, "step": 105810 }, { - "epoch": 1.14, - "learning_rate": 0.00012840371019004994, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00021991867252574277, + "loss": 0.0119, "step": 105820 }, { - "epoch": 1.14, - "learning_rate": 0.00012838749432444703, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.00021991110483272875, + "loss": 0.013, "step": 105830 }, { - "epoch": 1.14, - "learning_rate": 0.00012837127845884413, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00021990353713971473, + "loss": 0.0163, "step": 105840 }, { - "epoch": 1.14, - "learning_rate": 0.00012835506259324122, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.0002198959694467007, + "loss": 0.0225, "step": 105850 }, { - "epoch": 1.14, - "learning_rate": 0.0001283388467276383, - "loss": 0.0127, + "epoch": 0.53, + "learning_rate": 0.00021988840175368672, + "loss": 0.0149, "step": 105860 }, { - "epoch": 1.14, - "learning_rate": 0.0001283226308620354, - "loss": 0.0123, + "epoch": 0.53, + "learning_rate": 0.0002198808340606727, + "loss": 0.0129, "step": 105870 }, { - "epoch": 1.14, - "learning_rate": 0.0001283064149964325, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00021987326636765868, + "loss": 0.0191, "step": 105880 }, { - "epoch": 1.14, - "learning_rate": 0.0001282901991308296, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.0002198656986746447, + "loss": 0.0123, "step": 105890 }, { - "epoch": 1.14, - "learning_rate": 0.00012827398326522668, - "loss": 0.0119, + "epoch": 0.53, + "learning_rate": 0.00021985813098163067, + "loss": 0.0126, "step": 105900 }, { - "epoch": 1.14, - "learning_rate": 0.00012825776739962377, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00021985056328861666, + "loss": 0.0144, "step": 105910 }, { - "epoch": 1.15, - "learning_rate": 0.00012824155153402087, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00021984299559560266, + "loss": 0.0123, "step": 105920 }, { - "epoch": 1.15, - "learning_rate": 0.00012822533566841796, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00021983542790258865, + "loss": 0.0156, "step": 105930 }, { - "epoch": 1.15, - "learning_rate": 0.00012820911980281508, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00021982786020957463, + "loss": 0.0114, "step": 105940 }, { - "epoch": 1.15, - "learning_rate": 0.00012819290393721215, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00021982029251656064, + "loss": 0.015, "step": 105950 }, { - "epoch": 1.15, - "learning_rate": 0.00012817668807160927, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00021981272482354662, + "loss": 0.0171, "step": 105960 }, { - "epoch": 1.15, - "learning_rate": 0.00012816047220600633, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.0002198051571305326, + "loss": 0.0175, "step": 105970 }, { - "epoch": 1.15, - "learning_rate": 0.00012814425634040345, - "loss": 0.0081, + "epoch": 0.53, + "learning_rate": 0.0002197975894375186, + "loss": 0.0168, "step": 105980 }, { - "epoch": 1.15, - "learning_rate": 0.00012812804047480054, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.0002197900217445046, + "loss": 0.0145, "step": 105990 }, { - "epoch": 1.15, - "learning_rate": 0.00012811182460919764, - "loss": 0.0119, + "epoch": 0.53, + "learning_rate": 0.00021978245405149057, + "loss": 0.02, "step": 106000 }, { - "epoch": 1.15, - "eval_cer": 0.9215512553918529, - "eval_loss": 0.00793379731476307, - "eval_runtime": 121.3321, - "eval_samples_per_second": 16.484, - "eval_steps_per_second": 4.121, + "epoch": 0.53, + "eval_cer": 0.9144886934295449, + "eval_loss": 0.01085778046399355, + "eval_runtime": 116.7271, + "eval_samples_per_second": 17.134, + "eval_steps_per_second": 4.283, "step": 106000 }, { - "epoch": 1.15, - "learning_rate": 0.00012809560874359473, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00021977488635847658, + "loss": 0.0155, "step": 106010 }, { - "epoch": 1.15, - "learning_rate": 0.00012807939287799182, - "loss": 0.0118, + "epoch": 0.53, + "learning_rate": 0.00021976731866546256, + "loss": 0.0119, "step": 106020 }, { - "epoch": 1.15, - "learning_rate": 0.00012806317701238892, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.00021975975097244854, + "loss": 0.0178, "step": 106030 }, { - "epoch": 1.15, - "learning_rate": 0.000128046961146786, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00021975218327943452, + "loss": 0.0181, "step": 106040 }, { - "epoch": 1.15, - "learning_rate": 0.0001280307452811831, - "loss": 0.0129, + "epoch": 0.54, + "learning_rate": 0.00021974461558642053, + "loss": 0.0155, "step": 106050 }, { - "epoch": 1.15, - "learning_rate": 0.0001280145294155802, - "loss": 0.0096, + "epoch": 0.54, + "learning_rate": 0.0002197370478934065, + "loss": 0.0122, "step": 106060 }, { - "epoch": 1.15, - "learning_rate": 0.00012799831354997729, - "loss": 0.012, + "epoch": 0.54, + "learning_rate": 0.0002197294802003925, + "loss": 0.0148, "step": 106070 }, { - "epoch": 1.15, - "learning_rate": 0.00012798209768437438, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.0002197219125073785, + "loss": 0.0172, "step": 106080 }, { - "epoch": 1.15, - "learning_rate": 0.00012796588181877147, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.00021971434481436448, + "loss": 0.0152, "step": 106090 }, { - "epoch": 1.15, - "learning_rate": 0.00012794966595316856, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021970677712135047, + "loss": 0.016, "step": 106100 }, { - "epoch": 1.15, - "learning_rate": 0.00012793345008756566, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021969920942833647, + "loss": 0.0164, "step": 106110 }, { - "epoch": 1.15, - "learning_rate": 0.00012791723422196275, - "loss": 0.0079, + "epoch": 0.54, + "learning_rate": 0.00021969164173532246, + "loss": 0.0144, "step": 106120 }, { - "epoch": 1.15, - "learning_rate": 0.00012790101835635984, - "loss": 0.0114, + "epoch": 0.54, + "learning_rate": 0.00021968407404230844, + "loss": 0.0153, "step": 106130 }, { - "epoch": 1.15, - "learning_rate": 0.00012788480249075696, - "loss": 0.0117, + "epoch": 0.54, + "learning_rate": 0.00021967650634929445, + "loss": 0.0152, "step": 106140 }, { - "epoch": 1.15, - "learning_rate": 0.00012786858662515403, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.00021966893865628043, + "loss": 0.0141, "step": 106150 }, { - "epoch": 1.15, - "learning_rate": 0.00012785237075955115, - "loss": 0.0115, + "epoch": 0.54, + "learning_rate": 0.0002196613709632664, + "loss": 0.0137, "step": 106160 }, { - "epoch": 1.15, - "learning_rate": 0.0001278361548939482, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021965380327025242, + "loss": 0.0168, "step": 106170 }, { - "epoch": 1.15, - "learning_rate": 0.00012781993902834533, - "loss": 0.0121, + "epoch": 0.54, + "learning_rate": 0.0002196462355772384, + "loss": 0.0173, "step": 106180 }, { - "epoch": 1.15, - "learning_rate": 0.0001278037231627424, - "loss": 0.0132, + "epoch": 0.54, + "learning_rate": 0.00021963866788422438, + "loss": 0.0178, "step": 106190 }, { - "epoch": 1.15, - "learning_rate": 0.00012778750729713952, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021963110019121036, + "loss": 0.0139, "step": 106200 }, { - "epoch": 1.15, - "learning_rate": 0.0001277712914315366, - "loss": 0.013, + "epoch": 0.54, + "learning_rate": 0.00021962353249819634, + "loss": 0.0164, "step": 106210 }, { - "epoch": 1.15, - "learning_rate": 0.0001277550755659337, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021961596480518232, + "loss": 0.0166, "step": 106220 }, { - "epoch": 1.15, - "learning_rate": 0.0001277388597003308, - "loss": 0.016, + "epoch": 0.54, + "learning_rate": 0.0002196083971121683, + "loss": 0.0137, "step": 106230 }, { - "epoch": 1.15, - "learning_rate": 0.0001277226438347279, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.0002196008294191543, + "loss": 0.0137, "step": 106240 }, { - "epoch": 1.15, - "learning_rate": 0.00012770642796912498, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.0002195932617261403, + "loss": 0.0126, "step": 106250 }, { - "epoch": 1.15, - "learning_rate": 0.00012769021210352208, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021958569403312628, + "loss": 0.019, "step": 106260 }, { - "epoch": 1.15, - "learning_rate": 0.00012767399623791917, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.00021957812634011226, + "loss": 0.012, "step": 106270 }, { - "epoch": 1.15, - "learning_rate": 0.00012765778037231626, - "loss": 0.011, + "epoch": 0.54, + "learning_rate": 0.00021957055864709827, + "loss": 0.0136, "step": 106280 }, { - "epoch": 1.15, - "learning_rate": 0.00012764156450671335, - "loss": 0.0111, + "epoch": 0.54, + "learning_rate": 0.00021956299095408425, + "loss": 0.0131, "step": 106290 }, { - "epoch": 1.15, - "learning_rate": 0.00012762534864111045, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.00021955542326107023, + "loss": 0.0152, "step": 106300 }, { - "epoch": 1.15, - "learning_rate": 0.00012760913277550754, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.00021954785556805624, + "loss": 0.0129, "step": 106310 }, { - "epoch": 1.15, - "learning_rate": 0.00012759291690990463, - "loss": 0.0122, + "epoch": 0.54, + "learning_rate": 0.00021954028787504222, + "loss": 0.012, "step": 106320 }, { - "epoch": 1.15, - "learning_rate": 0.00012757670104430172, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.0002195327201820282, + "loss": 0.0136, "step": 106330 }, { - "epoch": 1.15, - "learning_rate": 0.00012756048517869882, - "loss": 0.011, + "epoch": 0.54, + "learning_rate": 0.0002195251524890142, + "loss": 0.0148, "step": 106340 }, { - "epoch": 1.15, - "learning_rate": 0.0001275442693130959, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.0002195175847960002, + "loss": 0.013, "step": 106350 }, { - "epoch": 1.15, - "learning_rate": 0.00012752805344749303, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021951001710298617, + "loss": 0.015, "step": 106360 }, { - "epoch": 1.15, - "learning_rate": 0.0001275118375818901, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021950244940997218, + "loss": 0.0159, "step": 106370 }, { - "epoch": 1.15, - "learning_rate": 0.00012749562171628722, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021949488171695816, + "loss": 0.0124, "step": 106380 }, { - "epoch": 1.15, - "learning_rate": 0.00012747940585068428, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021948731402394414, + "loss": 0.0131, "step": 106390 }, { - "epoch": 1.15, - "learning_rate": 0.0001274631899850814, - "loss": 0.0085, + "epoch": 0.54, + "learning_rate": 0.00021947974633093015, + "loss": 0.0172, "step": 106400 }, { - "epoch": 1.15, - "learning_rate": 0.00012744697411947847, - "loss": 0.0077, + "epoch": 0.54, + "learning_rate": 0.00021947217863791613, + "loss": 0.0129, "step": 106410 }, { - "epoch": 1.15, - "learning_rate": 0.00012743075825387559, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.00021946461094490212, + "loss": 0.0194, "step": 106420 }, { - "epoch": 1.15, - "learning_rate": 0.00012741454238827268, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.0002194570432518881, + "loss": 0.0149, "step": 106430 }, { - "epoch": 1.15, - "learning_rate": 0.00012739832652266977, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.0002194494755588741, + "loss": 0.0191, "step": 106440 }, { - "epoch": 1.15, - "learning_rate": 0.00012738211065706686, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.0002194419078658601, + "loss": 0.0136, "step": 106450 }, { - "epoch": 1.15, - "learning_rate": 0.00012736589479146396, - "loss": 0.012, + "epoch": 0.54, + "learning_rate": 0.00021943434017284607, + "loss": 0.0142, "step": 106460 }, { - "epoch": 1.15, - "learning_rate": 0.00012734967892586105, - "loss": 0.0118, + "epoch": 0.54, + "learning_rate": 0.00021942677247983208, + "loss": 0.0128, "step": 106470 }, { - "epoch": 1.15, - "learning_rate": 0.00012733346306025814, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.00021941920478681806, + "loss": 0.0176, "step": 106480 }, { - "epoch": 1.15, - "learning_rate": 0.00012731724719465524, - "loss": 0.0117, + "epoch": 0.54, + "learning_rate": 0.00021941163709380404, + "loss": 0.0141, "step": 106490 }, { - "epoch": 1.15, - "learning_rate": 0.00012730103132905233, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021940406940079005, + "loss": 0.0146, "step": 106500 }, { - "epoch": 1.15, - "learning_rate": 0.00012728481546344945, - "loss": 0.0118, + "epoch": 0.54, + "learning_rate": 0.00021939650170777603, + "loss": 0.0145, "step": 106510 }, { - "epoch": 1.15, - "learning_rate": 0.00012726859959784651, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.000219388934014762, + "loss": 0.0151, "step": 106520 }, { - "epoch": 1.15, - "learning_rate": 0.00012725238373224363, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.00021938136632174802, + "loss": 0.0161, "step": 106530 }, { - "epoch": 1.15, - "learning_rate": 0.0001272361678666407, - "loss": 0.0082, + "epoch": 0.54, + "learning_rate": 0.000219373798628734, + "loss": 0.0169, "step": 106540 }, { - "epoch": 1.15, - "learning_rate": 0.00012721995200103782, - "loss": 0.0119, + "epoch": 0.54, + "learning_rate": 0.00021936623093571998, + "loss": 0.0133, "step": 106550 }, { - "epoch": 1.15, - "learning_rate": 0.00012720373613543488, - "loss": 0.0129, + "epoch": 0.54, + "learning_rate": 0.000219358663242706, + "loss": 0.0263, "step": 106560 }, { - "epoch": 1.15, - "learning_rate": 0.000127187520269832, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021935109554969197, + "loss": 0.0191, "step": 106570 }, { - "epoch": 1.15, - "learning_rate": 0.0001271713044042291, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021934352785667795, + "loss": 0.0143, "step": 106580 }, { - "epoch": 1.15, - "learning_rate": 0.0001271550885386262, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021933596016366394, + "loss": 0.0169, "step": 106590 }, { - "epoch": 1.15, - "learning_rate": 0.00012713887267302328, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.00021932839247064994, + "loss": 0.0171, "step": 106600 }, { - "epoch": 1.15, - "learning_rate": 0.00012712265680742038, - "loss": 0.0129, + "epoch": 0.54, + "learning_rate": 0.00021932082477763593, + "loss": 0.0148, "step": 106610 }, { - "epoch": 1.15, - "learning_rate": 0.00012710644094181747, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.0002193132570846219, + "loss": 0.015, "step": 106620 }, { - "epoch": 1.15, - "learning_rate": 0.00012709022507621456, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.00021930568939160792, + "loss": 0.0174, "step": 106630 }, { - "epoch": 1.15, - "learning_rate": 0.00012707400921061165, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.0002192981216985939, + "loss": 0.012, "step": 106640 }, { - "epoch": 1.15, - "learning_rate": 0.00012705779334500875, - "loss": 0.0096, + "epoch": 0.54, + "learning_rate": 0.00021929055400557988, + "loss": 0.0155, "step": 106650 }, { - "epoch": 1.15, - "learning_rate": 0.00012704157747940584, - "loss": 0.0128, + "epoch": 0.54, + "learning_rate": 0.0002192829863125659, + "loss": 0.0144, "step": 106660 }, { - "epoch": 1.15, - "learning_rate": 0.00012702536161380293, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021927541861955187, + "loss": 0.0144, "step": 106670 }, { - "epoch": 1.15, - "learning_rate": 0.00012700914574820002, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021926785092653785, + "loss": 0.0147, "step": 106680 }, { - "epoch": 1.15, - "learning_rate": 0.00012699292988259712, - "loss": 0.0119, + "epoch": 0.54, + "learning_rate": 0.00021926028323352386, + "loss": 0.0172, "step": 106690 }, { - "epoch": 1.15, - "learning_rate": 0.0001269767140169942, - "loss": 0.0113, + "epoch": 0.54, + "learning_rate": 0.00021925271554050984, + "loss": 0.0147, "step": 106700 }, { - "epoch": 1.15, - "learning_rate": 0.0001269604981513913, - "loss": 0.0111, + "epoch": 0.54, + "learning_rate": 0.00021924514784749582, + "loss": 0.0142, "step": 106710 }, { - "epoch": 1.15, - "learning_rate": 0.0001269442822857884, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021923758015448183, + "loss": 0.0154, "step": 106720 }, { - "epoch": 1.15, - "learning_rate": 0.00012692806642018552, - "loss": 0.0143, + "epoch": 0.54, + "learning_rate": 0.0002192300124614678, + "loss": 0.0151, "step": 106730 }, { - "epoch": 1.15, - "learning_rate": 0.00012691185055458258, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.0002192224447684538, + "loss": 0.016, "step": 106740 }, { - "epoch": 1.15, - "learning_rate": 0.0001268956346889797, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021921487707543977, + "loss": 0.0135, "step": 106750 }, { - "epoch": 1.15, - "learning_rate": 0.00012687941882337677, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021920730938242578, + "loss": 0.0155, "step": 106760 }, { - "epoch": 1.15, - "learning_rate": 0.0001268632029577739, - "loss": 0.0124, + "epoch": 0.54, + "learning_rate": 0.00021919974168941176, + "loss": 0.0147, "step": 106770 }, { - "epoch": 1.15, - "learning_rate": 0.00012684698709217095, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021919217399639775, + "loss": 0.0216, "step": 106780 }, { - "epoch": 1.15, - "learning_rate": 0.00012683077122656807, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021918460630338375, + "loss": 0.0156, "step": 106790 }, { - "epoch": 1.15, - "learning_rate": 0.00012681455536096516, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021917703861036974, + "loss": 0.013, "step": 106800 }, { - "epoch": 1.15, - "learning_rate": 0.00012679833949536226, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.00021916947091735572, + "loss": 0.0147, "step": 106810 }, { - "epoch": 1.15, - "learning_rate": 0.00012678212362975935, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021916190322434173, + "loss": 0.0186, "step": 106820 }, { - "epoch": 1.15, - "learning_rate": 0.00012676590776415644, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.0002191543355313277, + "loss": 0.0157, "step": 106830 }, { - "epoch": 1.15, - "learning_rate": 0.00012674969189855354, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.0002191467678383137, + "loss": 0.0157, "step": 106840 }, { - "epoch": 1.16, - "learning_rate": 0.00012673347603295063, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.0002191392001452997, + "loss": 0.0161, "step": 106850 }, { - "epoch": 1.16, - "learning_rate": 0.00012671726016734772, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021913163245228568, + "loss": 0.0137, "step": 106860 }, { - "epoch": 1.16, - "learning_rate": 0.00012670104430174481, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021912406475927166, + "loss": 0.0169, "step": 106870 }, { - "epoch": 1.16, - "learning_rate": 0.0001266848284361419, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021911649706625767, + "loss": 0.0149, "step": 106880 }, { - "epoch": 1.16, - "learning_rate": 0.000126668612570539, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.00021910892937324365, + "loss": 0.019, "step": 106890 }, { - "epoch": 1.16, - "learning_rate": 0.0001266523967049361, - "loss": 0.0132, + "epoch": 0.54, + "learning_rate": 0.00021910136168022963, + "loss": 0.0167, "step": 106900 }, { - "epoch": 1.16, - "learning_rate": 0.00012663618083933318, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021909379398721564, + "loss": 0.0152, "step": 106910 }, { - "epoch": 1.16, - "learning_rate": 0.00012661996497373028, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.00021908622629420162, + "loss": 0.0167, "step": 106920 }, { - "epoch": 1.16, - "learning_rate": 0.00012660374910812737, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.0002190786586011876, + "loss": 0.0173, "step": 106930 }, { - "epoch": 1.16, - "learning_rate": 0.00012658753324252446, - "loss": 0.0128, + "epoch": 0.54, + "learning_rate": 0.00021907109090817358, + "loss": 0.011, "step": 106940 }, { - "epoch": 1.16, - "learning_rate": 0.00012657131737692158, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.0002190635232151596, + "loss": 0.0153, "step": 106950 }, { - "epoch": 1.16, - "learning_rate": 0.00012655510151131865, - "loss": 0.0126, + "epoch": 0.54, + "learning_rate": 0.00021905595552214557, + "loss": 0.0154, "step": 106960 }, { - "epoch": 1.16, - "learning_rate": 0.00012653888564571577, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021904838782913156, + "loss": 0.0152, "step": 106970 }, { - "epoch": 1.16, - "learning_rate": 0.00012652266978011283, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021904082013611756, + "loss": 0.0168, "step": 106980 }, { - "epoch": 1.16, - "learning_rate": 0.00012650645391450995, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.00021903325244310355, + "loss": 0.0132, "step": 106990 }, { - "epoch": 1.16, - "learning_rate": 0.00012649023804890705, - "loss": 0.0079, + "epoch": 0.54, + "learning_rate": 0.00021902568475008953, + "loss": 0.0152, "step": 107000 }, { - "epoch": 1.16, - "eval_cer": 0.9215686274509803, - "eval_loss": 0.008123186416924, - "eval_runtime": 121.1965, - "eval_samples_per_second": 16.502, - "eval_steps_per_second": 4.126, + "epoch": 0.54, + "eval_cer": 0.9144886934295449, + "eval_loss": 0.010931231081485748, + "eval_runtime": 116.6714, + "eval_samples_per_second": 17.142, + "eval_steps_per_second": 4.286, "step": 107000 }, { - "epoch": 1.16, - "learning_rate": 0.00012647402218330414, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021901811705707554, + "loss": 0.0139, "step": 107010 }, { - "epoch": 1.16, - "learning_rate": 0.00012645780631770123, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021901054936406152, + "loss": 0.0144, "step": 107020 }, { - "epoch": 1.16, - "learning_rate": 0.00012644159045209832, - "loss": 0.0107, + "epoch": 0.54, + "learning_rate": 0.0002190029816710475, + "loss": 0.0108, "step": 107030 }, { - "epoch": 1.16, - "learning_rate": 0.00012642537458649542, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.0002189954139780335, + "loss": 0.0194, "step": 107040 }, { - "epoch": 1.16, - "learning_rate": 0.0001264091587208925, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.0002189878462850195, + "loss": 0.0142, "step": 107050 }, { - "epoch": 1.16, - "learning_rate": 0.0001263929428552896, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.00021898027859200547, + "loss": 0.0164, "step": 107060 }, { - "epoch": 1.16, - "learning_rate": 0.0001263767269896867, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.00021897271089899148, + "loss": 0.0135, "step": 107070 }, { - "epoch": 1.16, - "learning_rate": 0.0001263605111240838, - "loss": 0.0116, + "epoch": 0.54, + "learning_rate": 0.00021896514320597746, + "loss": 0.016, "step": 107080 }, { - "epoch": 1.16, - "learning_rate": 0.00012634429525848088, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021895757551296344, + "loss": 0.0143, "step": 107090 }, { - "epoch": 1.16, - "learning_rate": 0.00012632807939287797, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.00021895000781994942, + "loss": 0.0282, "step": 107100 }, { - "epoch": 1.16, - "learning_rate": 0.00012631186352727507, - "loss": 0.0119, + "epoch": 0.54, + "learning_rate": 0.00021894244012693543, + "loss": 0.0153, "step": 107110 }, { - "epoch": 1.16, - "learning_rate": 0.00012629564766167216, - "loss": 0.0125, + "epoch": 0.54, + "learning_rate": 0.0002189348724339214, + "loss": 0.0144, "step": 107120 }, { - "epoch": 1.16, - "learning_rate": 0.00012627943179606925, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.0002189273047409074, + "loss": 0.0135, "step": 107130 }, { - "epoch": 1.16, - "learning_rate": 0.00012626321593046635, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.0002189197370478934, + "loss": 0.0165, "step": 107140 }, { - "epoch": 1.16, - "learning_rate": 0.00012624700006486346, - "loss": 0.0117, + "epoch": 0.54, + "learning_rate": 0.00021891216935487938, + "loss": 0.0173, "step": 107150 }, { - "epoch": 1.16, - "learning_rate": 0.00012623078419926053, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021890460166186537, + "loss": 0.0209, "step": 107160 }, { - "epoch": 1.16, - "learning_rate": 0.00012621456833365765, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.00021889703396885137, + "loss": 0.0149, "step": 107170 }, { - "epoch": 1.16, - "learning_rate": 0.00012619835246805474, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021888946627583736, + "loss": 0.0118, "step": 107180 }, { - "epoch": 1.16, - "learning_rate": 0.00012618213660245184, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021888189858282334, + "loss": 0.017, "step": 107190 }, { - "epoch": 1.16, - "learning_rate": 0.00012616592073684893, - "loss": 0.0114, + "epoch": 0.54, + "learning_rate": 0.00021887433088980935, + "loss": 0.0166, "step": 107200 }, { - "epoch": 1.16, - "learning_rate": 0.00012614970487124602, - "loss": 0.0128, + "epoch": 0.54, + "learning_rate": 0.00021886676319679533, + "loss": 0.0153, "step": 107210 }, { - "epoch": 1.16, - "learning_rate": 0.00012613348900564311, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.0002188591955037813, + "loss": 0.0159, "step": 107220 }, { - "epoch": 1.16, - "learning_rate": 0.0001261172731400402, - "loss": 0.0096, + "epoch": 0.54, + "learning_rate": 0.00021885162781076732, + "loss": 0.0161, "step": 107230 }, { - "epoch": 1.16, - "learning_rate": 0.0001261010572744373, - "loss": 0.012, + "epoch": 0.54, + "learning_rate": 0.0002188440601177533, + "loss": 0.0136, "step": 107240 }, { - "epoch": 1.16, - "learning_rate": 0.0001260848414088344, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.00021883649242473928, + "loss": 0.0146, "step": 107250 }, { - "epoch": 1.16, - "learning_rate": 0.00012606862554323149, - "loss": 0.0076, + "epoch": 0.54, + "learning_rate": 0.00021882892473172526, + "loss": 0.0155, "step": 107260 }, { - "epoch": 1.16, - "learning_rate": 0.00012605240967762858, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021882135703871127, + "loss": 0.013, "step": 107270 }, { - "epoch": 1.16, - "learning_rate": 0.00012603619381202567, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021881378934569725, + "loss": 0.0149, "step": 107280 }, { - "epoch": 1.16, - "learning_rate": 0.00012601997794642276, - "loss": 0.0076, + "epoch": 0.54, + "learning_rate": 0.00021880622165268323, + "loss": 0.0144, "step": 107290 }, { - "epoch": 1.16, - "learning_rate": 0.00012600376208081988, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.00021879865395966924, + "loss": 0.0143, "step": 107300 }, { - "epoch": 1.16, - "learning_rate": 0.00012598754621521695, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.00021879108626665522, + "loss": 0.0117, "step": 107310 }, { - "epoch": 1.16, - "learning_rate": 0.00012597133034961407, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.0002187835185736412, + "loss": 0.0171, "step": 107320 }, { - "epoch": 1.16, - "learning_rate": 0.00012595511448401113, - "loss": 0.0107, + "epoch": 0.54, + "learning_rate": 0.0002187759508806272, + "loss": 0.0158, "step": 107330 }, { - "epoch": 1.16, - "learning_rate": 0.00012593889861840825, - "loss": 0.0096, + "epoch": 0.54, + "learning_rate": 0.0002187683831876132, + "loss": 0.0203, "step": 107340 }, { - "epoch": 1.16, - "learning_rate": 0.00012592268275280532, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021876081549459918, + "loss": 0.014, "step": 107350 }, { - "epoch": 1.16, - "learning_rate": 0.00012590646688720244, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.00021875324780158518, + "loss": 0.0154, "step": 107360 }, { - "epoch": 1.16, - "learning_rate": 0.00012589025102159953, - "loss": 0.0118, + "epoch": 0.54, + "learning_rate": 0.00021874568010857117, + "loss": 0.0205, "step": 107370 }, { - "epoch": 1.16, - "learning_rate": 0.00012587403515599663, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021873811241555715, + "loss": 0.0145, "step": 107380 }, { - "epoch": 1.16, - "learning_rate": 0.00012585781929039372, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.00021873054472254316, + "loss": 0.0134, "step": 107390 }, { - "epoch": 1.16, - "learning_rate": 0.0001258416034247908, - "loss": 0.0113, + "epoch": 0.54, + "learning_rate": 0.00021872297702952914, + "loss": 0.0152, "step": 107400 }, { - "epoch": 1.16, - "learning_rate": 0.0001258253875591879, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.00021871540933651512, + "loss": 0.0144, "step": 107410 }, { - "epoch": 1.16, - "learning_rate": 0.000125809171693585, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.00021870784164350113, + "loss": 0.0147, "step": 107420 }, { - "epoch": 1.16, - "learning_rate": 0.0001257929558279821, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.0002187002739504871, + "loss": 0.0152, "step": 107430 }, { - "epoch": 1.16, - "learning_rate": 0.00012577673996237918, - "loss": 0.0111, + "epoch": 0.54, + "learning_rate": 0.0002186927062574731, + "loss": 0.0188, "step": 107440 }, { - "epoch": 1.16, - "learning_rate": 0.00012576052409677627, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.00021868513856445907, + "loss": 0.0185, "step": 107450 }, { - "epoch": 1.16, - "learning_rate": 0.00012574430823117337, - "loss": 0.0124, + "epoch": 0.54, + "learning_rate": 0.00021867757087144508, + "loss": 0.0164, "step": 107460 }, { - "epoch": 1.16, - "learning_rate": 0.00012572809236557046, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021867000317843103, + "loss": 0.0124, "step": 107470 }, { - "epoch": 1.16, - "learning_rate": 0.00012571187649996755, - "loss": 0.008, + "epoch": 0.54, + "learning_rate": 0.00021866243548541702, + "loss": 0.0153, "step": 107480 }, { - "epoch": 1.16, - "learning_rate": 0.00012569566063436465, - "loss": 0.0073, + "epoch": 0.54, + "learning_rate": 0.000218654867792403, + "loss": 0.0181, "step": 107490 }, { - "epoch": 1.16, - "learning_rate": 0.00012567944476876174, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.000218647300099389, + "loss": 0.016, "step": 107500 }, { - "epoch": 1.16, - "learning_rate": 0.00012566322890315883, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.000218639732406375, + "loss": 0.0168, "step": 107510 }, { - "epoch": 1.16, - "learning_rate": 0.00012564701303755595, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021863216471336097, + "loss": 0.0162, "step": 107520 }, { - "epoch": 1.16, - "learning_rate": 0.00012563079717195302, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021862459702034698, + "loss": 0.0138, "step": 107530 }, { - "epoch": 1.16, - "learning_rate": 0.00012561458130635014, - "loss": 0.0114, + "epoch": 0.54, + "learning_rate": 0.00021861702932733296, + "loss": 0.0174, "step": 107540 }, { - "epoch": 1.16, - "learning_rate": 0.0001255983654407472, - "loss": 0.0121, + "epoch": 0.54, + "learning_rate": 0.00021860946163431894, + "loss": 0.0166, "step": 107550 }, { - "epoch": 1.16, - "learning_rate": 0.00012558214957514432, - "loss": 0.0114, + "epoch": 0.54, + "learning_rate": 0.00021860189394130495, + "loss": 0.0149, "step": 107560 }, { - "epoch": 1.16, - "learning_rate": 0.0001255659337095414, - "loss": 0.0111, + "epoch": 0.54, + "learning_rate": 0.00021859432624829093, + "loss": 0.0163, "step": 107570 }, { - "epoch": 1.16, - "learning_rate": 0.0001255497178439385, - "loss": 0.0115, + "epoch": 0.54, + "learning_rate": 0.0002185867585552769, + "loss": 0.0165, "step": 107580 }, { - "epoch": 1.16, - "learning_rate": 0.0001255335019783356, - "loss": 0.0133, + "epoch": 0.54, + "learning_rate": 0.00021857919086226292, + "loss": 0.0174, "step": 107590 }, { - "epoch": 1.16, - "learning_rate": 0.0001255172861127327, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.0002185716231692489, + "loss": 0.0131, "step": 107600 }, { - "epoch": 1.16, - "learning_rate": 0.00012550107024712979, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.00021856405547623488, + "loss": 0.0154, "step": 107610 }, { - "epoch": 1.16, - "learning_rate": 0.00012548485438152688, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.0002185564877832209, + "loss": 0.0119, "step": 107620 }, { - "epoch": 1.16, - "learning_rate": 0.00012546863851592397, - "loss": 0.012, + "epoch": 0.54, + "learning_rate": 0.00021854892009020687, + "loss": 0.0144, "step": 107630 }, { - "epoch": 1.16, - "learning_rate": 0.00012545242265032106, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021854135239719285, + "loss": 0.0144, "step": 107640 }, { - "epoch": 1.16, - "learning_rate": 0.00012543620678471816, - "loss": 0.011, + "epoch": 0.54, + "learning_rate": 0.00021853378470417884, + "loss": 0.0173, "step": 107650 }, { - "epoch": 1.16, - "learning_rate": 0.00012541999091911525, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021852621701116484, + "loss": 0.0188, "step": 107660 }, { - "epoch": 1.16, - "learning_rate": 0.00012540377505351234, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.00021851864931815083, + "loss": 0.0186, "step": 107670 }, { - "epoch": 1.16, - "learning_rate": 0.00012538755918790943, - "loss": 0.0085, + "epoch": 0.54, + "learning_rate": 0.0002185110816251368, + "loss": 0.0114, "step": 107680 }, { - "epoch": 1.16, - "learning_rate": 0.00012537134332230653, - "loss": 0.0133, + "epoch": 0.54, + "learning_rate": 0.00021850351393212282, + "loss": 0.0166, "step": 107690 }, { - "epoch": 1.16, - "learning_rate": 0.00012535512745670362, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.0002184959462391088, + "loss": 0.0158, "step": 107700 }, { - "epoch": 1.16, - "learning_rate": 0.0001253389115911007, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021848837854609478, + "loss": 0.0154, "step": 107710 }, { - "epoch": 1.16, - "learning_rate": 0.0001253226957254978, - "loss": 0.0124, + "epoch": 0.54, + "learning_rate": 0.0002184808108530808, + "loss": 0.0178, "step": 107720 }, { - "epoch": 1.16, - "learning_rate": 0.0001253064798598949, - "loss": 0.0127, + "epoch": 0.54, + "learning_rate": 0.00021847324316006677, + "loss": 0.016, "step": 107730 }, { - "epoch": 1.16, - "learning_rate": 0.00012529026399429202, - "loss": 0.0125, + "epoch": 0.54, + "learning_rate": 0.00021846567546705275, + "loss": 0.0134, "step": 107740 }, { - "epoch": 1.16, - "learning_rate": 0.00012527404812868908, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021845810777403876, + "loss": 0.0142, "step": 107750 }, { - "epoch": 1.16, - "learning_rate": 0.0001252578322630862, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.00021845054008102474, + "loss": 0.0135, "step": 107760 }, { - "epoch": 1.17, - "learning_rate": 0.00012524161639748327, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.00021844297238801072, + "loss": 0.0173, "step": 107770 }, { - "epoch": 1.17, - "learning_rate": 0.0001252254005318804, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.00021843540469499673, + "loss": 0.0131, "step": 107780 }, { - "epoch": 1.17, - "learning_rate": 0.00012520918466627745, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.0002184278370019827, + "loss": 0.0145, "step": 107790 }, { - "epoch": 1.17, - "learning_rate": 0.00012519296880067457, - "loss": 0.0082, + "epoch": 0.54, + "learning_rate": 0.0002184202693089687, + "loss": 0.0142, "step": 107800 }, { - "epoch": 1.17, - "learning_rate": 0.00012517675293507167, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.0002184127016159547, + "loss": 0.0166, "step": 107810 }, { - "epoch": 1.17, - "learning_rate": 0.00012516053706946876, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.00021840513392294068, + "loss": 0.0137, "step": 107820 }, { - "epoch": 1.17, - "learning_rate": 0.00012514432120386585, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021839756622992666, + "loss": 0.0165, "step": 107830 }, { - "epoch": 1.17, - "learning_rate": 0.00012512810533826295, - "loss": 0.013, + "epoch": 0.54, + "learning_rate": 0.00021838999853691265, + "loss": 0.0128, "step": 107840 }, { - "epoch": 1.17, - "learning_rate": 0.00012511188947266004, - "loss": 0.0113, + "epoch": 0.54, + "learning_rate": 0.00021838243084389865, + "loss": 0.0143, "step": 107850 }, { - "epoch": 1.17, - "learning_rate": 0.00012509567360705713, - "loss": 0.0126, + "epoch": 0.54, + "learning_rate": 0.00021837486315088464, + "loss": 0.0123, "step": 107860 }, { - "epoch": 1.17, - "learning_rate": 0.00012507945774145422, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021836729545787062, + "loss": 0.0162, "step": 107870 }, { - "epoch": 1.17, - "learning_rate": 0.00012506324187585132, - "loss": 0.0131, + "epoch": 0.54, + "learning_rate": 0.00021835972776485663, + "loss": 0.0173, "step": 107880 }, { - "epoch": 1.17, - "learning_rate": 0.0001250470260102484, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.0002183521600718426, + "loss": 0.0154, "step": 107890 }, { - "epoch": 1.17, - "learning_rate": 0.0001250308101446455, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.0002183445923788286, + "loss": 0.0174, "step": 107900 }, { - "epoch": 1.17, - "learning_rate": 0.00012501459427904262, - "loss": 0.0117, + "epoch": 0.54, + "learning_rate": 0.0002183370246858146, + "loss": 0.0143, "step": 107910 }, { - "epoch": 1.17, - "learning_rate": 0.0001249983784134397, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.00021832945699280058, + "loss": 0.0183, "step": 107920 }, { - "epoch": 1.17, - "learning_rate": 0.0001249821625478368, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021832188929978656, + "loss": 0.0166, "step": 107930 }, { - "epoch": 1.17, - "learning_rate": 0.00012496594668223387, - "loss": 0.0085, + "epoch": 0.54, + "learning_rate": 0.00021831432160677257, + "loss": 0.0179, "step": 107940 }, { - "epoch": 1.17, - "learning_rate": 0.000124949730816631, - "loss": 0.0152, + "epoch": 0.54, + "learning_rate": 0.00021830675391375855, + "loss": 0.0156, "step": 107950 }, { - "epoch": 1.17, - "learning_rate": 0.00012493351495102809, - "loss": 0.0113, + "epoch": 0.54, + "learning_rate": 0.00021829918622074453, + "loss": 0.0146, "step": 107960 }, { - "epoch": 1.17, - "learning_rate": 0.00012491729908542518, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021829161852773054, + "loss": 0.0139, "step": 107970 }, { - "epoch": 1.17, - "learning_rate": 0.00012490108321982227, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021828405083471652, + "loss": 0.0175, "step": 107980 }, { - "epoch": 1.17, - "learning_rate": 0.00012488486735421936, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.0002182764831417025, + "loss": 0.0176, "step": 107990 }, { - "epoch": 1.17, - "learning_rate": 0.00012486865148861646, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021826891544868848, + "loss": 0.0146, "step": 108000 }, { - "epoch": 1.17, - "eval_cer": 0.9215590728184603, - "eval_loss": 0.008009477518498898, - "eval_runtime": 121.2932, - "eval_samples_per_second": 16.489, - "eval_steps_per_second": 4.122, + "epoch": 0.54, + "eval_cer": 0.9144886934295449, + "eval_loss": 0.011288284324109554, + "eval_runtime": 116.6804, + "eval_samples_per_second": 17.141, + "eval_steps_per_second": 4.285, "step": 108000 }, { - "epoch": 1.17, - "learning_rate": 0.00012485243562301355, - "loss": 0.0115, + "epoch": 0.54, + "learning_rate": 0.0002182613477556745, + "loss": 0.0146, "step": 108010 }, { - "epoch": 1.17, - "learning_rate": 0.00012483621975741064, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.00021825378006266047, + "loss": 0.0141, "step": 108020 }, { - "epoch": 1.17, - "learning_rate": 0.00012482000389180773, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021824621236964646, + "loss": 0.0117, "step": 108030 }, { - "epoch": 1.17, - "learning_rate": 0.00012480378802620483, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021823864467663246, + "loss": 0.0141, "step": 108040 }, { - "epoch": 1.17, - "learning_rate": 0.00012478757216060192, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021823107698361845, + "loss": 0.0155, "step": 108050 }, { - "epoch": 1.17, - "learning_rate": 0.000124771356294999, - "loss": 0.0106, + "epoch": 0.55, + "learning_rate": 0.00021822350929060443, + "loss": 0.0161, "step": 108060 }, { - "epoch": 1.17, - "learning_rate": 0.0001247551404293961, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.00021821594159759044, + "loss": 0.0161, "step": 108070 }, { - "epoch": 1.17, - "learning_rate": 0.0001247389245637932, - "loss": 0.0096, + "epoch": 0.55, + "learning_rate": 0.00021820837390457642, + "loss": 0.0119, "step": 108080 }, { - "epoch": 1.17, - "learning_rate": 0.0001247227086981903, - "loss": 0.0117, + "epoch": 0.55, + "learning_rate": 0.0002182008062115624, + "loss": 0.0153, "step": 108090 }, { - "epoch": 1.17, - "learning_rate": 0.00012470649283258738, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.0002181932385185484, + "loss": 0.0184, "step": 108100 }, { - "epoch": 1.17, - "learning_rate": 0.0001246902769669845, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.0002181856708255344, + "loss": 0.0135, "step": 108110 }, { - "epoch": 1.17, - "learning_rate": 0.00012467406110138157, - "loss": 0.0132, + "epoch": 0.55, + "learning_rate": 0.00021817810313252037, + "loss": 0.0131, "step": 108120 }, { - "epoch": 1.17, - "learning_rate": 0.0001246578452357787, - "loss": 0.0084, + "epoch": 0.55, + "learning_rate": 0.00021817053543950638, + "loss": 0.0136, "step": 108130 }, { - "epoch": 1.17, - "learning_rate": 0.00012464162937017575, - "loss": 0.0139, + "epoch": 0.55, + "learning_rate": 0.00021816296774649236, + "loss": 0.0147, "step": 108140 }, { - "epoch": 1.17, - "learning_rate": 0.00012462541350457287, - "loss": 0.0077, + "epoch": 0.55, + "learning_rate": 0.00021815540005347834, + "loss": 0.0152, "step": 108150 }, { - "epoch": 1.17, - "learning_rate": 0.00012460919763896997, - "loss": 0.0116, + "epoch": 0.55, + "learning_rate": 0.00021814783236046432, + "loss": 0.0159, "step": 108160 }, { - "epoch": 1.17, - "learning_rate": 0.00012459298177336706, - "loss": 0.0077, + "epoch": 0.55, + "learning_rate": 0.00021814026466745033, + "loss": 0.0132, "step": 108170 }, { - "epoch": 1.17, - "learning_rate": 0.00012457676590776415, - "loss": 0.0134, + "epoch": 0.55, + "learning_rate": 0.0002181326969744363, + "loss": 0.0161, "step": 108180 }, { - "epoch": 1.17, - "learning_rate": 0.00012456055004216125, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.0002181251292814223, + "loss": 0.0189, "step": 108190 }, { - "epoch": 1.17, - "learning_rate": 0.00012454433417655834, - "loss": 0.0084, + "epoch": 0.55, + "learning_rate": 0.0002181175615884083, + "loss": 0.0147, "step": 108200 }, { - "epoch": 1.17, - "learning_rate": 0.00012452811831095543, - "loss": 0.0111, + "epoch": 0.55, + "learning_rate": 0.00021810999389539428, + "loss": 0.0148, "step": 108210 }, { - "epoch": 1.17, - "learning_rate": 0.00012451190244535252, - "loss": 0.0114, + "epoch": 0.55, + "learning_rate": 0.00021810242620238027, + "loss": 0.0171, "step": 108220 }, { - "epoch": 1.17, - "learning_rate": 0.00012449568657974962, - "loss": 0.0133, + "epoch": 0.55, + "learning_rate": 0.00021809485850936627, + "loss": 0.0148, "step": 108230 }, { - "epoch": 1.17, - "learning_rate": 0.0001244794707141467, - "loss": 0.0082, + "epoch": 0.55, + "learning_rate": 0.00021808729081635226, + "loss": 0.0146, "step": 108240 }, { - "epoch": 1.17, - "learning_rate": 0.0001244632548485438, - "loss": 0.0115, + "epoch": 0.55, + "learning_rate": 0.00021807972312333824, + "loss": 0.0192, "step": 108250 }, { - "epoch": 1.17, - "learning_rate": 0.0001244470389829409, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.00021807215543032425, + "loss": 0.013, "step": 108260 }, { - "epoch": 1.17, - "learning_rate": 0.000124430823117338, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.00021806458773731023, + "loss": 0.0154, "step": 108270 }, { - "epoch": 1.17, - "learning_rate": 0.00012441460725173508, - "loss": 0.0088, + "epoch": 0.55, + "learning_rate": 0.0002180570200442962, + "loss": 0.016, "step": 108280 }, { - "epoch": 1.17, - "learning_rate": 0.00012439839138613217, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.00021804945235128222, + "loss": 0.0175, "step": 108290 }, { - "epoch": 1.17, - "learning_rate": 0.00012438217552052927, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.0002180418846582682, + "loss": 0.0148, "step": 108300 }, { - "epoch": 1.17, - "learning_rate": 0.00012436595965492639, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.00021803431696525418, + "loss": 0.0147, "step": 108310 }, { - "epoch": 1.17, - "learning_rate": 0.00012434974378932345, - "loss": 0.0123, + "epoch": 0.55, + "learning_rate": 0.0002180267492722402, + "loss": 0.016, "step": 108320 }, { - "epoch": 1.17, - "learning_rate": 0.00012433352792372057, - "loss": 0.0096, + "epoch": 0.55, + "learning_rate": 0.00021801918157922617, + "loss": 0.0168, "step": 108330 }, { - "epoch": 1.17, - "learning_rate": 0.00012431731205811764, - "loss": 0.0066, + "epoch": 0.55, + "learning_rate": 0.00021801161388621215, + "loss": 0.0147, "step": 108340 }, { - "epoch": 1.17, - "learning_rate": 0.00012430109619251476, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021800404619319813, + "loss": 0.0136, "step": 108350 }, { - "epoch": 1.17, - "learning_rate": 0.00012428488032691182, - "loss": 0.0109, + "epoch": 0.55, + "learning_rate": 0.00021799647850018414, + "loss": 0.0153, "step": 108360 }, { - "epoch": 1.17, - "learning_rate": 0.00012426866446130894, - "loss": 0.0072, + "epoch": 0.55, + "learning_rate": 0.00021798891080717012, + "loss": 0.0143, "step": 108370 }, { - "epoch": 1.17, - "learning_rate": 0.00012425244859570603, - "loss": 0.0106, + "epoch": 0.55, + "learning_rate": 0.0002179813431141561, + "loss": 0.0173, "step": 108380 }, { - "epoch": 1.17, - "learning_rate": 0.00012423623273010313, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.0002179737754211421, + "loss": 0.0151, "step": 108390 }, { - "epoch": 1.17, - "learning_rate": 0.00012422001686450022, - "loss": 0.0114, + "epoch": 0.55, + "learning_rate": 0.0002179662077281281, + "loss": 0.0167, "step": 108400 }, { - "epoch": 1.17, - "learning_rate": 0.0001242038009988973, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.00021795864003511408, + "loss": 0.0154, "step": 108410 }, { - "epoch": 1.17, - "learning_rate": 0.0001241875851332944, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021795107234210008, + "loss": 0.0163, "step": 108420 }, { - "epoch": 1.17, - "learning_rate": 0.0001241713692676915, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021794350464908607, + "loss": 0.0185, "step": 108430 }, { - "epoch": 1.17, - "learning_rate": 0.0001241551534020886, - "loss": 0.0116, + "epoch": 0.55, + "learning_rate": 0.00021793593695607205, + "loss": 0.0172, "step": 108440 }, { - "epoch": 1.17, - "learning_rate": 0.00012413893753648568, - "loss": 0.0086, + "epoch": 0.55, + "learning_rate": 0.00021792836926305806, + "loss": 0.0151, "step": 108450 }, { - "epoch": 1.17, - "learning_rate": 0.00012412272167088278, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.00021792080157004404, + "loss": 0.016, "step": 108460 }, { - "epoch": 1.17, - "learning_rate": 0.00012410650580527987, - "loss": 0.0086, + "epoch": 0.55, + "learning_rate": 0.00021791323387703002, + "loss": 0.0127, "step": 108470 }, { - "epoch": 1.17, - "learning_rate": 0.00012409028993967696, - "loss": 0.0108, + "epoch": 0.55, + "learning_rate": 0.00021790566618401603, + "loss": 0.0163, "step": 108480 }, { - "epoch": 1.17, - "learning_rate": 0.00012407407407407406, - "loss": 0.0129, + "epoch": 0.55, + "learning_rate": 0.000217898098491002, + "loss": 0.0133, "step": 108490 }, { - "epoch": 1.17, - "learning_rate": 0.00012405785820847115, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.000217890530797988, + "loss": 0.0174, "step": 108500 }, { - "epoch": 1.17, - "learning_rate": 0.00012404164234286824, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021788296310497397, + "loss": 0.0156, "step": 108510 }, { - "epoch": 1.17, - "learning_rate": 0.00012402542647726533, - "loss": 0.0096, + "epoch": 0.55, + "learning_rate": 0.00021787539541195998, + "loss": 0.0122, "step": 108520 }, { - "epoch": 1.17, - "learning_rate": 0.00012400921061166245, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.00021786782771894596, + "loss": 0.0138, "step": 108530 }, { - "epoch": 1.17, - "learning_rate": 0.00012399299474605952, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021786026002593194, + "loss": 0.0144, "step": 108540 }, { - "epoch": 1.17, - "learning_rate": 0.00012397677888045664, - "loss": 0.0122, + "epoch": 0.55, + "learning_rate": 0.00021785269233291795, + "loss": 0.0116, "step": 108550 }, { - "epoch": 1.17, - "learning_rate": 0.0001239605630148537, - "loss": 0.0107, + "epoch": 0.55, + "learning_rate": 0.00021784512463990393, + "loss": 0.0165, "step": 108560 }, { - "epoch": 1.17, - "learning_rate": 0.00012394434714925082, - "loss": 0.0114, + "epoch": 0.55, + "learning_rate": 0.00021783755694688991, + "loss": 0.0151, "step": 108570 }, { - "epoch": 1.17, - "learning_rate": 0.0001239281312836479, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.00021782998925387592, + "loss": 0.0148, "step": 108580 }, { - "epoch": 1.17, - "learning_rate": 0.000123911915418045, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.0002178224215608619, + "loss": 0.0196, "step": 108590 }, { - "epoch": 1.17, - "learning_rate": 0.0001238956995524421, - "loss": 0.015, + "epoch": 0.55, + "learning_rate": 0.00021781485386784789, + "loss": 0.012, "step": 108600 }, { - "epoch": 1.17, - "learning_rate": 0.0001238794836868392, - "loss": 0.008, + "epoch": 0.55, + "learning_rate": 0.0002178072861748339, + "loss": 0.0145, "step": 108610 }, { - "epoch": 1.17, - "learning_rate": 0.0001238632678212363, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.00021779971848181988, + "loss": 0.0168, "step": 108620 }, { - "epoch": 1.17, - "learning_rate": 0.00012384705195563338, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021779215078880586, + "loss": 0.0145, "step": 108630 }, { - "epoch": 1.17, - "learning_rate": 0.00012383083609003047, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021778458309579187, + "loss": 0.014, "step": 108640 }, { - "epoch": 1.17, - "learning_rate": 0.00012381462022442757, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.00021777701540277785, + "loss": 0.0138, "step": 108650 }, { - "epoch": 1.17, - "learning_rate": 0.00012379840435882466, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.00021776944770976383, + "loss": 0.0156, "step": 108660 }, { - "epoch": 1.17, - "learning_rate": 0.00012378218849322175, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.0002177618800167498, + "loss": 0.0135, "step": 108670 }, { - "epoch": 1.17, - "learning_rate": 0.00012376597262761887, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.00021775431232373582, + "loss": 0.0162, "step": 108680 }, { - "epoch": 1.17, - "learning_rate": 0.00012374975676201594, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.0002177467446307218, + "loss": 0.0203, "step": 108690 }, { - "epoch": 1.18, - "learning_rate": 0.00012373354089641306, - "loss": 0.0077, + "epoch": 0.55, + "learning_rate": 0.00021773917693770778, + "loss": 0.02, "step": 108700 }, { - "epoch": 1.18, - "learning_rate": 0.00012371732503081012, - "loss": 0.0096, + "epoch": 0.55, + "learning_rate": 0.0002177316092446938, + "loss": 0.0156, "step": 108710 }, { - "epoch": 1.18, - "learning_rate": 0.00012370110916520724, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021772404155167977, + "loss": 0.0137, "step": 108720 }, { - "epoch": 1.18, - "learning_rate": 0.0001236848932996043, - "loss": 0.0082, + "epoch": 0.55, + "learning_rate": 0.00021771647385866573, + "loss": 0.015, "step": 108730 }, { - "epoch": 1.18, - "learning_rate": 0.00012366867743400143, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.0002177089061656517, + "loss": 0.0159, "step": 108740 }, { - "epoch": 1.18, - "learning_rate": 0.00012365246156839852, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.00021770133847263772, + "loss": 0.0164, "step": 108750 }, { - "epoch": 1.18, - "learning_rate": 0.0001236362457027956, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.0002176937707796237, + "loss": 0.0166, "step": 108760 }, { - "epoch": 1.18, - "learning_rate": 0.0001236200298371927, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.00021768620308660968, + "loss": 0.0131, "step": 108770 }, { - "epoch": 1.18, - "learning_rate": 0.0001236038139715898, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.0002176786353935957, + "loss": 0.0144, "step": 108780 }, { - "epoch": 1.18, - "learning_rate": 0.0001235875981059869, - "loss": 0.0107, + "epoch": 0.55, + "learning_rate": 0.00021767106770058167, + "loss": 0.0163, "step": 108790 }, { - "epoch": 1.18, - "learning_rate": 0.00012357138224038398, - "loss": 0.0108, + "epoch": 0.55, + "learning_rate": 0.00021766350000756765, + "loss": 0.0138, "step": 108800 }, { - "epoch": 1.18, - "learning_rate": 0.00012355516637478108, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021765593231455366, + "loss": 0.0149, "step": 108810 }, { - "epoch": 1.18, - "learning_rate": 0.00012353895050917817, - "loss": 0.0106, + "epoch": 0.55, + "learning_rate": 0.00021764836462153964, + "loss": 0.0181, "step": 108820 }, { - "epoch": 1.18, - "learning_rate": 0.00012352273464357526, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.00021764079692852562, + "loss": 0.0157, "step": 108830 }, { - "epoch": 1.18, - "learning_rate": 0.00012350651877797236, - "loss": 0.0117, + "epoch": 0.55, + "learning_rate": 0.00021763322923551163, + "loss": 0.0157, "step": 108840 }, { - "epoch": 1.18, - "learning_rate": 0.00012349030291236945, - "loss": 0.0088, + "epoch": 0.55, + "learning_rate": 0.0002176256615424976, + "loss": 0.0162, "step": 108850 }, { - "epoch": 1.18, - "learning_rate": 0.00012347408704676654, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.0002176180938494836, + "loss": 0.0153, "step": 108860 }, { - "epoch": 1.18, - "learning_rate": 0.00012345787118116363, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.0002176105261564696, + "loss": 0.0141, "step": 108870 }, { - "epoch": 1.18, - "learning_rate": 0.00012344165531556073, - "loss": 0.0113, + "epoch": 0.55, + "learning_rate": 0.00021760295846345558, + "loss": 0.0152, "step": 108880 }, { - "epoch": 1.18, - "learning_rate": 0.00012342543944995782, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.00021759539077044156, + "loss": 0.0146, "step": 108890 }, { - "epoch": 1.18, - "learning_rate": 0.00012340922358435494, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021758782307742755, + "loss": 0.0162, "step": 108900 }, { - "epoch": 1.18, - "learning_rate": 0.000123393007718752, - "loss": 0.0107, + "epoch": 0.55, + "learning_rate": 0.00021758025538441355, + "loss": 0.0141, "step": 108910 }, { - "epoch": 1.18, - "learning_rate": 0.00012337679185314912, - "loss": 0.0076, + "epoch": 0.55, + "learning_rate": 0.00021757268769139954, + "loss": 0.0153, "step": 108920 }, { - "epoch": 1.18, - "learning_rate": 0.0001233605759875462, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.00021756511999838552, + "loss": 0.0144, "step": 108930 }, { - "epoch": 1.18, - "learning_rate": 0.0001233443601219433, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.00021755755230537153, + "loss": 0.0137, "step": 108940 }, { - "epoch": 1.18, - "learning_rate": 0.00012332814425634038, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.0002175499846123575, + "loss": 0.0129, "step": 108950 }, { - "epoch": 1.18, - "learning_rate": 0.0001233119283907375, - "loss": 0.0109, + "epoch": 0.55, + "learning_rate": 0.0002175424169193435, + "loss": 0.0133, "step": 108960 }, { - "epoch": 1.18, - "learning_rate": 0.0001232957125251346, - "loss": 0.0125, + "epoch": 0.55, + "learning_rate": 0.0002175348492263295, + "loss": 0.0119, "step": 108970 }, { - "epoch": 1.18, - "learning_rate": 0.00012327949665953168, - "loss": 0.0115, + "epoch": 0.55, + "learning_rate": 0.00021752728153331548, + "loss": 0.0169, "step": 108980 }, { - "epoch": 1.18, - "learning_rate": 0.00012326328079392877, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021751971384030146, + "loss": 0.0128, "step": 108990 }, { - "epoch": 1.18, - "learning_rate": 0.00012324706492832587, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.00021751214614728747, + "loss": 0.0128, "step": 109000 }, { - "epoch": 1.18, - "eval_cer": 0.9215503867888964, - "eval_loss": 0.0077276891097426414, - "eval_runtime": 121.2693, - "eval_samples_per_second": 16.492, - "eval_steps_per_second": 4.123, + "epoch": 0.55, + "eval_cer": 0.9145003381830497, + "eval_loss": 0.011132709681987762, + "eval_runtime": 116.5842, + "eval_samples_per_second": 17.155, + "eval_steps_per_second": 4.289, "step": 109000 }, { - "epoch": 1.18, - "learning_rate": 0.00012323084906272296, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.00021750457845427345, + "loss": 0.0133, "step": 109010 }, { - "epoch": 1.18, - "learning_rate": 0.00012321463319712005, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021749701076125943, + "loss": 0.0148, "step": 109020 }, { - "epoch": 1.18, - "learning_rate": 0.00012319841733151714, - "loss": 0.0109, + "epoch": 0.55, + "learning_rate": 0.00021748944306824544, + "loss": 0.0132, "step": 109030 }, { - "epoch": 1.18, - "learning_rate": 0.00012318220146591424, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.00021748187537523142, + "loss": 0.0138, "step": 109040 }, { - "epoch": 1.18, - "learning_rate": 0.00012316598560031133, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.0002174743076822174, + "loss": 0.0147, "step": 109050 }, { - "epoch": 1.18, - "learning_rate": 0.00012314976973470842, - "loss": 0.0077, + "epoch": 0.55, + "learning_rate": 0.00021746673998920338, + "loss": 0.0134, "step": 109060 }, { - "epoch": 1.18, - "learning_rate": 0.00012313355386910552, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.0002174591722961894, + "loss": 0.0126, "step": 109070 }, { - "epoch": 1.18, - "learning_rate": 0.0001231173380035026, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021745160460317537, + "loss": 0.0146, "step": 109080 }, { - "epoch": 1.18, - "learning_rate": 0.0001231011221378997, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021744403691016136, + "loss": 0.013, "step": 109090 }, { - "epoch": 1.18, - "learning_rate": 0.0001230849062722968, - "loss": 0.0109, + "epoch": 0.55, + "learning_rate": 0.00021743646921714736, + "loss": 0.0133, "step": 109100 }, { - "epoch": 1.18, - "learning_rate": 0.0001230686904066939, - "loss": 0.0082, + "epoch": 0.55, + "learning_rate": 0.00021742890152413335, + "loss": 0.0145, "step": 109110 }, { - "epoch": 1.18, - "learning_rate": 0.000123052474541091, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.00021742133383111933, + "loss": 0.0169, "step": 109120 }, { - "epoch": 1.18, - "learning_rate": 0.00012303625867548807, - "loss": 0.008, + "epoch": 0.55, + "learning_rate": 0.00021741376613810534, + "loss": 0.0157, "step": 109130 }, { - "epoch": 1.18, - "learning_rate": 0.0001230200428098852, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.00021740619844509132, + "loss": 0.0158, "step": 109140 }, { - "epoch": 1.18, - "learning_rate": 0.00012300382694428226, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.0002173986307520773, + "loss": 0.017, "step": 109150 }, { - "epoch": 1.18, - "learning_rate": 0.00012298761107867938, - "loss": 0.0141, + "epoch": 0.55, + "learning_rate": 0.0002173910630590633, + "loss": 0.0136, "step": 109160 }, { - "epoch": 1.18, - "learning_rate": 0.00012297139521307647, - "loss": 0.0123, + "epoch": 0.55, + "learning_rate": 0.0002173834953660493, + "loss": 0.0227, "step": 109170 }, { - "epoch": 1.18, - "learning_rate": 0.00012295517934747356, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021737592767303527, + "loss": 0.0156, "step": 109180 }, { - "epoch": 1.18, - "learning_rate": 0.00012293896348187066, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021736835998002128, + "loss": 0.0136, "step": 109190 }, { - "epoch": 1.18, - "learning_rate": 0.00012292274761626775, - "loss": 0.0115, + "epoch": 0.55, + "learning_rate": 0.00021736079228700726, + "loss": 0.0174, "step": 109200 }, { - "epoch": 1.18, - "learning_rate": 0.00012290653175066484, - "loss": 0.0086, + "epoch": 0.55, + "learning_rate": 0.00021735322459399324, + "loss": 0.0162, "step": 109210 }, { - "epoch": 1.18, - "learning_rate": 0.00012289031588506193, - "loss": 0.0106, + "epoch": 0.55, + "learning_rate": 0.00021734565690097925, + "loss": 0.0196, "step": 109220 }, { - "epoch": 1.18, - "learning_rate": 0.00012287410001945903, - "loss": 0.0109, + "epoch": 0.55, + "learning_rate": 0.00021733808920796523, + "loss": 0.0146, "step": 109230 }, { - "epoch": 1.18, - "learning_rate": 0.00012285788415385612, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.0002173305215149512, + "loss": 0.0141, "step": 109240 }, { - "epoch": 1.18, - "learning_rate": 0.0001228416682882532, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.0002173229538219372, + "loss": 0.0138, "step": 109250 }, { - "epoch": 1.18, - "learning_rate": 0.0001228254524226503, - "loss": 0.0078, + "epoch": 0.55, + "learning_rate": 0.0002173153861289232, + "loss": 0.019, "step": 109260 }, { - "epoch": 1.18, - "learning_rate": 0.0001228092365570474, - "loss": 0.0076, + "epoch": 0.55, + "learning_rate": 0.00021730781843590918, + "loss": 0.0148, "step": 109270 }, { - "epoch": 1.18, - "learning_rate": 0.0001227930206914445, - "loss": 0.0088, + "epoch": 0.55, + "learning_rate": 0.00021730025074289517, + "loss": 0.0146, "step": 109280 }, { - "epoch": 1.18, - "learning_rate": 0.00012277680482584158, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.00021729268304988117, + "loss": 0.0189, "step": 109290 }, { - "epoch": 1.18, - "learning_rate": 0.00012276058896023868, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.00021728511535686716, + "loss": 0.0137, "step": 109300 }, { - "epoch": 1.18, - "learning_rate": 0.00012274437309463577, - "loss": 0.0119, + "epoch": 0.55, + "learning_rate": 0.00021727754766385314, + "loss": 0.0152, "step": 109310 }, { - "epoch": 1.18, - "learning_rate": 0.0001227281572290329, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.00021726997997083915, + "loss": 0.0151, "step": 109320 }, { - "epoch": 1.18, - "learning_rate": 0.00012271194136342995, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.00021726241227782513, + "loss": 0.0135, "step": 109330 }, { - "epoch": 1.18, - "learning_rate": 0.00012269572549782707, - "loss": 0.0111, + "epoch": 0.55, + "learning_rate": 0.0002172548445848111, + "loss": 0.0156, "step": 109340 }, { - "epoch": 1.18, - "learning_rate": 0.00012267950963222417, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.00021724727689179712, + "loss": 0.0176, "step": 109350 }, { - "epoch": 1.18, - "learning_rate": 0.00012266329376662126, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.0002172397091987831, + "loss": 0.0189, "step": 109360 }, { - "epoch": 1.18, - "learning_rate": 0.00012264707790101835, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021723214150576908, + "loss": 0.0128, "step": 109370 }, { - "epoch": 1.18, - "learning_rate": 0.00012263086203541544, - "loss": 0.0117, + "epoch": 0.55, + "learning_rate": 0.0002172245738127551, + "loss": 0.0181, "step": 109380 }, { - "epoch": 1.18, - "learning_rate": 0.00012261464616981254, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021721700611974107, + "loss": 0.017, "step": 109390 }, { - "epoch": 1.18, - "learning_rate": 0.00012259843030420963, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021720943842672705, + "loss": 0.0163, "step": 109400 }, { - "epoch": 1.18, - "learning_rate": 0.00012258221443860672, - "loss": 0.0107, + "epoch": 0.55, + "learning_rate": 0.00021720187073371303, + "loss": 0.0133, "step": 109410 }, { - "epoch": 1.18, - "learning_rate": 0.00012256599857300382, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021719430304069904, + "loss": 0.0169, "step": 109420 }, { - "epoch": 1.18, - "learning_rate": 0.0001225497827074009, - "loss": 0.012, + "epoch": 0.55, + "learning_rate": 0.00021718673534768502, + "loss": 0.0212, "step": 109430 }, { - "epoch": 1.18, - "learning_rate": 0.000122533566841798, - "loss": 0.012, + "epoch": 0.55, + "learning_rate": 0.000217179167654671, + "loss": 0.0189, "step": 109440 }, { - "epoch": 1.18, - "learning_rate": 0.0001225173509761951, - "loss": 0.0113, + "epoch": 0.55, + "learning_rate": 0.000217171599961657, + "loss": 0.0172, "step": 109450 }, { - "epoch": 1.18, - "learning_rate": 0.0001225011351105922, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.000217164032268643, + "loss": 0.0149, "step": 109460 }, { - "epoch": 1.18, - "learning_rate": 0.0001224849192449893, - "loss": 0.0115, + "epoch": 0.55, + "learning_rate": 0.00021715646457562898, + "loss": 0.0174, "step": 109470 }, { - "epoch": 1.18, - "learning_rate": 0.00012246870337938637, - "loss": 0.0119, + "epoch": 0.55, + "learning_rate": 0.00021714889688261498, + "loss": 0.0147, "step": 109480 }, { - "epoch": 1.18, - "learning_rate": 0.0001224524875137835, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.00021714132918960097, + "loss": 0.0137, "step": 109490 }, { - "epoch": 1.18, - "learning_rate": 0.00012243627164818056, - "loss": 0.0081, + "epoch": 0.55, + "learning_rate": 0.00021713376149658695, + "loss": 0.0174, "step": 109500 }, { - "epoch": 1.18, - "learning_rate": 0.00012242005578257768, - "loss": 0.0088, + "epoch": 0.55, + "learning_rate": 0.00021712619380357296, + "loss": 0.0149, "step": 109510 }, { - "epoch": 1.18, - "learning_rate": 0.00012240383991697474, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021711862611055894, + "loss": 0.0162, "step": 109520 }, { - "epoch": 1.18, - "learning_rate": 0.00012238762405137186, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.00021711105841754492, + "loss": 0.0143, "step": 109530 }, { - "epoch": 1.18, - "learning_rate": 0.00012237140818576896, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021710349072453093, + "loss": 0.0132, "step": 109540 }, { - "epoch": 1.18, - "learning_rate": 0.00012235519232016605, - "loss": 0.0115, + "epoch": 0.55, + "learning_rate": 0.0002170959230315169, + "loss": 0.0123, "step": 109550 }, { - "epoch": 1.18, - "learning_rate": 0.00012233897645456314, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.0002170883553385029, + "loss": 0.0172, "step": 109560 }, { - "epoch": 1.18, - "learning_rate": 0.00012232276058896023, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021708078764548887, + "loss": 0.0189, "step": 109570 }, { - "epoch": 1.18, - "learning_rate": 0.00012230654472335733, - "loss": 0.0122, + "epoch": 0.55, + "learning_rate": 0.00021707321995247488, + "loss": 0.0147, "step": 109580 }, { - "epoch": 1.18, - "learning_rate": 0.00012229032885775442, - "loss": 0.0114, + "epoch": 0.55, + "learning_rate": 0.00021706565225946086, + "loss": 0.0143, "step": 109590 }, { - "epoch": 1.18, - "learning_rate": 0.0001222741129921515, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021705808456644684, + "loss": 0.0121, "step": 109600 }, { - "epoch": 1.18, - "learning_rate": 0.0001222578971265486, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021705051687343285, + "loss": 0.015, "step": 109610 }, { - "epoch": 1.19, - "learning_rate": 0.0001222416812609457, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.00021704294918041883, + "loss": 0.0157, "step": 109620 }, { - "epoch": 1.19, - "learning_rate": 0.0001222254653953428, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021703538148740481, + "loss": 0.0152, "step": 109630 }, { - "epoch": 1.19, - "learning_rate": 0.00012220924952973988, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.00021702781379439082, + "loss": 0.0142, "step": 109640 }, { - "epoch": 1.19, - "learning_rate": 0.00012219303366413698, - "loss": 0.0127, + "epoch": 0.55, + "learning_rate": 0.0002170202461013768, + "loss": 0.0134, "step": 109650 }, { - "epoch": 1.19, - "learning_rate": 0.00012217681779853407, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021701267840836279, + "loss": 0.0163, "step": 109660 }, { - "epoch": 1.19, - "learning_rate": 0.00012216060193293116, - "loss": 0.0086, + "epoch": 0.55, + "learning_rate": 0.0002170051107153488, + "loss": 0.0142, "step": 109670 }, { - "epoch": 1.19, - "learning_rate": 0.00012214438606732825, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021699754302233478, + "loss": 0.012, "step": 109680 }, { - "epoch": 1.19, - "learning_rate": 0.00012212817020172537, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.00021698997532932076, + "loss": 0.0158, "step": 109690 }, { - "epoch": 1.19, - "learning_rate": 0.00012211195433612244, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021698240763630677, + "loss": 0.0142, "step": 109700 }, { - "epoch": 1.19, - "learning_rate": 0.00012209573847051956, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021697483994329275, + "loss": 0.0159, "step": 109710 }, { - "epoch": 1.19, - "learning_rate": 0.00012207952260491663, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.00021696727225027873, + "loss": 0.0153, "step": 109720 }, { - "epoch": 1.19, - "learning_rate": 0.00012206330673931373, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.0002169597045572647, + "loss": 0.0123, "step": 109730 }, { - "epoch": 1.19, - "learning_rate": 0.00012204709087371082, - "loss": 0.0126, + "epoch": 0.55, + "learning_rate": 0.00021695213686425072, + "loss": 0.0161, "step": 109740 }, { - "epoch": 1.19, - "learning_rate": 0.00012203087500810793, - "loss": 0.0132, + "epoch": 0.55, + "learning_rate": 0.0002169445691712367, + "loss": 0.0119, "step": 109750 }, { - "epoch": 1.19, - "learning_rate": 0.00012201465914250501, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021693700147822268, + "loss": 0.0182, "step": 109760 }, { - "epoch": 1.19, - "learning_rate": 0.00012199844327690212, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.0002169294337852087, + "loss": 0.019, "step": 109770 }, { - "epoch": 1.19, - "learning_rate": 0.0001219822274112992, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.00021692186609219467, + "loss": 0.0133, "step": 109780 }, { - "epoch": 1.19, - "learning_rate": 0.0001219660115456963, - "loss": 0.0073, + "epoch": 0.55, + "learning_rate": 0.00021691429839918065, + "loss": 0.0151, "step": 109790 }, { - "epoch": 1.19, - "learning_rate": 0.00012194979568009338, - "loss": 0.0116, + "epoch": 0.55, + "learning_rate": 0.00021690673070616666, + "loss": 0.0133, "step": 109800 }, { - "epoch": 1.19, - "learning_rate": 0.00012193357981449049, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021689916301315264, + "loss": 0.0112, "step": 109810 }, { - "epoch": 1.19, - "learning_rate": 0.00012191736394888758, - "loss": 0.0096, + "epoch": 0.55, + "learning_rate": 0.00021689159532013862, + "loss": 0.0145, "step": 109820 }, { - "epoch": 1.19, - "learning_rate": 0.00012190114808328467, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.00021688402762712463, + "loss": 0.0114, "step": 109830 }, { - "epoch": 1.19, - "learning_rate": 0.00012188493221768177, - "loss": 0.0084, + "epoch": 0.55, + "learning_rate": 0.00021687645993411061, + "loss": 0.0134, "step": 109840 }, { - "epoch": 1.19, - "learning_rate": 0.00012186871635207887, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.0002168688922410966, + "loss": 0.0146, "step": 109850 }, { - "epoch": 1.19, - "learning_rate": 0.00012185250048647595, - "loss": 0.012, + "epoch": 0.55, + "learning_rate": 0.0002168613245480826, + "loss": 0.0147, "step": 109860 }, { - "epoch": 1.19, - "learning_rate": 0.00012183628462087306, - "loss": 0.0129, + "epoch": 0.55, + "learning_rate": 0.00021685375685506859, + "loss": 0.0115, "step": 109870 }, { - "epoch": 1.19, - "learning_rate": 0.00012182006875527014, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.00021684618916205457, + "loss": 0.0162, "step": 109880 }, { - "epoch": 1.19, - "learning_rate": 0.00012180385288966724, - "loss": 0.0122, + "epoch": 0.55, + "learning_rate": 0.00021683862146904058, + "loss": 0.0133, "step": 109890 }, { - "epoch": 1.19, - "learning_rate": 0.00012178763702406432, - "loss": 0.0071, + "epoch": 0.55, + "learning_rate": 0.00021683105377602656, + "loss": 0.0174, "step": 109900 }, { - "epoch": 1.19, - "learning_rate": 0.00012177142115846143, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.00021682348608301254, + "loss": 0.0163, "step": 109910 }, { - "epoch": 1.19, - "learning_rate": 0.00012175520529285852, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021681591838999852, + "loss": 0.018, "step": 109920 }, { - "epoch": 1.19, - "learning_rate": 0.00012173898942725561, - "loss": 0.0079, + "epoch": 0.55, + "learning_rate": 0.00021680835069698453, + "loss": 0.0169, "step": 109930 }, { - "epoch": 1.19, - "learning_rate": 0.0001217227735616527, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.0002168007830039705, + "loss": 0.0144, "step": 109940 }, { - "epoch": 1.19, - "learning_rate": 0.0001217065576960498, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.0002167932153109565, + "loss": 0.0142, "step": 109950 }, { - "epoch": 1.19, - "learning_rate": 0.00012169034183044689, - "loss": 0.0084, + "epoch": 0.55, + "learning_rate": 0.0002167856476179425, + "loss": 0.0112, "step": 109960 }, { - "epoch": 1.19, - "learning_rate": 0.000121674125964844, - "loss": 0.0124, + "epoch": 0.55, + "learning_rate": 0.00021677807992492848, + "loss": 0.0167, "step": 109970 }, { - "epoch": 1.19, - "learning_rate": 0.00012165791009924108, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021677051223191444, + "loss": 0.0149, "step": 109980 }, { - "epoch": 1.19, - "learning_rate": 0.00012164169423363818, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021676294453890042, + "loss": 0.0146, "step": 109990 }, { - "epoch": 1.19, - "learning_rate": 0.00012162547836803526, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.00021675537684588643, + "loss": 0.0159, "step": 110000 }, { - "epoch": 1.19, - "eval_cer": 0.9215582042155038, - "eval_loss": 0.007691715378314257, - "eval_runtime": 121.2349, - "eval_samples_per_second": 16.497, - "eval_steps_per_second": 4.124, + "epoch": 0.55, + "eval_cer": 0.9144751078837893, + "eval_loss": 0.010691503062844276, + "eval_runtime": 116.7007, + "eval_samples_per_second": 17.138, + "eval_steps_per_second": 4.284, "step": 110000 }, { - "epoch": 1.19, - "learning_rate": 0.00012160926250243237, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.0002167478091528724, + "loss": 0.015, "step": 110010 }, { - "epoch": 1.19, - "learning_rate": 0.00012159304663682946, - "loss": 0.0125, + "epoch": 0.56, + "learning_rate": 0.0002167402414598584, + "loss": 0.0209, "step": 110020 }, { - "epoch": 1.19, - "learning_rate": 0.00012157683077122655, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.0002167326737668444, + "loss": 0.0157, "step": 110030 }, { - "epoch": 1.19, - "learning_rate": 0.00012156061490562365, - "loss": 0.0124, + "epoch": 0.56, + "learning_rate": 0.00021672510607383038, + "loss": 0.0184, "step": 110040 }, { - "epoch": 1.19, - "learning_rate": 0.00012154439904002074, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.00021671753838081636, + "loss": 0.0169, "step": 110050 }, { - "epoch": 1.19, - "learning_rate": 0.00012152818317441785, - "loss": 0.0079, + "epoch": 0.56, + "learning_rate": 0.00021670997068780237, + "loss": 0.0206, "step": 110060 }, { - "epoch": 1.19, - "learning_rate": 0.00012151196730881494, - "loss": 0.0072, + "epoch": 0.56, + "learning_rate": 0.00021670240299478835, + "loss": 0.0151, "step": 110070 }, { - "epoch": 1.19, - "learning_rate": 0.00012149575144321203, - "loss": 0.0113, + "epoch": 0.56, + "learning_rate": 0.00021669483530177433, + "loss": 0.0166, "step": 110080 }, { - "epoch": 1.19, - "learning_rate": 0.00012147953557760912, - "loss": 0.0108, + "epoch": 0.56, + "learning_rate": 0.00021668726760876034, + "loss": 0.0171, "step": 110090 }, { - "epoch": 1.19, - "learning_rate": 0.00012146331971200622, - "loss": 0.0124, + "epoch": 0.56, + "learning_rate": 0.00021667969991574632, + "loss": 0.0128, "step": 110100 }, { - "epoch": 1.19, - "learning_rate": 0.00012144710384640331, - "loss": 0.0135, + "epoch": 0.56, + "learning_rate": 0.0002166721322227323, + "loss": 0.0141, "step": 110110 }, { - "epoch": 1.19, - "learning_rate": 0.00012143088798080042, - "loss": 0.0127, + "epoch": 0.56, + "learning_rate": 0.00021666456452971829, + "loss": 0.0174, "step": 110120 }, { - "epoch": 1.19, - "learning_rate": 0.0001214146721151975, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.0002166569968367043, + "loss": 0.0129, "step": 110130 }, { - "epoch": 1.19, - "learning_rate": 0.0001213984562495946, - "loss": 0.01, + "epoch": 0.56, + "learning_rate": 0.00021664942914369028, + "loss": 0.0202, "step": 110140 }, { - "epoch": 1.19, - "learning_rate": 0.00012138224038399168, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.00021664186145067626, + "loss": 0.0145, "step": 110150 }, { - "epoch": 1.19, - "learning_rate": 0.00012136602451838879, - "loss": 0.0107, + "epoch": 0.56, + "learning_rate": 0.00021663429375766227, + "loss": 0.0186, "step": 110160 }, { - "epoch": 1.19, - "learning_rate": 0.00012134980865278588, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021662672606464825, + "loss": 0.0183, "step": 110170 }, { - "epoch": 1.19, - "learning_rate": 0.00012133359278718297, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.00021661915837163423, + "loss": 0.0143, "step": 110180 }, { - "epoch": 1.19, - "learning_rate": 0.00012131737692158007, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.00021661159067862024, + "loss": 0.0127, "step": 110190 }, { - "epoch": 1.19, - "learning_rate": 0.00012130116105597716, - "loss": 0.0115, + "epoch": 0.56, + "learning_rate": 0.00021660402298560622, + "loss": 0.0195, "step": 110200 }, { - "epoch": 1.19, - "learning_rate": 0.00012128494519037425, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.0002165964552925922, + "loss": 0.0149, "step": 110210 }, { - "epoch": 1.19, - "learning_rate": 0.00012126872932477136, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.0002165888875995782, + "loss": 0.0144, "step": 110220 }, { - "epoch": 1.19, - "learning_rate": 0.00012125251345916844, - "loss": 0.0116, + "epoch": 0.56, + "learning_rate": 0.0002165813199065642, + "loss": 0.0134, "step": 110230 }, { - "epoch": 1.19, - "learning_rate": 0.00012123629759356554, - "loss": 0.011, + "epoch": 0.56, + "learning_rate": 0.00021657375221355017, + "loss": 0.0139, "step": 110240 }, { - "epoch": 1.19, - "learning_rate": 0.00012122008172796262, - "loss": 0.0112, + "epoch": 0.56, + "learning_rate": 0.00021656618452053618, + "loss": 0.0156, "step": 110250 }, { - "epoch": 1.19, - "learning_rate": 0.00012120386586235973, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.00021655861682752216, + "loss": 0.0141, "step": 110260 }, { - "epoch": 1.19, - "learning_rate": 0.00012118764999675681, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.00021655104913450814, + "loss": 0.0146, "step": 110270 }, { - "epoch": 1.19, - "learning_rate": 0.00012117143413115391, - "loss": 0.0088, + "epoch": 0.56, + "learning_rate": 0.00021654348144149415, + "loss": 0.0167, "step": 110280 }, { - "epoch": 1.19, - "learning_rate": 0.000121155218265551, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021653591374848013, + "loss": 0.0131, "step": 110290 }, { - "epoch": 1.19, - "learning_rate": 0.0001211390023999481, - "loss": 0.008, + "epoch": 0.56, + "learning_rate": 0.00021652834605546611, + "loss": 0.0151, "step": 110300 }, { - "epoch": 1.19, - "learning_rate": 0.00012112278653434519, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.0002165207783624521, + "loss": 0.021, "step": 110310 }, { - "epoch": 1.19, - "learning_rate": 0.0001211065706687423, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.0002165132106694381, + "loss": 0.0161, "step": 110320 }, { - "epoch": 1.19, - "learning_rate": 0.00012109035480313938, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021650564297642409, + "loss": 0.0161, "step": 110330 }, { - "epoch": 1.19, - "learning_rate": 0.00012107413893753648, - "loss": 0.0137, + "epoch": 0.56, + "learning_rate": 0.00021649807528341007, + "loss": 0.0179, "step": 110340 }, { - "epoch": 1.19, - "learning_rate": 0.00012105792307193356, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.00021649050759039608, + "loss": 0.0155, "step": 110350 }, { - "epoch": 1.19, - "learning_rate": 0.00012104170720633067, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.00021648293989738206, + "loss": 0.0141, "step": 110360 }, { - "epoch": 1.19, - "learning_rate": 0.00012102549134072775, - "loss": 0.0106, + "epoch": 0.56, + "learning_rate": 0.00021647537220436804, + "loss": 0.0187, "step": 110370 }, { - "epoch": 1.19, - "learning_rate": 0.00012100927547512485, - "loss": 0.0072, + "epoch": 0.56, + "learning_rate": 0.00021646780451135405, + "loss": 0.0149, "step": 110380 }, { - "epoch": 1.19, - "learning_rate": 0.00012099305960952195, - "loss": 0.01, + "epoch": 0.56, + "learning_rate": 0.00021646023681834003, + "loss": 0.0146, "step": 110390 }, { - "epoch": 1.19, - "learning_rate": 0.00012097684374391904, - "loss": 0.01, + "epoch": 0.56, + "learning_rate": 0.000216452669125326, + "loss": 0.0131, "step": 110400 }, { - "epoch": 1.19, - "learning_rate": 0.00012096062787831613, - "loss": 0.0064, + "epoch": 0.56, + "learning_rate": 0.00021644510143231202, + "loss": 0.0139, "step": 110410 }, { - "epoch": 1.19, - "learning_rate": 0.00012094441201271323, - "loss": 0.0088, + "epoch": 0.56, + "learning_rate": 0.000216437533739298, + "loss": 0.0112, "step": 110420 }, { - "epoch": 1.19, - "learning_rate": 0.00012092819614711032, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021642996604628398, + "loss": 0.0148, "step": 110430 }, { - "epoch": 1.19, - "learning_rate": 0.00012091198028150742, - "loss": 0.0069, + "epoch": 0.56, + "learning_rate": 0.00021642239835327, + "loss": 0.0128, "step": 110440 }, { - "epoch": 1.19, - "learning_rate": 0.0001208957644159045, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021641483066025597, + "loss": 0.0147, "step": 110450 }, { - "epoch": 1.19, - "learning_rate": 0.00012087954855030161, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.00021640726296724195, + "loss": 0.0164, "step": 110460 }, { - "epoch": 1.19, - "learning_rate": 0.00012086333268469869, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.00021639969527422793, + "loss": 0.0181, "step": 110470 }, { - "epoch": 1.19, - "learning_rate": 0.0001208471168190958, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.00021639212758121394, + "loss": 0.0146, "step": 110480 }, { - "epoch": 1.19, - "learning_rate": 0.00012083090095349289, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.00021638455988819992, + "loss": 0.016, "step": 110490 }, { - "epoch": 1.19, - "learning_rate": 0.00012081468508788998, - "loss": 0.017, + "epoch": 0.56, + "learning_rate": 0.0002163769921951859, + "loss": 0.0187, "step": 110500 }, { - "epoch": 1.19, - "learning_rate": 0.00012079846922228707, - "loss": 0.0102, + "epoch": 0.56, + "learning_rate": 0.00021636942450217191, + "loss": 0.014, "step": 110510 }, { - "epoch": 1.19, - "learning_rate": 0.00012078225335668417, - "loss": 0.0066, + "epoch": 0.56, + "learning_rate": 0.0002163618568091579, + "loss": 0.0164, "step": 110520 }, { - "epoch": 1.19, - "learning_rate": 0.00012076603749108126, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.00021635428911614388, + "loss": 0.0137, "step": 110530 }, { - "epoch": 1.19, - "learning_rate": 0.00012074982162547837, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021634672142312989, + "loss": 0.016, "step": 110540 }, { - "epoch": 1.2, - "learning_rate": 0.00012073360575987544, - "loss": 0.0079, + "epoch": 0.56, + "learning_rate": 0.00021633915373011587, + "loss": 0.0117, "step": 110550 }, { - "epoch": 1.2, - "learning_rate": 0.00012071738989427255, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021633158603710185, + "loss": 0.0146, "step": 110560 }, { - "epoch": 1.2, - "learning_rate": 0.00012070117402866963, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.00021632401834408786, + "loss": 0.0161, "step": 110570 }, { - "epoch": 1.2, - "learning_rate": 0.00012068495816306674, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021631645065107384, + "loss": 0.0128, "step": 110580 }, { - "epoch": 1.2, - "learning_rate": 0.00012066874229746382, - "loss": 0.0126, + "epoch": 0.56, + "learning_rate": 0.00021630888295805982, + "loss": 0.0235, "step": 110590 }, { - "epoch": 1.2, - "learning_rate": 0.00012065252643186092, - "loss": 0.0112, + "epoch": 0.56, + "learning_rate": 0.00021630131526504583, + "loss": 0.0162, "step": 110600 }, { - "epoch": 1.2, - "learning_rate": 0.00012063631056625801, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.0002162937475720318, + "loss": 0.0138, "step": 110610 }, { - "epoch": 1.2, - "learning_rate": 0.00012062009470065511, - "loss": 0.011, + "epoch": 0.56, + "learning_rate": 0.0002162861798790178, + "loss": 0.0136, "step": 110620 }, { - "epoch": 1.2, - "learning_rate": 0.0001206038788350522, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021627861218600377, + "loss": 0.0175, "step": 110630 }, { - "epoch": 1.2, - "learning_rate": 0.0001205876629694493, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.00021627104449298978, + "loss": 0.0148, "step": 110640 }, { - "epoch": 1.2, - "learning_rate": 0.00012057144710384639, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.00021626347679997576, + "loss": 0.0158, "step": 110650 }, { - "epoch": 1.2, - "learning_rate": 0.00012055523123824349, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.00021625590910696174, + "loss": 0.0154, "step": 110660 }, { - "epoch": 1.2, - "learning_rate": 0.00012053901537264057, - "loss": 0.0088, + "epoch": 0.56, + "learning_rate": 0.00021624834141394775, + "loss": 0.0143, "step": 110670 }, { - "epoch": 1.2, - "learning_rate": 0.00012052279950703768, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021624077372093373, + "loss": 0.0148, "step": 110680 }, { - "epoch": 1.2, - "learning_rate": 0.00012050658364143476, - "loss": 0.0071, + "epoch": 0.56, + "learning_rate": 0.00021623320602791972, + "loss": 0.0164, "step": 110690 }, { - "epoch": 1.2, - "learning_rate": 0.00012049036777583186, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021622563833490572, + "loss": 0.0163, "step": 110700 }, { - "epoch": 1.2, - "learning_rate": 0.00012047415191022896, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.0002162180706418917, + "loss": 0.015, "step": 110710 }, { - "epoch": 1.2, - "learning_rate": 0.00012045793604462605, - "loss": 0.0085, + "epoch": 0.56, + "learning_rate": 0.0002162105029488777, + "loss": 0.0141, "step": 110720 }, { - "epoch": 1.2, - "learning_rate": 0.00012044172017902314, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.0002162029352558637, + "loss": 0.0157, "step": 110730 }, { - "epoch": 1.2, - "learning_rate": 0.00012042550431342023, + "epoch": 0.56, + "learning_rate": 0.00021619536756284968, "loss": 0.0123, "step": 110740 }, { - "epoch": 1.2, - "learning_rate": 0.00012040928844781733, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021618779986983566, + "loss": 0.0141, "step": 110750 }, { - "epoch": 1.2, - "learning_rate": 0.00012039307258221443, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.00021618023217682167, + "loss": 0.0146, "step": 110760 }, { - "epoch": 1.2, - "learning_rate": 0.00012037685671661151, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021617266448380765, + "loss": 0.0148, "step": 110770 }, { - "epoch": 1.2, - "learning_rate": 0.00012036064085100862, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.00021616509679079363, + "loss": 0.0186, "step": 110780 }, { - "epoch": 1.2, - "learning_rate": 0.00012034442498540572, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021615752909777964, + "loss": 0.0168, "step": 110790 }, { - "epoch": 1.2, - "learning_rate": 0.0001203282091198028, - "loss": 0.0112, + "epoch": 0.56, + "learning_rate": 0.00021614996140476562, + "loss": 0.0136, "step": 110800 }, { - "epoch": 1.2, - "learning_rate": 0.00012031199325419991, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.0002161423937117516, + "loss": 0.0126, "step": 110810 }, { - "epoch": 1.2, - "learning_rate": 0.00012029577738859699, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021613482601873758, + "loss": 0.0173, "step": 110820 }, { - "epoch": 1.2, - "learning_rate": 0.0001202795615229941, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.0002161272583257236, + "loss": 0.0129, "step": 110830 }, { - "epoch": 1.2, - "learning_rate": 0.00012026334565739118, - "loss": 0.0109, + "epoch": 0.56, + "learning_rate": 0.00021611969063270957, + "loss": 0.016, "step": 110840 }, { - "epoch": 1.2, - "learning_rate": 0.00012024712979178828, - "loss": 0.0108, + "epoch": 0.56, + "learning_rate": 0.00021611212293969555, + "loss": 0.0134, "step": 110850 }, { - "epoch": 1.2, - "learning_rate": 0.00012023091392618537, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.00021610455524668156, + "loss": 0.019, "step": 110860 }, { - "epoch": 1.2, - "learning_rate": 0.00012021469806058247, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021609698755366754, + "loss": 0.0157, "step": 110870 }, { - "epoch": 1.2, - "learning_rate": 0.00012019848219497956, - "loss": 0.0102, + "epoch": 0.56, + "learning_rate": 0.00021608941986065353, + "loss": 0.0173, "step": 110880 }, { - "epoch": 1.2, - "learning_rate": 0.00012018226632937665, - "loss": 0.0102, + "epoch": 0.56, + "learning_rate": 0.00021608185216763953, + "loss": 0.0149, "step": 110890 }, { - "epoch": 1.2, - "learning_rate": 0.00012016605046377375, - "loss": 0.0105, + "epoch": 0.56, + "learning_rate": 0.00021607428447462552, + "loss": 0.0156, "step": 110900 }, { - "epoch": 1.2, - "learning_rate": 0.00012014983459817085, - "loss": 0.0118, + "epoch": 0.56, + "learning_rate": 0.0002160667167816115, + "loss": 0.0137, "step": 110910 }, { - "epoch": 1.2, - "learning_rate": 0.00012013361873256793, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.0002160591490885975, + "loss": 0.0135, "step": 110920 }, { - "epoch": 1.2, - "learning_rate": 0.00012011740286696504, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.0002160515813955835, + "loss": 0.0158, "step": 110930 }, { - "epoch": 1.2, - "learning_rate": 0.00012010118700136212, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021604401370256947, + "loss": 0.0155, "step": 110940 }, { - "epoch": 1.2, - "learning_rate": 0.00012008497113575922, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.00021603644600955548, + "loss": 0.0147, "step": 110950 }, { - "epoch": 1.2, - "learning_rate": 0.0001200687552701563, - "loss": 0.0069, + "epoch": 0.56, + "learning_rate": 0.00021602887831654146, + "loss": 0.0134, "step": 110960 }, { - "epoch": 1.2, - "learning_rate": 0.00012005253940455341, - "loss": 0.0113, + "epoch": 0.56, + "learning_rate": 0.00021602131062352744, + "loss": 0.0138, "step": 110970 }, { - "epoch": 1.2, - "learning_rate": 0.0001200363235389505, - "loss": 0.0122, + "epoch": 0.56, + "learning_rate": 0.00021601374293051342, + "loss": 0.0126, "step": 110980 }, { - "epoch": 1.2, - "learning_rate": 0.0001200201076733476, - "loss": 0.0119, + "epoch": 0.56, + "learning_rate": 0.00021600617523749943, + "loss": 0.0159, "step": 110990 }, { - "epoch": 1.2, - "learning_rate": 0.00012000389180774469, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.0002159986075444854, + "loss": 0.0134, "step": 111000 }, { - "epoch": 1.2, - "eval_cer": 0.9215321461268126, - "eval_loss": 0.0076298159547150135, - "eval_runtime": 121.3154, - "eval_samples_per_second": 16.486, - "eval_steps_per_second": 4.121, + "epoch": 0.56, + "eval_cer": 0.914462492734159, + "eval_loss": 0.010961051099002361, + "eval_runtime": 116.7509, + "eval_samples_per_second": 17.13, + "eval_steps_per_second": 4.283, "step": 111000 }, { - "epoch": 1.2, - "learning_rate": 0.00011998767594214179, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.0002159910398514714, + "loss": 0.0137, "step": 111010 }, { - "epoch": 1.2, - "learning_rate": 0.00011997146007653887, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.0002159834721584574, + "loss": 0.0143, "step": 111020 }, { - "epoch": 1.2, - "learning_rate": 0.00011995524421093598, - "loss": 0.0133, + "epoch": 0.56, + "learning_rate": 0.00021597590446544338, + "loss": 0.0179, "step": 111030 }, { - "epoch": 1.2, - "learning_rate": 0.00011993902834533306, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.00021596833677242936, + "loss": 0.0129, "step": 111040 }, { - "epoch": 1.2, - "learning_rate": 0.00011992281247973016, - "loss": 0.0125, + "epoch": 0.56, + "learning_rate": 0.00021596076907941537, + "loss": 0.0147, "step": 111050 }, { - "epoch": 1.2, - "learning_rate": 0.00011990659661412724, - "loss": 0.0111, + "epoch": 0.56, + "learning_rate": 0.00021595320138640135, + "loss": 0.0141, "step": 111060 }, { - "epoch": 1.2, - "learning_rate": 0.00011989038074852435, - "loss": 0.0124, + "epoch": 0.56, + "learning_rate": 0.00021594563369338734, + "loss": 0.011, "step": 111070 }, { - "epoch": 1.2, - "learning_rate": 0.00011987416488292144, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021593806600037334, + "loss": 0.0134, "step": 111080 }, { - "epoch": 1.2, - "learning_rate": 0.00011985794901731853, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.00021593049830735933, + "loss": 0.0135, "step": 111090 }, { - "epoch": 1.2, - "learning_rate": 0.00011984173315171563, - "loss": 0.0114, + "epoch": 0.56, + "learning_rate": 0.0002159229306143453, + "loss": 0.013, "step": 111100 }, { - "epoch": 1.2, - "learning_rate": 0.00011982551728611272, + "epoch": 0.56, + "learning_rate": 0.00021591536292133132, "loss": 0.0121, "step": 111110 }, { - "epoch": 1.2, - "learning_rate": 0.00011980930142050981, - "loss": 0.0088, + "epoch": 0.56, + "learning_rate": 0.0002159077952283173, + "loss": 0.0138, "step": 111120 }, { - "epoch": 1.2, - "learning_rate": 0.00011979308555490692, - "loss": 0.0119, + "epoch": 0.56, + "learning_rate": 0.00021590022753530328, + "loss": 0.0152, "step": 111130 }, { - "epoch": 1.2, - "learning_rate": 0.000119776869689304, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.00021589265984228926, + "loss": 0.0119, "step": 111140 }, { - "epoch": 1.2, - "learning_rate": 0.0001197606538237011, - "loss": 0.01, + "epoch": 0.56, + "learning_rate": 0.00021588509214927527, + "loss": 0.0138, "step": 111150 }, { - "epoch": 1.2, - "learning_rate": 0.00011974443795809818, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.00021587752445626125, + "loss": 0.0133, "step": 111160 }, { - "epoch": 1.2, - "learning_rate": 0.00011972822209249529, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021586995676324723, + "loss": 0.016, "step": 111170 }, { - "epoch": 1.2, - "learning_rate": 0.00011971200622689238, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021586238907023324, + "loss": 0.0151, "step": 111180 }, { - "epoch": 1.2, - "learning_rate": 0.00011969579036128948, - "loss": 0.0117, + "epoch": 0.56, + "learning_rate": 0.00021585482137721922, + "loss": 0.0139, "step": 111190 }, { - "epoch": 1.2, - "learning_rate": 0.00011967957449568657, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.0002158472536842052, + "loss": 0.0184, "step": 111200 }, { - "epoch": 1.2, - "learning_rate": 0.00011966335863008366, - "loss": 0.0114, + "epoch": 0.56, + "learning_rate": 0.0002158396859911912, + "loss": 0.0145, "step": 111210 }, { - "epoch": 1.2, - "learning_rate": 0.00011964714276448075, - "loss": 0.0113, + "epoch": 0.56, + "learning_rate": 0.0002158321182981772, + "loss": 0.0189, "step": 111220 }, { - "epoch": 1.2, - "learning_rate": 0.00011963092689887786, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.00021582455060516317, + "loss": 0.0204, "step": 111230 }, { - "epoch": 1.2, - "learning_rate": 0.00011961471103327494, - "loss": 0.0073, + "epoch": 0.56, + "learning_rate": 0.00021581698291214913, + "loss": 0.0139, "step": 111240 }, { - "epoch": 1.2, - "learning_rate": 0.00011959849516767205, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.00021580941521913514, + "loss": 0.0145, "step": 111250 }, { - "epoch": 1.2, - "learning_rate": 0.00011958227930206912, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.00021580184752612112, + "loss": 0.0141, "step": 111260 }, { - "epoch": 1.2, - "learning_rate": 0.00011956606343646623, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.0002157942798331071, + "loss": 0.0161, "step": 111270 }, { - "epoch": 1.2, - "learning_rate": 0.00011954984757086331, - "loss": 0.013, + "epoch": 0.56, + "learning_rate": 0.0002157867121400931, + "loss": 0.0121, "step": 111280 }, { - "epoch": 1.2, - "learning_rate": 0.00011953363170526042, - "loss": 0.0117, + "epoch": 0.56, + "learning_rate": 0.0002157791444470791, + "loss": 0.0169, "step": 111290 }, { - "epoch": 1.2, - "learning_rate": 0.00011951741583965751, - "loss": 0.0116, + "epoch": 0.56, + "learning_rate": 0.00021577157675406507, + "loss": 0.0119, "step": 111300 }, { - "epoch": 1.2, - "learning_rate": 0.0001195011999740546, - "loss": 0.0085, + "epoch": 0.56, + "learning_rate": 0.00021576400906105108, + "loss": 0.017, "step": 111310 }, { - "epoch": 1.2, - "learning_rate": 0.0001194849841084517, - "loss": 0.0122, + "epoch": 0.56, + "learning_rate": 0.00021575644136803706, + "loss": 0.0133, "step": 111320 }, { - "epoch": 1.2, - "learning_rate": 0.0001194687682428488, - "loss": 0.0132, + "epoch": 0.56, + "learning_rate": 0.00021574887367502304, + "loss": 0.0149, "step": 111330 }, { - "epoch": 1.2, - "learning_rate": 0.00011945255237724588, - "loss": 0.0133, + "epoch": 0.56, + "learning_rate": 0.00021574130598200905, + "loss": 0.014, "step": 111340 }, { - "epoch": 1.2, - "learning_rate": 0.00011943633651164299, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.00021573373828899503, + "loss": 0.0133, "step": 111350 }, { - "epoch": 1.2, - "learning_rate": 0.00011942012064604007, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021572617059598101, + "loss": 0.0144, "step": 111360 }, { - "epoch": 1.2, - "learning_rate": 0.00011940390478043717, - "loss": 0.0147, + "epoch": 0.56, + "learning_rate": 0.000215718602902967, + "loss": 0.0146, "step": 111370 }, { - "epoch": 1.2, - "learning_rate": 0.00011938768891483425, - "loss": 0.0106, + "epoch": 0.56, + "learning_rate": 0.000215711035209953, + "loss": 0.0159, "step": 111380 }, { - "epoch": 1.2, - "learning_rate": 0.00011937147304923136, - "loss": 0.0124, + "epoch": 0.56, + "learning_rate": 0.00021570346751693899, + "loss": 0.0174, "step": 111390 }, { - "epoch": 1.2, - "learning_rate": 0.00011935525718362845, - "loss": 0.0102, + "epoch": 0.56, + "learning_rate": 0.00021569589982392497, + "loss": 0.0138, "step": 111400 }, { - "epoch": 1.2, - "learning_rate": 0.00011933904131802554, - "loss": 0.0115, + "epoch": 0.56, + "learning_rate": 0.00021568833213091098, + "loss": 0.0134, "step": 111410 }, { - "epoch": 1.2, - "learning_rate": 0.00011932282545242264, - "loss": 0.0121, + "epoch": 0.56, + "learning_rate": 0.00021568076443789696, + "loss": 0.0156, "step": 111420 }, { - "epoch": 1.2, - "learning_rate": 0.00011930660958681973, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.00021567319674488294, + "loss": 0.0156, "step": 111430 }, { - "epoch": 1.2, - "learning_rate": 0.00011929039372121682, - "loss": 0.0085, + "epoch": 0.56, + "learning_rate": 0.00021566562905186895, + "loss": 0.0161, "step": 111440 }, { - "epoch": 1.2, - "learning_rate": 0.00011927417785561393, - "loss": 0.0135, + "epoch": 0.56, + "learning_rate": 0.00021565806135885493, + "loss": 0.0157, "step": 111450 }, { - "epoch": 1.2, - "learning_rate": 0.000119257961990011, - "loss": 0.0108, + "epoch": 0.56, + "learning_rate": 0.0002156504936658409, + "loss": 0.0136, "step": 111460 }, { - "epoch": 1.21, - "learning_rate": 0.00011924174612440811, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.00021564292597282692, + "loss": 0.0164, "step": 111470 }, { - "epoch": 1.21, - "learning_rate": 0.00011922553025880519, - "loss": 0.0115, + "epoch": 0.56, + "learning_rate": 0.0002156353582798129, + "loss": 0.0124, "step": 111480 }, { - "epoch": 1.21, - "learning_rate": 0.0001192093143932023, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021562779058679888, + "loss": 0.0155, "step": 111490 }, { - "epoch": 1.21, - "learning_rate": 0.0001191930985275994, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.0002156202228937849, + "loss": 0.0125, "step": 111500 }, { - "epoch": 1.21, - "learning_rate": 0.00011917688266199648, - "loss": 0.0075, + "epoch": 0.56, + "learning_rate": 0.00021561265520077087, + "loss": 0.0154, "step": 111510 }, { - "epoch": 1.21, - "learning_rate": 0.00011916066679639359, - "loss": 0.0128, + "epoch": 0.56, + "learning_rate": 0.00021560508750775685, + "loss": 0.0203, "step": 111520 }, { - "epoch": 1.21, - "learning_rate": 0.00011914445093079067, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.00021559751981474283, + "loss": 0.014, "step": 111530 }, { - "epoch": 1.21, - "learning_rate": 0.00011912823506518778, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.00021558995212172884, + "loss": 0.0149, "step": 111540 }, { - "epoch": 1.21, - "learning_rate": 0.00011911201919958487, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.00021558238442871482, + "loss": 0.0156, "step": 111550 }, { - "epoch": 1.21, - "learning_rate": 0.00011909580333398196, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.0002155748167357008, + "loss": 0.0158, "step": 111560 }, { - "epoch": 1.21, - "learning_rate": 0.00011907958746837905, - "loss": 0.0083, + "epoch": 0.56, + "learning_rate": 0.00021556724904268681, + "loss": 0.0125, "step": 111570 }, { - "epoch": 1.21, - "learning_rate": 0.00011906337160277615, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.0002155596813496728, + "loss": 0.0137, "step": 111580 }, { - "epoch": 1.21, - "learning_rate": 0.00011904715573717324, - "loss": 0.0116, + "epoch": 0.56, + "learning_rate": 0.00021555211365665878, + "loss": 0.0136, "step": 111590 }, { - "epoch": 1.21, - "learning_rate": 0.00011903093987157035, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021554454596364479, + "loss": 0.0153, "step": 111600 }, { - "epoch": 1.21, - "learning_rate": 0.00011901472400596742, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021553697827063077, + "loss": 0.0156, "step": 111610 }, { - "epoch": 1.21, - "learning_rate": 0.00011899850814036453, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021552941057761675, + "loss": 0.0135, "step": 111620 }, { - "epoch": 1.21, - "learning_rate": 0.00011898229227476161, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.00021552184288460276, + "loss": 0.0147, "step": 111630 }, { - "epoch": 1.21, - "learning_rate": 0.00011896607640915872, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021551427519158874, + "loss": 0.0157, "step": 111640 }, { - "epoch": 1.21, - "learning_rate": 0.00011894986054355581, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.00021550670749857472, + "loss": 0.0163, "step": 111650 }, { - "epoch": 1.21, - "learning_rate": 0.0001189336446779529, - "loss": 0.0109, + "epoch": 0.56, + "learning_rate": 0.00021549913980556073, + "loss": 0.0135, "step": 111660 }, { - "epoch": 1.21, - "learning_rate": 0.00011891742881235, - "loss": 0.0108, + "epoch": 0.56, + "learning_rate": 0.0002154915721125467, + "loss": 0.0114, "step": 111670 }, { - "epoch": 1.21, - "learning_rate": 0.00011890121294674709, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.0002154840044195327, + "loss": 0.0199, "step": 111680 }, { - "epoch": 1.21, - "learning_rate": 0.00011888499708114418, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.0002154764367265187, + "loss": 0.0155, "step": 111690 }, { - "epoch": 1.21, - "learning_rate": 0.00011886878121554129, - "loss": 0.0112, + "epoch": 0.56, + "learning_rate": 0.00021546886903350468, + "loss": 0.017, "step": 111700 }, { - "epoch": 1.21, - "learning_rate": 0.00011885256534993837, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.00021546130134049066, + "loss": 0.0176, "step": 111710 }, { - "epoch": 1.21, - "learning_rate": 0.00011883634948433547, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021545373364747664, + "loss": 0.0138, "step": 111720 }, { - "epoch": 1.21, - "learning_rate": 0.00011882013361873255, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.00021544616595446265, + "loss": 0.0155, "step": 111730 }, { - "epoch": 1.21, - "learning_rate": 0.00011880391775312966, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.00021543859826144863, + "loss": 0.0142, "step": 111740 }, { - "epoch": 1.21, - "learning_rate": 0.00011878770188752674, - "loss": 0.0121, + "epoch": 0.56, + "learning_rate": 0.00021543103056843462, + "loss": 0.0168, "step": 111750 }, { - "epoch": 1.21, - "learning_rate": 0.00011877148602192384, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021542346287542062, + "loss": 0.0152, "step": 111760 }, { - "epoch": 1.21, - "learning_rate": 0.00011875527015632094, - "loss": 0.0111, + "epoch": 0.56, + "learning_rate": 0.0002154158951824066, + "loss": 0.0178, "step": 111770 }, { - "epoch": 1.21, - "learning_rate": 0.00011873905429071803, - "loss": 0.0106, + "epoch": 0.56, + "learning_rate": 0.0002154083274893926, + "loss": 0.0135, "step": 111780 }, { - "epoch": 1.21, - "learning_rate": 0.00011872283842511512, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.0002154007597963786, + "loss": 0.0133, "step": 111790 }, { - "epoch": 1.21, - "learning_rate": 0.00011870662255951223, - "loss": 0.0116, + "epoch": 0.56, + "learning_rate": 0.00021539319210336458, + "loss": 0.0188, "step": 111800 }, { - "epoch": 1.21, - "learning_rate": 0.00011869040669390931, - "loss": 0.0108, + "epoch": 0.56, + "learning_rate": 0.00021538562441035056, + "loss": 0.0127, "step": 111810 }, { - "epoch": 1.21, - "learning_rate": 0.00011867419082830641, - "loss": 0.0133, + "epoch": 0.56, + "learning_rate": 0.00021537805671733657, + "loss": 0.0127, "step": 111820 }, { - "epoch": 1.21, - "learning_rate": 0.00011865797496270349, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.00021537048902432255, + "loss": 0.0147, "step": 111830 }, { - "epoch": 1.21, - "learning_rate": 0.0001186417590971006, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021536292133130853, + "loss": 0.0136, "step": 111840 }, { - "epoch": 1.21, - "learning_rate": 0.00011862554323149768, - "loss": 0.0109, + "epoch": 0.56, + "learning_rate": 0.00021535535363829454, + "loss": 0.0131, "step": 111850 }, { - "epoch": 1.21, - "learning_rate": 0.00011860932736589478, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021534778594528052, + "loss": 0.0123, "step": 111860 }, { - "epoch": 1.21, - "learning_rate": 0.00011859311150029188, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.0002153402182522665, + "loss": 0.0157, "step": 111870 }, { - "epoch": 1.21, - "learning_rate": 0.00011857689563468897, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021533265055925248, + "loss": 0.0141, "step": 111880 }, { - "epoch": 1.21, - "learning_rate": 0.00011856067976908606, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.0002153250828662385, + "loss": 0.0141, "step": 111890 }, { - "epoch": 1.21, - "learning_rate": 0.00011854446390348316, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021531751517322447, + "loss": 0.0133, "step": 111900 }, { - "epoch": 1.21, - "learning_rate": 0.00011852824803788025, - "loss": 0.0088, + "epoch": 0.56, + "learning_rate": 0.00021530994748021045, + "loss": 0.0154, "step": 111910 }, { - "epoch": 1.21, - "learning_rate": 0.00011851203217227735, - "loss": 0.0114, + "epoch": 0.56, + "learning_rate": 0.00021530237978719646, + "loss": 0.0134, "step": 111920 }, { - "epoch": 1.21, - "learning_rate": 0.00011849581630667443, - "loss": 0.0121, + "epoch": 0.56, + "learning_rate": 0.00021529481209418244, + "loss": 0.0162, "step": 111930 }, { - "epoch": 1.21, - "learning_rate": 0.00011847960044107154, - "loss": 0.0109, + "epoch": 0.56, + "learning_rate": 0.00021528724440116843, + "loss": 0.0168, "step": 111940 }, { - "epoch": 1.21, - "learning_rate": 0.00011846338457546862, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021527967670815443, + "loss": 0.0145, "step": 111950 }, { - "epoch": 1.21, - "learning_rate": 0.00011844716870986573, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.00021527210901514042, + "loss": 0.0118, "step": 111960 }, { - "epoch": 1.21, - "learning_rate": 0.0001184309528442628, - "loss": 0.0111, + "epoch": 0.56, + "learning_rate": 0.0002152645413221264, + "loss": 0.0131, "step": 111970 }, { - "epoch": 1.21, - "learning_rate": 0.00011841473697865991, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.0002152569736291124, + "loss": 0.0128, "step": 111980 }, { - "epoch": 1.21, - "learning_rate": 0.000118398521113057, - "loss": 0.0117, + "epoch": 0.57, + "learning_rate": 0.0002152494059360984, + "loss": 0.0134, "step": 111990 }, { - "epoch": 1.21, - "learning_rate": 0.0001183823052474541, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.00021524183824308437, + "loss": 0.0167, "step": 112000 }, { - "epoch": 1.21, - "eval_cer": 0.9215408321563763, - "eval_loss": 0.007726356852799654, - "eval_runtime": 121.0775, - "eval_samples_per_second": 16.518, - "eval_steps_per_second": 4.13, + "epoch": 0.57, + "eval_cer": 0.9144595815457828, + "eval_loss": 0.011023299768567085, + "eval_runtime": 116.6938, + "eval_samples_per_second": 17.139, + "eval_steps_per_second": 4.285, "step": 112000 }, { - "epoch": 1.21, - "learning_rate": 0.00011836608938185119, - "loss": 0.011, + "epoch": 0.57, + "learning_rate": 0.00021523427055007038, + "loss": 0.0195, "step": 112010 }, { - "epoch": 1.21, - "learning_rate": 0.0001183498735162483, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021522670285705636, + "loss": 0.0127, "step": 112020 }, { - "epoch": 1.21, - "learning_rate": 0.00011833365765064537, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021521913516404234, + "loss": 0.0153, "step": 112030 }, { - "epoch": 1.21, - "learning_rate": 0.00011831744178504248, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021521156747102832, + "loss": 0.0166, "step": 112040 }, { - "epoch": 1.21, - "learning_rate": 0.00011830122591943956, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.00021520399977801433, + "loss": 0.0152, "step": 112050 }, { - "epoch": 1.21, - "learning_rate": 0.00011828501005383667, - "loss": 0.0118, + "epoch": 0.57, + "learning_rate": 0.0002151964320850003, + "loss": 0.0159, "step": 112060 }, { - "epoch": 1.21, - "learning_rate": 0.00011826879418823375, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.0002151888643919863, + "loss": 0.0152, "step": 112070 }, { - "epoch": 1.21, - "learning_rate": 0.00011825257832263085, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.0002151812966989723, + "loss": 0.0179, "step": 112080 }, { - "epoch": 1.21, - "learning_rate": 0.00011823636245702794, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021517372900595828, + "loss": 0.0182, "step": 112090 }, { - "epoch": 1.21, - "learning_rate": 0.00011822014659142504, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021516616131294426, + "loss": 0.0182, "step": 112100 }, { - "epoch": 1.21, - "learning_rate": 0.00011820393072582213, - "loss": 0.0105, + "epoch": 0.57, + "learning_rate": 0.00021515859361993027, + "loss": 0.0156, "step": 112110 }, { - "epoch": 1.21, - "learning_rate": 0.00011818771486021922, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.00021515102592691625, + "loss": 0.0191, "step": 112120 }, { - "epoch": 1.21, - "learning_rate": 0.00011817149899461632, - "loss": 0.0083, + "epoch": 0.57, + "learning_rate": 0.00021514345823390224, + "loss": 0.0153, "step": 112130 }, { - "epoch": 1.21, - "learning_rate": 0.00011815528312901342, - "loss": 0.0117, + "epoch": 0.57, + "learning_rate": 0.00021513589054088824, + "loss": 0.0165, "step": 112140 }, { - "epoch": 1.21, - "learning_rate": 0.0001181390672634105, - "loss": 0.0107, + "epoch": 0.57, + "learning_rate": 0.00021512832284787423, + "loss": 0.0143, "step": 112150 }, { - "epoch": 1.21, - "learning_rate": 0.00011812285139780761, - "loss": 0.0076, + "epoch": 0.57, + "learning_rate": 0.0002151207551548602, + "loss": 0.0154, "step": 112160 }, { - "epoch": 1.21, - "learning_rate": 0.00011810663553220469, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021511318746184622, + "loss": 0.0149, "step": 112170 }, { - "epoch": 1.21, - "learning_rate": 0.00011809041966660179, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.0002151056197688322, + "loss": 0.0132, "step": 112180 }, { - "epoch": 1.21, - "learning_rate": 0.00011807420380099889, - "loss": 0.0083, + "epoch": 0.57, + "learning_rate": 0.00021509805207581818, + "loss": 0.0111, "step": 112190 }, { - "epoch": 1.21, - "learning_rate": 0.00011805798793539598, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.0002150904843828042, + "loss": 0.0147, "step": 112200 }, { - "epoch": 1.21, - "learning_rate": 0.00011804177206979307, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.00021508291668979017, + "loss": 0.0165, "step": 112210 }, { - "epoch": 1.21, - "learning_rate": 0.00011802555620419016, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.00021507534899677615, + "loss": 0.0142, "step": 112220 }, { - "epoch": 1.21, - "learning_rate": 0.00011800934033858727, - "loss": 0.0109, + "epoch": 0.57, + "learning_rate": 0.00021506778130376213, + "loss": 0.0134, "step": 112230 }, { - "epoch": 1.21, - "learning_rate": 0.00011799312447298436, - "loss": 0.0091, + "epoch": 0.57, + "learning_rate": 0.00021506021361074814, + "loss": 0.0141, "step": 112240 }, { - "epoch": 1.21, - "learning_rate": 0.00011797690860738146, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021505264591773412, + "loss": 0.0153, "step": 112250 }, { - "epoch": 1.21, - "learning_rate": 0.00011796069274177855, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.0002150450782247201, + "loss": 0.0162, "step": 112260 }, { - "epoch": 1.21, - "learning_rate": 0.00011794447687617565, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.0002150375105317061, + "loss": 0.0133, "step": 112270 }, { - "epoch": 1.21, - "learning_rate": 0.00011792826101057273, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.0002150299428386921, + "loss": 0.0153, "step": 112280 }, { - "epoch": 1.21, - "learning_rate": 0.00011791204514496984, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021502237514567807, + "loss": 0.0169, "step": 112290 }, { - "epoch": 1.21, - "learning_rate": 0.00011789582927936692, - "loss": 0.0114, + "epoch": 0.57, + "learning_rate": 0.00021501480745266408, + "loss": 0.0133, "step": 112300 }, { - "epoch": 1.21, - "learning_rate": 0.00011787961341376403, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.00021500723975965006, + "loss": 0.0134, "step": 112310 }, { - "epoch": 1.21, - "learning_rate": 0.0001178633975481611, - "loss": 0.0119, + "epoch": 0.57, + "learning_rate": 0.00021499967206663605, + "loss": 0.0123, "step": 112320 }, { - "epoch": 1.21, - "learning_rate": 0.00011784718168255821, - "loss": 0.0079, + "epoch": 0.57, + "learning_rate": 0.00021499210437362205, + "loss": 0.0195, "step": 112330 }, { - "epoch": 1.21, - "learning_rate": 0.0001178309658169553, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.00021498453668060804, + "loss": 0.0159, "step": 112340 }, { - "epoch": 1.21, - "learning_rate": 0.0001178147499513524, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.00021497696898759402, + "loss": 0.0147, "step": 112350 }, { - "epoch": 1.21, - "learning_rate": 0.00011779853408574949, - "loss": 0.0131, + "epoch": 0.57, + "learning_rate": 0.00021496940129458003, + "loss": 0.0153, "step": 112360 }, { - "epoch": 1.21, - "learning_rate": 0.00011778231822014658, - "loss": 0.0078, + "epoch": 0.57, + "learning_rate": 0.000214961833601566, + "loss": 0.0128, "step": 112370 }, { - "epoch": 1.21, - "learning_rate": 0.00011776610235454367, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.000214954265908552, + "loss": 0.0178, "step": 112380 }, { - "epoch": 1.21, - "learning_rate": 0.00011774988648894078, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.00021494669821553797, + "loss": 0.0147, "step": 112390 }, { - "epoch": 1.22, - "learning_rate": 0.00011773367062333786, - "loss": 0.0081, + "epoch": 0.57, + "learning_rate": 0.00021493913052252398, + "loss": 0.0145, "step": 112400 }, { - "epoch": 1.22, - "learning_rate": 0.00011771745475773497, - "loss": 0.0091, + "epoch": 0.57, + "learning_rate": 0.00021493156282950996, + "loss": 0.0131, "step": 112410 }, { - "epoch": 1.22, - "learning_rate": 0.00011770123889213205, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021492399513649594, + "loss": 0.0176, "step": 112420 }, { - "epoch": 1.22, - "learning_rate": 0.00011768502302652915, - "loss": 0.0109, + "epoch": 0.57, + "learning_rate": 0.00021491642744348195, + "loss": 0.0153, "step": 112430 }, { - "epoch": 1.22, - "learning_rate": 0.00011766880716092623, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.00021490885975046793, + "loss": 0.0136, "step": 112440 }, { - "epoch": 1.22, - "learning_rate": 0.00011765259129532334, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.0002149012920574539, + "loss": 0.0145, "step": 112450 }, { - "epoch": 1.22, - "learning_rate": 0.00011763637542972043, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021489372436443992, + "loss": 0.015, "step": 112460 }, { - "epoch": 1.22, - "learning_rate": 0.00011762015956411752, - "loss": 0.0073, + "epoch": 0.57, + "learning_rate": 0.0002148861566714259, + "loss": 0.0154, "step": 112470 }, { - "epoch": 1.22, - "learning_rate": 0.00011760394369851462, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.00021487858897841188, + "loss": 0.0152, "step": 112480 }, { - "epoch": 1.22, - "learning_rate": 0.00011758772783291172, - "loss": 0.0079, + "epoch": 0.57, + "learning_rate": 0.0002148710212853979, + "loss": 0.0182, "step": 112490 }, { - "epoch": 1.22, - "learning_rate": 0.0001175715119673088, - "loss": 0.0078, + "epoch": 0.57, + "learning_rate": 0.00021486345359238385, + "loss": 0.0151, "step": 112500 }, { - "epoch": 1.22, - "learning_rate": 0.00011755529610170591, - "loss": 0.0065, + "epoch": 0.57, + "learning_rate": 0.00021485588589936983, + "loss": 0.0166, "step": 112510 }, { - "epoch": 1.22, - "learning_rate": 0.00011753908023610299, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.0002148483182063558, + "loss": 0.0154, "step": 112520 }, { - "epoch": 1.22, - "learning_rate": 0.00011752286437050009, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.00021484075051334182, + "loss": 0.0146, "step": 112530 }, { - "epoch": 1.22, - "learning_rate": 0.00011750664850489717, - "loss": 0.0109, + "epoch": 0.57, + "learning_rate": 0.0002148331828203278, + "loss": 0.018, "step": 112540 }, { - "epoch": 1.22, - "learning_rate": 0.00011749043263929428, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.00021482561512731378, + "loss": 0.0169, "step": 112550 }, { - "epoch": 1.22, - "learning_rate": 0.00011747421677369137, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.0002148180474342998, + "loss": 0.0161, "step": 112560 }, { - "epoch": 1.22, - "learning_rate": 0.00011745800090808846, - "loss": 0.0117, + "epoch": 0.57, + "learning_rate": 0.00021481047974128577, + "loss": 0.0176, "step": 112570 }, { - "epoch": 1.22, - "learning_rate": 0.00011744178504248556, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021480291204827175, + "loss": 0.0145, "step": 112580 }, { - "epoch": 1.22, - "learning_rate": 0.00011742556917688265, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021479534435525776, + "loss": 0.017, "step": 112590 }, { - "epoch": 1.22, - "learning_rate": 0.00011740935331127974, - "loss": 0.0077, + "epoch": 0.57, + "learning_rate": 0.00021478777666224374, + "loss": 0.0145, "step": 112600 }, { - "epoch": 1.22, - "learning_rate": 0.00011739313744567685, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.00021478020896922972, + "loss": 0.0167, "step": 112610 }, { - "epoch": 1.22, - "learning_rate": 0.00011737692158007393, - "loss": 0.0075, + "epoch": 0.57, + "learning_rate": 0.0002147726412762157, + "loss": 0.0129, "step": 112620 }, { - "epoch": 1.22, - "learning_rate": 0.00011736070571447103, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.00021476507358320171, + "loss": 0.016, "step": 112630 }, { - "epoch": 1.22, - "learning_rate": 0.00011734448984886811, - "loss": 0.0078, + "epoch": 0.57, + "learning_rate": 0.0002147575058901877, + "loss": 0.0161, "step": 112640 }, { - "epoch": 1.22, - "learning_rate": 0.00011732827398326522, - "loss": 0.0108, + "epoch": 0.57, + "learning_rate": 0.00021474993819717368, + "loss": 0.0152, "step": 112650 }, { - "epoch": 1.22, - "learning_rate": 0.00011731205811766231, - "loss": 0.0115, + "epoch": 0.57, + "learning_rate": 0.00021474237050415969, + "loss": 0.015, "step": 112660 }, { - "epoch": 1.22, - "learning_rate": 0.0001172958422520594, - "loss": 0.011, + "epoch": 0.57, + "learning_rate": 0.00021473480281114567, + "loss": 0.0124, "step": 112670 }, { - "epoch": 1.22, - "learning_rate": 0.0001172796263864565, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021472723511813165, + "loss": 0.0177, "step": 112680 }, { - "epoch": 1.22, - "learning_rate": 0.00011726341052085359, - "loss": 0.0125, + "epoch": 0.57, + "learning_rate": 0.00021471966742511766, + "loss": 0.0141, "step": 112690 }, { - "epoch": 1.22, - "learning_rate": 0.00011724719465525068, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021471209973210364, + "loss": 0.0172, "step": 112700 }, { - "epoch": 1.22, - "learning_rate": 0.00011723097878964779, - "loss": 0.0115, + "epoch": 0.57, + "learning_rate": 0.00021470453203908962, + "loss": 0.0172, "step": 112710 }, { - "epoch": 1.22, - "learning_rate": 0.00011721476292404487, - "loss": 0.0111, + "epoch": 0.57, + "learning_rate": 0.00021469696434607563, + "loss": 0.0129, "step": 112720 }, { - "epoch": 1.22, - "learning_rate": 0.00011719854705844197, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.0002146893966530616, + "loss": 0.0144, "step": 112730 }, { - "epoch": 1.22, - "learning_rate": 0.00011718233119283905, - "loss": 0.0108, + "epoch": 0.57, + "learning_rate": 0.0002146818289600476, + "loss": 0.0146, "step": 112740 }, { - "epoch": 1.22, - "learning_rate": 0.00011716611532723616, - "loss": 0.0109, + "epoch": 0.57, + "learning_rate": 0.0002146742612670336, + "loss": 0.0137, "step": 112750 }, { - "epoch": 1.22, - "learning_rate": 0.00011714989946163324, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.00021466669357401958, + "loss": 0.0127, "step": 112760 }, { - "epoch": 1.22, - "learning_rate": 0.00011713368359603035, - "loss": 0.0105, + "epoch": 0.57, + "learning_rate": 0.00021465912588100556, + "loss": 0.0149, "step": 112770 }, { - "epoch": 1.22, - "learning_rate": 0.00011711746773042744, - "loss": 0.0111, + "epoch": 0.57, + "learning_rate": 0.00021465155818799154, + "loss": 0.0145, "step": 112780 }, { - "epoch": 1.22, - "learning_rate": 0.00011710125186482453, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021464399049497755, + "loss": 0.0139, "step": 112790 }, { - "epoch": 1.22, - "learning_rate": 0.00011708503599922162, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021463642280196353, + "loss": 0.0182, "step": 112800 }, { - "epoch": 1.22, - "learning_rate": 0.00011706882013361873, - "loss": 0.0118, + "epoch": 0.57, + "learning_rate": 0.00021462885510894952, + "loss": 0.0184, "step": 112810 }, { - "epoch": 1.22, - "learning_rate": 0.00011705260426801581, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021462128741593552, + "loss": 0.0125, "step": 112820 }, { - "epoch": 1.22, - "learning_rate": 0.00011703638840241292, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.0002146137197229215, + "loss": 0.0129, "step": 112830 }, { - "epoch": 1.22, - "learning_rate": 0.00011702017253681, - "loss": 0.0118, + "epoch": 0.57, + "learning_rate": 0.0002146061520299075, + "loss": 0.0189, "step": 112840 }, { - "epoch": 1.22, - "learning_rate": 0.0001170039566712071, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.0002145985843368935, + "loss": 0.0168, "step": 112850 }, { - "epoch": 1.22, - "learning_rate": 0.00011698774080560418, - "loss": 0.0077, + "epoch": 0.57, + "learning_rate": 0.00021459101664387948, + "loss": 0.0165, "step": 112860 }, { - "epoch": 1.22, - "learning_rate": 0.00011697152494000129, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.00021458344895086546, + "loss": 0.0146, "step": 112870 }, { - "epoch": 1.22, - "learning_rate": 0.00011695530907439838, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.00021457588125785147, + "loss": 0.0148, "step": 112880 }, { - "epoch": 1.22, - "learning_rate": 0.00011693909320879547, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021456831356483745, + "loss": 0.0177, "step": 112890 }, { - "epoch": 1.22, - "learning_rate": 0.00011692287734319256, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.00021456074587182343, + "loss": 0.0177, "step": 112900 }, { - "epoch": 1.22, - "learning_rate": 0.00011690666147758966, - "loss": 0.0091, + "epoch": 0.57, + "learning_rate": 0.00021455317817880944, + "loss": 0.0157, "step": 112910 }, { - "epoch": 1.22, - "learning_rate": 0.00011689044561198675, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.00021454561048579542, + "loss": 0.0153, "step": 112920 }, { - "epoch": 1.22, - "learning_rate": 0.00011687422974638386, - "loss": 0.013, + "epoch": 0.57, + "learning_rate": 0.0002145380427927814, + "loss": 0.0155, "step": 112930 }, { - "epoch": 1.22, - "learning_rate": 0.00011685801388078095, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021453047509976738, + "loss": 0.0152, "step": 112940 }, { - "epoch": 1.22, - "learning_rate": 0.00011684179801517804, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.0002145229074067534, + "loss": 0.013, "step": 112950 }, { - "epoch": 1.22, - "learning_rate": 0.00011682558214957515, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.00021451533971373937, + "loss": 0.015, "step": 112960 }, { - "epoch": 1.22, - "learning_rate": 0.00011680936628397223, - "loss": 0.0105, + "epoch": 0.57, + "learning_rate": 0.00021450777202072535, + "loss": 0.0171, "step": 112970 }, { - "epoch": 1.22, - "learning_rate": 0.00011679315041836933, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021450020432771136, + "loss": 0.016, "step": 112980 }, { - "epoch": 1.22, - "learning_rate": 0.00011677693455276641, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021449263663469734, + "loss": 0.0162, "step": 112990 }, { - "epoch": 1.22, - "learning_rate": 0.00011676071868716352, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.00021448506894168333, + "loss": 0.012, "step": 113000 }, { - "epoch": 1.22, - "eval_cer": 0.9215060880381213, - "eval_loss": 0.00777030223980546, - "eval_runtime": 121.2227, - "eval_samples_per_second": 16.499, - "eval_steps_per_second": 4.125, + "epoch": 0.57, + "eval_cer": 0.9144906342217957, + "eval_loss": 0.01105137262493372, + "eval_runtime": 116.8218, + "eval_samples_per_second": 17.12, + "eval_steps_per_second": 4.28, "step": 113000 }, { - "epoch": 1.22, - "learning_rate": 0.0001167445028215606, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.00021447750124866933, + "loss": 0.0144, "step": 113010 }, { - "epoch": 1.22, - "learning_rate": 0.0001167282869559577, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021446993355565532, + "loss": 0.0109, "step": 113020 }, { - "epoch": 1.22, - "learning_rate": 0.0001167120710903548, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.0002144623658626413, + "loss": 0.0141, "step": 113030 }, { - "epoch": 1.22, - "learning_rate": 0.00011669585522475189, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.0002144547981696273, + "loss": 0.0138, "step": 113040 }, { - "epoch": 1.22, - "learning_rate": 0.00011667963935914898, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.0002144472304766133, + "loss": 0.0126, "step": 113050 }, { - "epoch": 1.22, - "learning_rate": 0.00011666342349354608, - "loss": 0.0091, + "epoch": 0.57, + "learning_rate": 0.00021443966278359927, + "loss": 0.015, "step": 113060 }, { - "epoch": 1.22, - "learning_rate": 0.00011664720762794317, - "loss": 0.008, + "epoch": 0.57, + "learning_rate": 0.00021443209509058528, + "loss": 0.0164, "step": 113070 }, { - "epoch": 1.22, - "learning_rate": 0.00011663099176234027, - "loss": 0.0107, + "epoch": 0.57, + "learning_rate": 0.00021442452739757126, + "loss": 0.0143, "step": 113080 }, { - "epoch": 1.22, - "learning_rate": 0.00011661477589673735, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021441695970455724, + "loss": 0.0136, "step": 113090 }, { - "epoch": 1.22, - "learning_rate": 0.00011659856003113446, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.00021440939201154325, + "loss": 0.0155, "step": 113100 }, { - "epoch": 1.22, - "learning_rate": 0.00011658234416553154, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.00021440182431852923, + "loss": 0.0133, "step": 113110 }, { - "epoch": 1.22, - "learning_rate": 0.00011656612829992865, - "loss": 0.0118, + "epoch": 0.57, + "learning_rate": 0.0002143942566255152, + "loss": 0.0129, "step": 113120 }, { - "epoch": 1.22, - "learning_rate": 0.00011654991243432573, - "loss": 0.0107, + "epoch": 0.57, + "learning_rate": 0.0002143866889325012, + "loss": 0.0142, "step": 113130 }, { - "epoch": 1.22, - "learning_rate": 0.00011653369656872283, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.0002143791212394872, + "loss": 0.0134, "step": 113140 }, { - "epoch": 1.22, - "learning_rate": 0.00011651748070311992, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.00021437155354647318, + "loss": 0.015, "step": 113150 }, { - "epoch": 1.22, - "learning_rate": 0.00011650126483751702, - "loss": 0.0109, + "epoch": 0.57, + "learning_rate": 0.00021436398585345916, + "loss": 0.0131, "step": 113160 }, { - "epoch": 1.22, - "learning_rate": 0.00011648504897191411, - "loss": 0.0076, + "epoch": 0.57, + "learning_rate": 0.00021435641816044517, + "loss": 0.0163, "step": 113170 }, { - "epoch": 1.22, - "learning_rate": 0.00011646883310631122, - "loss": 0.0117, + "epoch": 0.57, + "learning_rate": 0.00021434885046743115, + "loss": 0.0121, "step": 113180 }, { - "epoch": 1.22, - "learning_rate": 0.0001164526172407083, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.00021434128277441714, + "loss": 0.0155, "step": 113190 }, { - "epoch": 1.22, - "learning_rate": 0.0001164364013751054, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.00021433371508140314, + "loss": 0.0172, "step": 113200 }, { - "epoch": 1.22, - "learning_rate": 0.00011642018550950248, - "loss": 0.0091, + "epoch": 0.57, + "learning_rate": 0.00021432614738838913, + "loss": 0.0142, "step": 113210 }, { - "epoch": 1.22, - "learning_rate": 0.00011640396964389959, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.0002143185796953751, + "loss": 0.0118, "step": 113220 }, { - "epoch": 1.22, - "learning_rate": 0.00011638775377829667, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.00021431101200236112, + "loss": 0.0115, "step": 113230 }, { - "epoch": 1.22, - "learning_rate": 0.00011637153791269377, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.0002143034443093471, + "loss": 0.0165, "step": 113240 }, { - "epoch": 1.22, - "learning_rate": 0.00011635532204709087, - "loss": 0.0125, + "epoch": 0.57, + "learning_rate": 0.00021429587661633308, + "loss": 0.013, "step": 113250 }, { - "epoch": 1.22, - "learning_rate": 0.00011633910618148796, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.0002142883089233191, + "loss": 0.0122, "step": 113260 }, { - "epoch": 1.22, - "learning_rate": 0.00011632289031588505, - "loss": 0.0115, + "epoch": 0.57, + "learning_rate": 0.00021428074123030507, + "loss": 0.0128, "step": 113270 }, { - "epoch": 1.22, - "learning_rate": 0.00011630667445028216, - "loss": 0.0111, + "epoch": 0.57, + "learning_rate": 0.00021427317353729105, + "loss": 0.0123, "step": 113280 }, { - "epoch": 1.22, - "learning_rate": 0.00011629045858467924, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.00021426560584427703, + "loss": 0.0125, "step": 113290 }, { - "epoch": 1.22, - "learning_rate": 0.00011627424271907634, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.00021425803815126304, + "loss": 0.0142, "step": 113300 }, { - "epoch": 1.22, - "learning_rate": 0.00011625802685347342, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.00021425047045824902, + "loss": 0.0155, "step": 113310 }, { - "epoch": 1.23, - "learning_rate": 0.00011624181098787053, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.000214242902765235, + "loss": 0.0127, "step": 113320 }, { - "epoch": 1.23, - "learning_rate": 0.00011622559512226761, - "loss": 0.0073, + "epoch": 0.57, + "learning_rate": 0.000214235335072221, + "loss": 0.0177, "step": 113330 }, { - "epoch": 1.23, - "learning_rate": 0.00011620937925666471, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.000214227767379207, + "loss": 0.0179, "step": 113340 }, { - "epoch": 1.23, - "learning_rate": 0.0001161931633910618, - "loss": 0.0091, + "epoch": 0.57, + "learning_rate": 0.00021422019968619297, + "loss": 0.0167, "step": 113350 }, { - "epoch": 1.23, - "learning_rate": 0.0001161769475254589, - "loss": 0.0109, + "epoch": 0.57, + "learning_rate": 0.00021421263199317898, + "loss": 0.0137, "step": 113360 }, { - "epoch": 1.23, - "learning_rate": 0.00011616073165985599, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.00021420506430016496, + "loss": 0.0126, "step": 113370 }, { - "epoch": 1.23, - "learning_rate": 0.00011614451579425308, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.00021419749660715095, + "loss": 0.0136, "step": 113380 }, { - "epoch": 1.23, - "learning_rate": 0.00011612829992865018, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021418992891413695, + "loss": 0.0182, "step": 113390 }, { - "epoch": 1.23, - "learning_rate": 0.00011611208406304728, - "loss": 0.0112, + "epoch": 0.57, + "learning_rate": 0.00021418236122112294, + "loss": 0.0153, "step": 113400 }, { - "epoch": 1.23, - "learning_rate": 0.00011609586819744436, - "loss": 0.0081, + "epoch": 0.57, + "learning_rate": 0.00021417479352810892, + "loss": 0.0141, "step": 113410 }, { - "epoch": 1.23, - "learning_rate": 0.00011607965233184147, - "loss": 0.0117, + "epoch": 0.57, + "learning_rate": 0.00021416722583509493, + "loss": 0.0167, "step": 113420 }, { - "epoch": 1.23, - "learning_rate": 0.00011606343646623855, - "loss": 0.0126, + "epoch": 0.57, + "learning_rate": 0.0002141596581420809, + "loss": 0.0156, "step": 113430 }, { - "epoch": 1.23, - "learning_rate": 0.00011604722060063565, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.0002141520904490669, + "loss": 0.0175, "step": 113440 }, { - "epoch": 1.23, - "learning_rate": 0.00011603100473503273, - "loss": 0.0109, + "epoch": 0.57, + "learning_rate": 0.00021414452275605287, + "loss": 0.017, "step": 113450 }, { - "epoch": 1.23, - "learning_rate": 0.00011601478886942984, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021413695506303888, + "loss": 0.0131, "step": 113460 }, { - "epoch": 1.23, - "learning_rate": 0.00011599857300382693, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021412938737002486, + "loss": 0.0128, "step": 113470 }, { - "epoch": 1.23, - "learning_rate": 0.00011598235713822403, - "loss": 0.0114, + "epoch": 0.57, + "learning_rate": 0.00021412181967701084, + "loss": 0.0122, "step": 113480 }, { - "epoch": 1.23, - "learning_rate": 0.00011596614127262112, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.00021411425198399685, + "loss": 0.0181, "step": 113490 }, { - "epoch": 1.23, - "learning_rate": 0.00011594992540701822, - "loss": 0.0113, + "epoch": 0.57, + "learning_rate": 0.00021410668429098283, + "loss": 0.0139, "step": 113500 }, { - "epoch": 1.23, - "learning_rate": 0.0001159337095414153, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.0002140991165979688, + "loss": 0.014, "step": 113510 }, { - "epoch": 1.23, - "learning_rate": 0.00011591749367581241, - "loss": 0.0079, + "epoch": 0.57, + "learning_rate": 0.00021409154890495482, + "loss": 0.0205, "step": 113520 }, { - "epoch": 1.23, - "learning_rate": 0.00011590127781020949, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.0002140839812119408, + "loss": 0.0162, "step": 113530 }, { - "epoch": 1.23, - "learning_rate": 0.0001158850619446066, - "loss": 0.0122, + "epoch": 0.57, + "learning_rate": 0.00021407641351892678, + "loss": 0.0136, "step": 113540 }, { - "epoch": 1.23, - "learning_rate": 0.00011586884607900367, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.0002140688458259128, + "loss": 0.0142, "step": 113550 }, { - "epoch": 1.23, - "learning_rate": 0.00011585263021340078, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021406127813289877, + "loss": 0.0172, "step": 113560 }, { - "epoch": 1.23, - "learning_rate": 0.00011583641434779787, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021405371043988476, + "loss": 0.013, "step": 113570 }, { - "epoch": 1.23, - "learning_rate": 0.00011582019848219497, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.00021404614274687076, + "loss": 0.0134, "step": 113580 }, { - "epoch": 1.23, - "learning_rate": 0.00011580398261659206, - "loss": 0.0117, + "epoch": 0.57, + "learning_rate": 0.00021403857505385675, + "loss": 0.0112, "step": 113590 }, { - "epoch": 1.23, - "learning_rate": 0.00011578776675098915, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021403100736084273, + "loss": 0.0147, "step": 113600 }, { - "epoch": 1.23, - "learning_rate": 0.00011577155088538624, - "loss": 0.012, + "epoch": 0.57, + "learning_rate": 0.0002140234396678287, + "loss": 0.0163, "step": 113610 }, { - "epoch": 1.23, - "learning_rate": 0.00011575533501978335, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.00021401587197481472, + "loss": 0.013, "step": 113620 }, { - "epoch": 1.23, - "learning_rate": 0.00011573911915418043, - "loss": 0.0078, + "epoch": 0.57, + "learning_rate": 0.0002140083042818007, + "loss": 0.0175, "step": 113630 }, { - "epoch": 1.23, - "learning_rate": 0.00011572290328857754, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.00021400073658878668, + "loss": 0.0173, "step": 113640 }, { - "epoch": 1.23, - "learning_rate": 0.00011570668742297464, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.0002139931688957727, + "loss": 0.0137, "step": 113650 }, { - "epoch": 1.23, - "learning_rate": 0.00011569047155737172, - "loss": 0.0111, + "epoch": 0.57, + "learning_rate": 0.00021398560120275867, + "loss": 0.013, "step": 113660 }, { - "epoch": 1.23, - "learning_rate": 0.00011567425569176883, - "loss": 0.0078, + "epoch": 0.57, + "learning_rate": 0.00021397803350974465, + "loss": 0.0123, "step": 113670 }, { - "epoch": 1.23, - "learning_rate": 0.00011565803982616591, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.00021397046581673066, + "loss": 0.0183, "step": 113680 }, { - "epoch": 1.23, - "learning_rate": 0.00011564182396056301, - "loss": 0.0081, + "epoch": 0.57, + "learning_rate": 0.00021396289812371664, + "loss": 0.016, "step": 113690 }, { - "epoch": 1.23, - "learning_rate": 0.00011562560809496009, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021395533043070262, + "loss": 0.0172, "step": 113700 }, { - "epoch": 1.23, - "learning_rate": 0.0001156093922293572, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.00021394776273768863, + "loss": 0.0139, "step": 113710 }, { - "epoch": 1.23, - "learning_rate": 0.00011559317636375429, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.0002139401950446746, + "loss": 0.0141, "step": 113720 }, { - "epoch": 1.23, - "learning_rate": 0.00011557696049815138, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.0002139326273516606, + "loss": 0.0152, "step": 113730 }, { - "epoch": 1.23, - "learning_rate": 0.00011556074463254848, - "loss": 0.0111, + "epoch": 0.57, + "learning_rate": 0.0002139250596586466, + "loss": 0.0127, "step": 113740 }, { - "epoch": 1.23, - "learning_rate": 0.00011554452876694557, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021391749196563256, + "loss": 0.0144, "step": 113750 }, { - "epoch": 1.23, - "learning_rate": 0.00011552831290134266, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021390992427261854, + "loss": 0.0143, "step": 113760 }, { - "epoch": 1.23, - "learning_rate": 0.00011551209703573977, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021390235657960452, + "loss": 0.0119, "step": 113770 }, { - "epoch": 1.23, - "learning_rate": 0.00011549588117013685, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.00021389478888659053, + "loss": 0.0137, "step": 113780 }, { - "epoch": 1.23, - "learning_rate": 0.00011547966530453395, - "loss": 0.0139, + "epoch": 0.57, + "learning_rate": 0.0002138872211935765, + "loss": 0.0168, "step": 113790 }, { - "epoch": 1.23, - "learning_rate": 0.00011546344943893103, - "loss": 0.012, + "epoch": 0.57, + "learning_rate": 0.0002138796535005625, + "loss": 0.014, "step": 113800 }, { - "epoch": 1.23, - "learning_rate": 0.00011544723357332814, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.0002138720858075485, + "loss": 0.0155, "step": 113810 }, { - "epoch": 1.23, - "learning_rate": 0.00011543101770772523, - "loss": 0.014, + "epoch": 0.57, + "learning_rate": 0.00021386451811453448, + "loss": 0.0164, "step": 113820 }, { - "epoch": 1.23, - "learning_rate": 0.00011541480184212233, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.00021385695042152046, + "loss": 0.0149, "step": 113830 }, { - "epoch": 1.23, - "learning_rate": 0.00011539858597651942, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.00021384938272850644, + "loss": 0.0165, "step": 113840 }, { - "epoch": 1.23, - "learning_rate": 0.00011538237011091651, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021384181503549245, + "loss": 0.0137, "step": 113850 }, { - "epoch": 1.23, - "learning_rate": 0.0001153661542453136, - "loss": 0.0108, + "epoch": 0.57, + "learning_rate": 0.00021383424734247843, + "loss": 0.0124, "step": 113860 }, { - "epoch": 1.23, - "learning_rate": 0.00011534993837971071, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021382667964946442, + "loss": 0.0167, "step": 113870 }, { - "epoch": 1.23, - "learning_rate": 0.00011533372251410779, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.00021381911195645042, + "loss": 0.0139, "step": 113880 }, { - "epoch": 1.23, - "learning_rate": 0.0001153175066485049, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.0002138115442634364, + "loss": 0.0131, "step": 113890 }, { - "epoch": 1.23, - "learning_rate": 0.00011530129078290197, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.0002138039765704224, + "loss": 0.0157, "step": 113900 }, { - "epoch": 1.23, - "learning_rate": 0.00011528507491729908, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.0002137964088774084, + "loss": 0.0146, "step": 113910 }, { - "epoch": 1.23, - "learning_rate": 0.00011526885905169616, - "loss": 0.0117, + "epoch": 0.57, + "learning_rate": 0.00021378884118439438, + "loss": 0.0136, "step": 113920 }, { - "epoch": 1.23, - "learning_rate": 0.00011525264318609327, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.00021378127349138036, + "loss": 0.0117, "step": 113930 }, { - "epoch": 1.23, - "learning_rate": 0.00011523642732049036, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.00021377370579836637, + "loss": 0.0126, "step": 113940 }, { - "epoch": 1.23, - "learning_rate": 0.00011522021145488745, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.00021376613810535235, + "loss": 0.0138, "step": 113950 }, { - "epoch": 1.23, - "learning_rate": 0.00011520399558928454, - "loss": 0.0125, + "epoch": 0.57, + "learning_rate": 0.00021375857041233833, + "loss": 0.0143, "step": 113960 }, { - "epoch": 1.23, - "learning_rate": 0.00011518777972368165, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021375100271932434, + "loss": 0.0129, "step": 113970 }, { - "epoch": 1.23, - "learning_rate": 0.00011517156385807873, - "loss": 0.0075, + "epoch": 0.58, + "learning_rate": 0.00021374343502631032, + "loss": 0.0132, "step": 113980 }, { - "epoch": 1.23, - "learning_rate": 0.00011515534799247584, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.0002137358673332963, + "loss": 0.0198, "step": 113990 }, { - "epoch": 1.23, - "learning_rate": 0.00011513913212687292, - "loss": 0.0106, + "epoch": 0.58, + "learning_rate": 0.00021372829964028228, + "loss": 0.0163, "step": 114000 }, { - "epoch": 1.23, - "eval_cer": 0.9215460437741146, - "eval_loss": 0.007686339318752289, - "eval_runtime": 121.2235, - "eval_samples_per_second": 16.498, - "eval_steps_per_second": 4.125, + "epoch": 0.58, + "eval_cer": 0.9144751078837893, + "eval_loss": 0.010899759829044342, + "eval_runtime": 116.7433, + "eval_samples_per_second": 17.132, + "eval_steps_per_second": 4.283, "step": 114000 }, { - "epoch": 1.23, - "learning_rate": 0.00011512291626127002, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.0002137207319472683, + "loss": 0.0124, "step": 114010 }, { - "epoch": 1.23, - "learning_rate": 0.0001151067003956671, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021371316425425427, + "loss": 0.0174, "step": 114020 }, { - "epoch": 1.23, - "learning_rate": 0.00011509048453006421, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.00021370559656124025, + "loss": 0.0158, "step": 114030 }, { - "epoch": 1.23, - "learning_rate": 0.0001150742686644613, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021369802886822626, + "loss": 0.0166, "step": 114040 }, { - "epoch": 1.23, - "learning_rate": 0.00011505805279885839, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.00021369046117521224, + "loss": 0.0124, "step": 114050 }, { - "epoch": 1.23, - "learning_rate": 0.00011504183693325549, - "loss": 0.0097, + "epoch": 0.58, + "learning_rate": 0.00021368289348219823, + "loss": 0.0182, "step": 114060 }, { - "epoch": 1.23, - "learning_rate": 0.00011502562106765258, - "loss": 0.0134, + "epoch": 0.58, + "learning_rate": 0.00021367532578918423, + "loss": 0.017, "step": 114070 }, { - "epoch": 1.23, - "learning_rate": 0.00011500940520204967, - "loss": 0.008, + "epoch": 0.58, + "learning_rate": 0.00021366775809617022, + "loss": 0.0179, "step": 114080 }, { - "epoch": 1.23, - "learning_rate": 0.00011499318933644678, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.0002136601904031562, + "loss": 0.0182, "step": 114090 }, { - "epoch": 1.23, - "learning_rate": 0.00011497697347084386, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.0002136526227101422, + "loss": 0.0149, "step": 114100 }, { - "epoch": 1.23, - "learning_rate": 0.00011496075760524096, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.0002136450550171282, + "loss": 0.019, "step": 114110 }, { - "epoch": 1.23, - "learning_rate": 0.00011494454173963804, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.00021363748732411417, + "loss": 0.0156, "step": 114120 }, { - "epoch": 1.23, - "learning_rate": 0.00011492832587403515, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021362991963110018, + "loss": 0.0116, "step": 114130 }, { - "epoch": 1.23, - "learning_rate": 0.00011491211000843223, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.00021362235193808616, + "loss": 0.0136, "step": 114140 }, { - "epoch": 1.23, - "learning_rate": 0.00011489589414282933, - "loss": 0.0122, + "epoch": 0.58, + "learning_rate": 0.00021361478424507214, + "loss": 0.0135, "step": 114150 }, { - "epoch": 1.23, - "learning_rate": 0.00011487967827722643, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021360721655205815, + "loss": 0.0153, "step": 114160 }, { - "epoch": 1.23, - "learning_rate": 0.00011486346241162352, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.00021359964885904413, + "loss": 0.015, "step": 114170 }, { - "epoch": 1.23, - "learning_rate": 0.00011484724654602061, - "loss": 0.0107, + "epoch": 0.58, + "learning_rate": 0.0002135920811660301, + "loss": 0.0125, "step": 114180 }, { - "epoch": 1.23, - "learning_rate": 0.00011483103068041772, - "loss": 0.0113, + "epoch": 0.58, + "learning_rate": 0.0002135845134730161, + "loss": 0.0199, "step": 114190 }, { - "epoch": 1.23, - "learning_rate": 0.0001148148148148148, - "loss": 0.0063, + "epoch": 0.58, + "learning_rate": 0.0002135769457800021, + "loss": 0.013, "step": 114200 }, { - "epoch": 1.23, - "learning_rate": 0.0001147985989492119, - "loss": 0.0105, + "epoch": 0.58, + "learning_rate": 0.00021356937808698808, + "loss": 0.0131, "step": 114210 }, { - "epoch": 1.23, - "learning_rate": 0.00011478238308360898, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021356181039397406, + "loss": 0.0158, "step": 114220 }, { - "epoch": 1.23, - "learning_rate": 0.00011476616721800609, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.00021355424270096007, + "loss": 0.0137, "step": 114230 }, { - "epoch": 1.23, - "learning_rate": 0.00011474995135240317, - "loss": 0.0105, + "epoch": 0.58, + "learning_rate": 0.00021354667500794605, + "loss": 0.0186, "step": 114240 }, { - "epoch": 1.24, - "learning_rate": 0.00011473373548680027, - "loss": 0.0076, + "epoch": 0.58, + "learning_rate": 0.00021353910731493204, + "loss": 0.016, "step": 114250 }, { - "epoch": 1.24, - "learning_rate": 0.00011471751962119737, - "loss": 0.0078, + "epoch": 0.58, + "learning_rate": 0.00021353153962191804, + "loss": 0.0156, "step": 114260 }, { - "epoch": 1.24, - "learning_rate": 0.00011470130375559446, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.00021352397192890403, + "loss": 0.0145, "step": 114270 }, { - "epoch": 1.24, - "learning_rate": 0.00011468508788999155, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021351640423589, + "loss": 0.014, "step": 114280 }, { - "epoch": 1.24, - "learning_rate": 0.00011466887202438865, - "loss": 0.0123, + "epoch": 0.58, + "learning_rate": 0.00021350883654287602, + "loss": 0.0156, "step": 114290 }, { - "epoch": 1.24, - "learning_rate": 0.00011465265615878574, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.000213501268849862, + "loss": 0.0177, "step": 114300 }, { - "epoch": 1.24, - "learning_rate": 0.00011463644029318285, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021349370115684798, + "loss": 0.0136, "step": 114310 }, { - "epoch": 1.24, - "learning_rate": 0.00011462022442757992, - "loss": 0.0073, + "epoch": 0.58, + "learning_rate": 0.000213486133463834, + "loss": 0.0139, "step": 114320 }, { - "epoch": 1.24, - "learning_rate": 0.00011460400856197703, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.00021347856577081997, + "loss": 0.0191, "step": 114330 }, { - "epoch": 1.24, - "learning_rate": 0.00011458779269637411, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021347099807780595, + "loss": 0.0184, "step": 114340 }, { - "epoch": 1.24, - "learning_rate": 0.00011457157683077122, - "loss": 0.0073, + "epoch": 0.58, + "learning_rate": 0.00021346343038479193, + "loss": 0.018, "step": 114350 }, { - "epoch": 1.24, - "learning_rate": 0.00011455536096516831, - "loss": 0.008, + "epoch": 0.58, + "learning_rate": 0.00021345586269177794, + "loss": 0.0148, "step": 114360 }, { - "epoch": 1.24, - "learning_rate": 0.0001145391450995654, - "loss": 0.0074, + "epoch": 0.58, + "learning_rate": 0.00021344829499876392, + "loss": 0.0157, "step": 114370 }, { - "epoch": 1.24, - "learning_rate": 0.00011452292923396251, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.0002134407273057499, + "loss": 0.0136, "step": 114380 }, { - "epoch": 1.24, - "learning_rate": 0.00011450671336835959, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.0002134331596127359, + "loss": 0.0158, "step": 114390 }, { - "epoch": 1.24, - "learning_rate": 0.0001144904975027567, - "loss": 0.0071, + "epoch": 0.58, + "learning_rate": 0.0002134255919197219, + "loss": 0.0144, "step": 114400 }, { - "epoch": 1.24, - "learning_rate": 0.00011447428163715379, - "loss": 0.0126, + "epoch": 0.58, + "learning_rate": 0.00021341802422670787, + "loss": 0.015, "step": 114410 }, { - "epoch": 1.24, - "learning_rate": 0.00011445806577155088, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021341045653369388, + "loss": 0.013, "step": 114420 }, { - "epoch": 1.24, - "learning_rate": 0.00011444184990594797, - "loss": 0.013, + "epoch": 0.58, + "learning_rate": 0.00021340288884067986, + "loss": 0.0137, "step": 114430 }, { - "epoch": 1.24, - "learning_rate": 0.00011442563404034508, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021339532114766585, + "loss": 0.0161, "step": 114440 }, { - "epoch": 1.24, - "learning_rate": 0.00011440941817474216, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.00021338775345465185, + "loss": 0.0173, "step": 114450 }, { - "epoch": 1.24, - "learning_rate": 0.00011439320230913926, - "loss": 0.011, + "epoch": 0.58, + "learning_rate": 0.00021338018576163784, + "loss": 0.0167, "step": 114460 }, { - "epoch": 1.24, - "learning_rate": 0.00011437698644353634, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.00021337261806862382, + "loss": 0.0128, "step": 114470 }, { - "epoch": 1.24, - "learning_rate": 0.00011436077057793345, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021336505037560983, + "loss": 0.0147, "step": 114480 }, { - "epoch": 1.24, - "learning_rate": 0.00011434455471233053, - "loss": 0.0097, + "epoch": 0.58, + "learning_rate": 0.0002133574826825958, + "loss": 0.0143, "step": 114490 }, { - "epoch": 1.24, - "learning_rate": 0.00011432833884672763, - "loss": 0.0104, + "epoch": 0.58, + "learning_rate": 0.0002133499149895818, + "loss": 0.0149, "step": 114500 }, { - "epoch": 1.24, - "learning_rate": 0.00011431212298112473, - "loss": 0.0109, + "epoch": 0.58, + "learning_rate": 0.00021334234729656777, + "loss": 0.0123, "step": 114510 }, { - "epoch": 1.24, - "learning_rate": 0.00011429590711552182, - "loss": 0.0136, + "epoch": 0.58, + "learning_rate": 0.00021333477960355378, + "loss": 0.0166, "step": 114520 }, { - "epoch": 1.24, - "learning_rate": 0.00011427969124991891, - "loss": 0.0072, + "epoch": 0.58, + "learning_rate": 0.00021332721191053976, + "loss": 0.0144, "step": 114530 }, { - "epoch": 1.24, - "learning_rate": 0.000114263475384316, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.00021331964421752574, + "loss": 0.0137, "step": 114540 }, { - "epoch": 1.24, - "learning_rate": 0.0001142472595187131, - "loss": 0.0115, + "epoch": 0.58, + "learning_rate": 0.00021331207652451175, + "loss": 0.0149, "step": 114550 }, { - "epoch": 1.24, - "learning_rate": 0.0001142310436531102, - "loss": 0.011, + "epoch": 0.58, + "learning_rate": 0.00021330450883149773, + "loss": 0.0172, "step": 114560 }, { - "epoch": 1.24, - "learning_rate": 0.00011421482778750728, - "loss": 0.0114, + "epoch": 0.58, + "learning_rate": 0.0002132969411384837, + "loss": 0.0155, "step": 114570 }, { - "epoch": 1.24, - "learning_rate": 0.00011419861192190439, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021328937344546972, + "loss": 0.0166, "step": 114580 }, { - "epoch": 1.24, - "learning_rate": 0.00011418239605630147, - "loss": 0.0075, + "epoch": 0.58, + "learning_rate": 0.0002132818057524557, + "loss": 0.0122, "step": 114590 }, { - "epoch": 1.24, - "learning_rate": 0.00011416618019069858, - "loss": 0.0107, + "epoch": 0.58, + "learning_rate": 0.00021327423805944168, + "loss": 0.0126, "step": 114600 }, { - "epoch": 1.24, - "learning_rate": 0.00011414996432509565, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.0002132666703664277, + "loss": 0.0165, "step": 114610 }, { - "epoch": 1.24, - "learning_rate": 0.00011413374845949276, - "loss": 0.0107, + "epoch": 0.58, + "learning_rate": 0.00021325910267341367, + "loss": 0.015, "step": 114620 }, { - "epoch": 1.24, - "learning_rate": 0.00011411753259388985, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021325153498039966, + "loss": 0.0154, "step": 114630 }, { - "epoch": 1.24, - "learning_rate": 0.00011410131672828695, - "loss": 0.0108, + "epoch": 0.58, + "learning_rate": 0.00021324396728738566, + "loss": 0.0113, "step": 114640 }, { - "epoch": 1.24, - "learning_rate": 0.00011408510086268404, - "loss": 0.0112, + "epoch": 0.58, + "learning_rate": 0.00021323639959437165, + "loss": 0.016, "step": 114650 }, { - "epoch": 1.24, - "learning_rate": 0.00011406888499708115, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021322883190135763, + "loss": 0.0173, "step": 114660 }, { - "epoch": 1.24, - "learning_rate": 0.00011405266913147822, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021322126420834364, + "loss": 0.0144, "step": 114670 }, { - "epoch": 1.24, - "learning_rate": 0.00011403645326587533, - "loss": 0.0123, + "epoch": 0.58, + "learning_rate": 0.00021321369651532962, + "loss": 0.0172, "step": 114680 }, { - "epoch": 1.24, - "learning_rate": 0.00011402023740027241, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.0002132061288223156, + "loss": 0.0195, "step": 114690 }, { - "epoch": 1.24, - "learning_rate": 0.00011400402153466952, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.00021319856112930158, + "loss": 0.0155, "step": 114700 }, { - "epoch": 1.24, - "learning_rate": 0.0001139878056690666, - "loss": 0.0118, + "epoch": 0.58, + "learning_rate": 0.0002131909934362876, + "loss": 0.0172, "step": 114710 }, { - "epoch": 1.24, - "learning_rate": 0.0001139715898034637, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021318342574327357, + "loss": 0.0176, "step": 114720 }, { - "epoch": 1.24, - "learning_rate": 0.0001139553739378608, - "loss": 0.0122, + "epoch": 0.58, + "learning_rate": 0.00021317585805025955, + "loss": 0.0133, "step": 114730 }, { - "epoch": 1.24, - "learning_rate": 0.00011393915807225789, - "loss": 0.0106, + "epoch": 0.58, + "learning_rate": 0.00021316829035724556, + "loss": 0.0148, "step": 114740 }, { - "epoch": 1.24, - "learning_rate": 0.00011392294220665498, - "loss": 0.008, + "epoch": 0.58, + "learning_rate": 0.00021316072266423154, + "loss": 0.0113, "step": 114750 }, { - "epoch": 1.24, - "learning_rate": 0.00011390672634105207, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021315315497121752, + "loss": 0.0164, "step": 114760 }, { - "epoch": 1.24, - "learning_rate": 0.00011389051047544917, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.00021314558727820353, + "loss": 0.0172, "step": 114770 }, { - "epoch": 1.24, - "learning_rate": 0.00011387429460984627, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.0002131380195851895, + "loss": 0.0137, "step": 114780 }, { - "epoch": 1.24, - "learning_rate": 0.00011385807874424335, - "loss": 0.0077, + "epoch": 0.58, + "learning_rate": 0.0002131304518921755, + "loss": 0.0176, "step": 114790 }, { - "epoch": 1.24, - "learning_rate": 0.00011384186287864046, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.0002131228841991615, + "loss": 0.0144, "step": 114800 }, { - "epoch": 1.24, - "learning_rate": 0.00011382564701303754, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021311531650614748, + "loss": 0.0164, "step": 114810 }, { - "epoch": 1.24, - "learning_rate": 0.00011380943114743464, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021310774881313347, + "loss": 0.0147, "step": 114820 }, { - "epoch": 1.24, - "learning_rate": 0.00011379321528183174, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021310018112011947, + "loss": 0.0126, "step": 114830 }, { - "epoch": 1.24, - "learning_rate": 0.00011377699941622883, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.00021309261342710546, + "loss": 0.0139, "step": 114840 }, { - "epoch": 1.24, - "learning_rate": 0.00011376078355062592, - "loss": 0.0125, + "epoch": 0.58, + "learning_rate": 0.00021308504573409144, + "loss": 0.0145, "step": 114850 }, { - "epoch": 1.24, - "learning_rate": 0.00011374456768502301, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.00021307747804107742, + "loss": 0.0157, "step": 114860 }, { - "epoch": 1.24, - "learning_rate": 0.0001137283518194201, - "loss": 0.0104, + "epoch": 0.58, + "learning_rate": 0.00021306991034806343, + "loss": 0.0135, "step": 114870 }, { - "epoch": 1.24, - "learning_rate": 0.00011371213595381721, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.0002130623426550494, + "loss": 0.0161, "step": 114880 }, { - "epoch": 1.24, - "learning_rate": 0.00011369592008821429, - "loss": 0.0119, + "epoch": 0.58, + "learning_rate": 0.0002130547749620354, + "loss": 0.0139, "step": 114890 }, { - "epoch": 1.24, - "learning_rate": 0.0001136797042226114, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.0002130472072690214, + "loss": 0.014, "step": 114900 }, { - "epoch": 1.24, - "learning_rate": 0.00011366348835700848, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.00021303963957600738, + "loss": 0.016, "step": 114910 }, { - "epoch": 1.24, - "learning_rate": 0.00011364727249140558, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.00021303207188299336, + "loss": 0.0133, "step": 114920 }, { - "epoch": 1.24, - "learning_rate": 0.00011363105662580266, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021302450418997937, + "loss": 0.015, "step": 114930 }, { - "epoch": 1.24, - "learning_rate": 0.00011361484076019977, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021301693649696535, + "loss": 0.0177, "step": 114940 }, { - "epoch": 1.24, - "learning_rate": 0.00011359862489459686, - "loss": 0.0114, + "epoch": 0.58, + "learning_rate": 0.00021300936880395133, + "loss": 0.0156, "step": 114950 }, { - "epoch": 1.24, - "learning_rate": 0.00011358240902899395, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021300180111093734, + "loss": 0.0172, "step": 114960 }, { - "epoch": 1.24, - "learning_rate": 0.00011356619316339105, - "loss": 0.0107, + "epoch": 0.58, + "learning_rate": 0.00021299423341792332, + "loss": 0.0139, "step": 114970 }, { - "epoch": 1.24, - "learning_rate": 0.00011354997729778815, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.0002129866657249093, + "loss": 0.0137, "step": 114980 }, { - "epoch": 1.24, - "learning_rate": 0.00011353376143218523, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.0002129790980318953, + "loss": 0.0122, "step": 114990 }, { - "epoch": 1.24, - "learning_rate": 0.00011351754556658234, - "loss": 0.0107, + "epoch": 0.58, + "learning_rate": 0.0002129715303388813, + "loss": 0.0139, "step": 115000 }, { - "epoch": 1.24, - "eval_cer": 0.9215182484795105, - "eval_loss": 0.007636575493961573, - "eval_runtime": 121.1591, - "eval_samples_per_second": 16.507, - "eval_steps_per_second": 4.127, + "epoch": 0.58, + "eval_cer": 0.914481900656667, + "eval_loss": 0.010673732496798038, + "eval_runtime": 116.7514, + "eval_samples_per_second": 17.13, + "eval_steps_per_second": 4.283, "step": 115000 }, { - "epoch": 1.24, - "learning_rate": 0.00011350132970097942, - "loss": 0.0077, + "epoch": 0.58, + "learning_rate": 0.00021296396264586725, + "loss": 0.0189, "step": 115010 }, { - "epoch": 1.24, - "learning_rate": 0.00011348511383537652, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021295639495285323, + "loss": 0.0179, "step": 115020 }, { - "epoch": 1.24, - "learning_rate": 0.0001134688979697736, - "loss": 0.011, + "epoch": 0.58, + "learning_rate": 0.00021294882725983924, + "loss": 0.0161, "step": 115030 }, { - "epoch": 1.24, - "learning_rate": 0.00011345268210417071, - "loss": 0.0112, + "epoch": 0.58, + "learning_rate": 0.00021294125956682522, + "loss": 0.0156, "step": 115040 }, { - "epoch": 1.24, - "learning_rate": 0.0001134364662385678, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.0002129336918738112, + "loss": 0.0132, "step": 115050 }, { - "epoch": 1.24, - "learning_rate": 0.0001134202503729649, - "loss": 0.0122, + "epoch": 0.58, + "learning_rate": 0.0002129261241807972, + "loss": 0.0175, "step": 115060 }, { - "epoch": 1.24, - "learning_rate": 0.00011340403450736199, - "loss": 0.011, + "epoch": 0.58, + "learning_rate": 0.0002129185564877832, + "loss": 0.0137, "step": 115070 }, { - "epoch": 1.24, - "learning_rate": 0.00011338781864175908, - "loss": 0.0073, + "epoch": 0.58, + "learning_rate": 0.00021291098879476917, + "loss": 0.0133, "step": 115080 }, { - "epoch": 1.24, - "learning_rate": 0.00011337160277615619, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.00021290342110175515, + "loss": 0.0138, "step": 115090 }, { - "epoch": 1.24, - "learning_rate": 0.00011335538691055328, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.00021289585340874116, + "loss": 0.0155, "step": 115100 }, { - "epoch": 1.24, - "learning_rate": 0.00011333917104495037, - "loss": 0.0102, + "epoch": 0.58, + "learning_rate": 0.00021288828571572714, + "loss": 0.0138, "step": 115110 }, { - "epoch": 1.24, - "learning_rate": 0.00011332295517934747, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021288071802271313, + "loss": 0.0133, "step": 115120 }, { - "epoch": 1.24, - "learning_rate": 0.00011330673931374457, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021287315032969913, + "loss": 0.015, "step": 115130 }, { - "epoch": 1.24, - "learning_rate": 0.00011329052344814165, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.00021286558263668512, + "loss": 0.0165, "step": 115140 }, { - "epoch": 1.24, - "learning_rate": 0.00011327430758253876, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.0002128580149436711, + "loss": 0.0177, "step": 115150 }, { - "epoch": 1.24, - "learning_rate": 0.00011325809171693584, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.0002128504472506571, + "loss": 0.0166, "step": 115160 }, { - "epoch": 1.25, - "learning_rate": 0.00011324187585133294, - "loss": 0.0106, + "epoch": 0.58, + "learning_rate": 0.0002128428795576431, + "loss": 0.0148, "step": 115170 }, { - "epoch": 1.25, - "learning_rate": 0.00011322565998573002, - "loss": 0.0111, + "epoch": 0.58, + "learning_rate": 0.00021283531186462907, + "loss": 0.015, "step": 115180 }, { - "epoch": 1.25, - "learning_rate": 0.00011320944412012713, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.00021282774417161508, + "loss": 0.0151, "step": 115190 }, { - "epoch": 1.25, - "learning_rate": 0.00011319322825452422, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.00021282017647860106, + "loss": 0.0125, "step": 115200 }, { - "epoch": 1.25, - "learning_rate": 0.00011317701238892131, - "loss": 0.0104, + "epoch": 0.58, + "learning_rate": 0.00021281260878558704, + "loss": 0.0148, "step": 115210 }, { - "epoch": 1.25, - "learning_rate": 0.0001131607965233184, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021280504109257305, + "loss": 0.0161, "step": 115220 }, { - "epoch": 1.25, - "learning_rate": 0.0001131445806577155, - "loss": 0.0129, + "epoch": 0.58, + "learning_rate": 0.00021279747339955903, + "loss": 0.0156, "step": 115230 }, { - "epoch": 1.25, - "learning_rate": 0.00011312836479211259, - "loss": 0.0073, + "epoch": 0.58, + "learning_rate": 0.000212789905706545, + "loss": 0.0138, "step": 115240 }, { - "epoch": 1.25, - "learning_rate": 0.0001131121489265097, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.000212782338013531, + "loss": 0.0171, "step": 115250 }, { - "epoch": 1.25, - "learning_rate": 0.00011309593306090678, - "loss": 0.0116, + "epoch": 0.58, + "learning_rate": 0.000212774770320517, + "loss": 0.0167, "step": 115260 }, { - "epoch": 1.25, - "learning_rate": 0.00011307971719530388, - "loss": 0.0106, + "epoch": 0.58, + "learning_rate": 0.00021276720262750298, + "loss": 0.0131, "step": 115270 }, { - "epoch": 1.25, - "learning_rate": 0.00011306350132970096, - "loss": 0.0076, + "epoch": 0.58, + "learning_rate": 0.00021275963493448896, + "loss": 0.014, "step": 115280 }, { - "epoch": 1.25, - "learning_rate": 0.00011304728546409807, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021275206724147497, + "loss": 0.0129, "step": 115290 }, { - "epoch": 1.25, - "learning_rate": 0.00011303106959849515, - "loss": 0.0104, + "epoch": 0.58, + "learning_rate": 0.00021274449954846095, + "loss": 0.0186, "step": 115300 }, { - "epoch": 1.25, - "learning_rate": 0.00011301485373289225, - "loss": 0.0107, + "epoch": 0.58, + "learning_rate": 0.00021273693185544694, + "loss": 0.0129, "step": 115310 }, { - "epoch": 1.25, - "learning_rate": 0.00011299863786728935, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021272936416243294, + "loss": 0.014, "step": 115320 }, { - "epoch": 1.25, - "learning_rate": 0.00011298242200168644, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.00021272179646941893, + "loss": 0.017, "step": 115330 }, { - "epoch": 1.25, - "learning_rate": 0.00011296620613608353, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.0002127142287764049, + "loss": 0.0142, "step": 115340 }, { - "epoch": 1.25, - "learning_rate": 0.00011294999027048064, - "loss": 0.008, + "epoch": 0.58, + "learning_rate": 0.00021270666108339092, + "loss": 0.017, "step": 115350 }, { - "epoch": 1.25, - "learning_rate": 0.00011293377440487772, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.0002126990933903769, + "loss": 0.0163, "step": 115360 }, { - "epoch": 1.25, - "learning_rate": 0.00011291755853927482, - "loss": 0.0108, + "epoch": 0.58, + "learning_rate": 0.00021269152569736288, + "loss": 0.0149, "step": 115370 }, { - "epoch": 1.25, - "learning_rate": 0.0001129013426736719, - "loss": 0.0128, + "epoch": 0.58, + "learning_rate": 0.0002126839580043489, + "loss": 0.0133, "step": 115380 }, { - "epoch": 1.25, - "learning_rate": 0.00011288512680806901, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.00021267639031133487, + "loss": 0.0156, "step": 115390 }, { - "epoch": 1.25, - "learning_rate": 0.00011286891094246609, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021266882261832085, + "loss": 0.0144, "step": 115400 }, { - "epoch": 1.25, - "learning_rate": 0.0001128526950768632, - "loss": 0.0097, + "epoch": 0.58, + "learning_rate": 0.00021266125492530683, + "loss": 0.0124, "step": 115410 }, { - "epoch": 1.25, - "learning_rate": 0.00011283647921126029, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.00021265368723229284, + "loss": 0.0131, "step": 115420 }, { - "epoch": 1.25, - "learning_rate": 0.00011282026334565738, - "loss": 0.0097, + "epoch": 0.58, + "learning_rate": 0.00021264611953927882, + "loss": 0.0134, "step": 115430 }, { - "epoch": 1.25, - "learning_rate": 0.00011280404748005447, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.0002126385518462648, + "loss": 0.0152, "step": 115440 }, { - "epoch": 1.25, - "learning_rate": 0.00011278783161445158, - "loss": 0.0095, + "epoch": 0.58, + "learning_rate": 0.0002126309841532508, + "loss": 0.013, "step": 115450 }, { - "epoch": 1.25, - "learning_rate": 0.00011277161574884866, - "loss": 0.0119, + "epoch": 0.58, + "learning_rate": 0.0002126234164602368, + "loss": 0.0147, "step": 115460 }, { - "epoch": 1.25, - "learning_rate": 0.00011275539988324577, - "loss": 0.0102, + "epoch": 0.58, + "learning_rate": 0.00021261584876722277, + "loss": 0.0212, "step": 115470 }, { - "epoch": 1.25, - "learning_rate": 0.00011273918401764285, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021260828107420878, + "loss": 0.0134, "step": 115480 }, { - "epoch": 1.25, - "learning_rate": 0.00011272296815203995, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021260071338119476, + "loss": 0.0186, "step": 115490 }, { - "epoch": 1.25, - "learning_rate": 0.00011270675228643703, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021259314568818075, + "loss": 0.0145, "step": 115500 }, { - "epoch": 1.25, - "learning_rate": 0.00011269053642083414, - "loss": 0.0097, + "epoch": 0.58, + "learning_rate": 0.00021258557799516675, + "loss": 0.0126, "step": 115510 }, { - "epoch": 1.25, - "learning_rate": 0.00011267432055523123, - "loss": 0.0109, + "epoch": 0.58, + "learning_rate": 0.00021257801030215274, + "loss": 0.0182, "step": 115520 }, { - "epoch": 1.25, - "learning_rate": 0.00011265810468962832, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.00021257044260913872, + "loss": 0.0148, "step": 115530 }, { - "epoch": 1.25, - "learning_rate": 0.00011264188882402542, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.00021256287491612473, + "loss": 0.0169, "step": 115540 }, { - "epoch": 1.25, - "learning_rate": 0.00011262567295842251, - "loss": 0.0104, + "epoch": 0.58, + "learning_rate": 0.0002125553072231107, + "loss": 0.0121, "step": 115550 }, { - "epoch": 1.25, - "learning_rate": 0.0001126094570928196, - "loss": 0.0121, + "epoch": 0.58, + "learning_rate": 0.0002125477395300967, + "loss": 0.0132, "step": 115560 }, { - "epoch": 1.25, - "learning_rate": 0.00011259324122721671, - "loss": 0.012, + "epoch": 0.58, + "learning_rate": 0.0002125401718370827, + "loss": 0.0173, "step": 115570 }, { - "epoch": 1.25, - "learning_rate": 0.00011257702536161379, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.00021253260414406868, + "loss": 0.0155, "step": 115580 }, { - "epoch": 1.25, - "learning_rate": 0.00011256080949601089, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021252503645105466, + "loss": 0.0125, "step": 115590 }, { - "epoch": 1.25, - "learning_rate": 0.00011254459363040797, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021251746875804064, + "loss": 0.0122, "step": 115600 }, { - "epoch": 1.25, - "learning_rate": 0.00011252837776480508, - "loss": 0.0077, + "epoch": 0.58, + "learning_rate": 0.00021250990106502665, + "loss": 0.015, "step": 115610 }, { - "epoch": 1.25, - "learning_rate": 0.00011251216189920216, - "loss": 0.0103, + "epoch": 0.58, + "learning_rate": 0.00021250233337201263, + "loss": 0.0173, "step": 115620 }, { - "epoch": 1.25, - "learning_rate": 0.00011249594603359926, - "loss": 0.0111, + "epoch": 0.58, + "learning_rate": 0.00021249476567899861, + "loss": 0.0134, "step": 115630 }, { - "epoch": 1.25, - "learning_rate": 0.00011247973016799636, - "loss": 0.0095, + "epoch": 0.58, + "learning_rate": 0.00021248719798598462, + "loss": 0.0141, "step": 115640 }, { - "epoch": 1.25, - "learning_rate": 0.00011246351430239345, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.0002124796302929706, + "loss": 0.0159, "step": 115650 }, { - "epoch": 1.25, - "learning_rate": 0.00011244729843679054, - "loss": 0.0104, + "epoch": 0.58, + "learning_rate": 0.00021247206259995659, + "loss": 0.0143, "step": 115660 }, { - "epoch": 1.25, - "learning_rate": 0.00011243108257118765, - "loss": 0.0107, + "epoch": 0.58, + "learning_rate": 0.0002124644949069426, + "loss": 0.0169, "step": 115670 }, { - "epoch": 1.25, - "learning_rate": 0.00011241486670558473, - "loss": 0.0105, + "epoch": 0.58, + "learning_rate": 0.00021245692721392858, + "loss": 0.0172, "step": 115680 }, { - "epoch": 1.25, - "learning_rate": 0.00011239865083998183, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021244935952091456, + "loss": 0.0152, "step": 115690 }, { - "epoch": 1.25, - "learning_rate": 0.00011238243497437891, - "loss": 0.0078, + "epoch": 0.58, + "learning_rate": 0.00021244179182790056, + "loss": 0.0121, "step": 115700 }, { - "epoch": 1.25, - "learning_rate": 0.00011236621910877602, - "loss": 0.0111, + "epoch": 0.58, + "learning_rate": 0.00021243422413488655, + "loss": 0.0149, "step": 115710 }, { - "epoch": 1.25, - "learning_rate": 0.0001123500032431731, - "loss": 0.0124, + "epoch": 0.58, + "learning_rate": 0.00021242665644187253, + "loss": 0.0119, "step": 115720 }, { - "epoch": 1.25, - "learning_rate": 0.0001123337873775702, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021241908874885854, + "loss": 0.0166, "step": 115730 }, { - "epoch": 1.25, - "learning_rate": 0.0001123175715119673, - "loss": 0.008, + "epoch": 0.58, + "learning_rate": 0.00021241152105584452, + "loss": 0.0142, "step": 115740 }, { - "epoch": 1.25, - "learning_rate": 0.00011230135564636439, - "loss": 0.0071, + "epoch": 0.58, + "learning_rate": 0.0002124039533628305, + "loss": 0.0153, "step": 115750 }, { - "epoch": 1.25, - "learning_rate": 0.00011228513978076148, - "loss": 0.0111, + "epoch": 0.58, + "learning_rate": 0.00021239638566981648, + "loss": 0.012, "step": 115760 }, { - "epoch": 1.25, - "learning_rate": 0.00011226892391515858, - "loss": 0.0125, + "epoch": 0.58, + "learning_rate": 0.0002123888179768025, + "loss": 0.0147, "step": 115770 }, { - "epoch": 1.25, - "learning_rate": 0.00011225270804955567, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.00021238125028378847, + "loss": 0.0127, "step": 115780 }, { - "epoch": 1.25, - "learning_rate": 0.00011223649218395277, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.00021237368259077445, + "loss": 0.0133, "step": 115790 }, { - "epoch": 1.25, - "learning_rate": 0.00011222027631834985, - "loss": 0.0103, + "epoch": 0.58, + "learning_rate": 0.00021236611489776046, + "loss": 0.0144, "step": 115800 }, { - "epoch": 1.25, - "learning_rate": 0.00011220406045274696, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.00021235854720474644, + "loss": 0.0151, "step": 115810 }, { - "epoch": 1.25, - "learning_rate": 0.00011218784458714407, - "loss": 0.0112, + "epoch": 0.58, + "learning_rate": 0.00021235097951173242, + "loss": 0.0127, "step": 115820 }, { - "epoch": 1.25, - "learning_rate": 0.00011217162872154115, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021234341181871843, + "loss": 0.0137, "step": 115830 }, { - "epoch": 1.25, - "learning_rate": 0.00011215541285593825, - "loss": 0.0087, + "epoch": 0.58, + "learning_rate": 0.00021233584412570441, + "loss": 0.0156, "step": 115840 }, { - "epoch": 1.25, - "learning_rate": 0.00011213919699033533, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.0002123282764326904, + "loss": 0.0145, "step": 115850 }, { - "epoch": 1.25, - "learning_rate": 0.00011212298112473244, - "loss": 0.008, + "epoch": 0.58, + "learning_rate": 0.0002123207087396764, + "loss": 0.0158, "step": 115860 }, { - "epoch": 1.25, - "learning_rate": 0.00011210676525912952, - "loss": 0.0097, + "epoch": 0.58, + "learning_rate": 0.00021231314104666239, + "loss": 0.013, "step": 115870 }, { - "epoch": 1.25, - "learning_rate": 0.00011209054939352662, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.00021230557335364837, + "loss": 0.0139, "step": 115880 }, { - "epoch": 1.25, - "learning_rate": 0.00011207433352792372, - "loss": 0.0114, + "epoch": 0.58, + "learning_rate": 0.00021229800566063438, + "loss": 0.0112, "step": 115890 }, { - "epoch": 1.25, - "learning_rate": 0.00011205811766232081, - "loss": 0.0111, + "epoch": 0.58, + "learning_rate": 0.00021229043796762036, + "loss": 0.0131, "step": 115900 }, { - "epoch": 1.25, - "learning_rate": 0.0001120419017967179, - "loss": 0.0106, + "epoch": 0.58, + "learning_rate": 0.00021228287027460634, + "loss": 0.0131, "step": 115910 }, { - "epoch": 1.25, - "learning_rate": 0.000112025685931115, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.00021227530258159232, + "loss": 0.0189, "step": 115920 }, { - "epoch": 1.25, - "learning_rate": 0.00011200947006551209, - "loss": 0.0107, + "epoch": 0.58, + "learning_rate": 0.00021226773488857833, + "loss": 0.0137, "step": 115930 }, { - "epoch": 1.25, - "learning_rate": 0.00011199325419990919, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.0002122601671955643, + "loss": 0.0137, "step": 115940 }, { - "epoch": 1.25, - "learning_rate": 0.00011197703833430627, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.0002122525995025503, + "loss": 0.0169, "step": 115950 }, { - "epoch": 1.25, - "learning_rate": 0.00011196082246870338, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.0002122450318095363, + "loss": 0.0187, "step": 115960 }, { - "epoch": 1.25, - "learning_rate": 0.00011194460660310046, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021223746411652228, + "loss": 0.021, "step": 115970 }, { - "epoch": 1.25, - "learning_rate": 0.00011192839073749756, - "loss": 0.0113, + "epoch": 0.59, + "learning_rate": 0.00021222989642350826, + "loss": 0.0137, "step": 115980 }, { - "epoch": 1.25, - "learning_rate": 0.00011191217487189466, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021222232873049427, + "loss": 0.0138, "step": 115990 }, { - "epoch": 1.25, - "learning_rate": 0.00011189595900629175, - "loss": 0.0111, + "epoch": 0.59, + "learning_rate": 0.00021221476103748025, + "loss": 0.016, "step": 116000 }, { - "epoch": 1.25, - "eval_cer": 0.9215382263475072, - "eval_loss": 0.00765196094289422, - "eval_runtime": 121.1107, - "eval_samples_per_second": 16.514, - "eval_steps_per_second": 4.128, + "epoch": 0.59, + "eval_cer": 0.9144634631302844, + "eval_loss": 0.01081350538879633, + "eval_runtime": 116.7675, + "eval_samples_per_second": 17.128, + "eval_steps_per_second": 4.282, "step": 116000 }, { - "epoch": 1.25, - "learning_rate": 0.00011187974314068884, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021220719334446623, + "loss": 0.013, "step": 116010 }, { - "epoch": 1.25, - "learning_rate": 0.00011186352727508593, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.00021219962565145224, + "loss": 0.0133, "step": 116020 }, { - "epoch": 1.25, - "learning_rate": 0.00011184731140948303, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.00021219205795843822, + "loss": 0.0153, "step": 116030 }, { - "epoch": 1.25, - "learning_rate": 0.00011183109554388013, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.0002121844902654242, + "loss": 0.0156, "step": 116040 }, { - "epoch": 1.25, - "learning_rate": 0.00011181487967827721, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.00021217692257241021, + "loss": 0.0145, "step": 116050 }, { - "epoch": 1.25, - "learning_rate": 0.00011179866381267432, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.0002121693548793962, + "loss": 0.024, "step": 116060 }, { - "epoch": 1.25, - "learning_rate": 0.0001117824479470714, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021216178718638218, + "loss": 0.0143, "step": 116070 }, { - "epoch": 1.25, - "learning_rate": 0.0001117662320814685, - "loss": 0.0114, + "epoch": 0.59, + "learning_rate": 0.00021215421949336819, + "loss": 0.0164, "step": 116080 }, { - "epoch": 1.25, - "learning_rate": 0.00011175001621586558, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021214665180035417, + "loss": 0.0155, "step": 116090 }, { - "epoch": 1.26, - "learning_rate": 0.00011173380035026269, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021213908410734015, + "loss": 0.0149, "step": 116100 }, { - "epoch": 1.26, - "learning_rate": 0.00011171758448465978, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021213151641432613, + "loss": 0.0143, "step": 116110 }, { - "epoch": 1.26, - "learning_rate": 0.00011170136861905688, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.00021212394872131214, + "loss": 0.0126, "step": 116120 }, { - "epoch": 1.26, - "learning_rate": 0.00011168515275345397, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021211638102829812, + "loss": 0.0152, "step": 116130 }, { - "epoch": 1.26, - "learning_rate": 0.00011166893688785107, - "loss": 0.0069, + "epoch": 0.59, + "learning_rate": 0.0002121088133352841, + "loss": 0.0147, "step": 116140 }, { - "epoch": 1.26, - "learning_rate": 0.00011165272102224815, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.0002121012456422701, + "loss": 0.0129, "step": 116150 }, { - "epoch": 1.26, - "learning_rate": 0.00011163650515664526, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.0002120936779492561, + "loss": 0.0127, "step": 116160 }, { - "epoch": 1.26, - "learning_rate": 0.00011162028929104234, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021208611025624207, + "loss": 0.015, "step": 116170 }, { - "epoch": 1.26, - "learning_rate": 0.00011160407342543945, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021207854256322808, + "loss": 0.0169, "step": 116180 }, { - "epoch": 1.26, - "learning_rate": 0.00011158785755983652, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.00021207097487021406, + "loss": 0.0161, "step": 116190 }, { - "epoch": 1.26, - "learning_rate": 0.00011157164169423363, - "loss": 0.0113, + "epoch": 0.59, + "learning_rate": 0.00021206340717720004, + "loss": 0.0145, "step": 116200 }, { - "epoch": 1.26, - "learning_rate": 0.00011155542582863072, - "loss": 0.0114, + "epoch": 0.59, + "learning_rate": 0.00021205583948418605, + "loss": 0.0162, "step": 116210 }, { - "epoch": 1.26, - "learning_rate": 0.00011153920996302782, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021204827179117203, + "loss": 0.0171, "step": 116220 }, { - "epoch": 1.26, - "learning_rate": 0.00011152299409742491, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021204070409815802, + "loss": 0.0155, "step": 116230 }, { - "epoch": 1.26, - "learning_rate": 0.000111506778231822, - "loss": 0.0051, + "epoch": 0.59, + "learning_rate": 0.00021203313640514402, + "loss": 0.0171, "step": 116240 }, { - "epoch": 1.26, - "learning_rate": 0.0001114905623662191, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021202556871213, + "loss": 0.0133, "step": 116250 }, { - "epoch": 1.26, - "learning_rate": 0.0001114743465006162, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.000212018001019116, + "loss": 0.0139, "step": 116260 }, { - "epoch": 1.26, - "learning_rate": 0.00011145813063501328, - "loss": 0.0127, + "epoch": 0.59, + "learning_rate": 0.00021201043332610194, + "loss": 0.0144, "step": 116270 }, { - "epoch": 1.26, - "learning_rate": 0.00011144191476941039, - "loss": 0.0162, + "epoch": 0.59, + "learning_rate": 0.00021200286563308795, + "loss": 0.0149, "step": 116280 }, { - "epoch": 1.26, - "learning_rate": 0.00011142569890380747, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021199529794007393, + "loss": 0.013, "step": 116290 }, { - "epoch": 1.26, - "learning_rate": 0.00011140948303820457, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.0002119877302470599, + "loss": 0.0139, "step": 116300 }, { - "epoch": 1.26, - "learning_rate": 0.00011139326717260165, - "loss": 0.0097, + "epoch": 0.59, + "learning_rate": 0.0002119801625540459, + "loss": 0.0122, "step": 116310 }, { - "epoch": 1.26, - "learning_rate": 0.00011137705130699876, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.0002119725948610319, + "loss": 0.0149, "step": 116320 }, { - "epoch": 1.26, - "learning_rate": 0.00011136083544139585, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021196502716801788, + "loss": 0.015, "step": 116330 }, { - "epoch": 1.26, - "learning_rate": 0.00011134461957579294, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021195745947500387, + "loss": 0.014, "step": 116340 }, { - "epoch": 1.26, - "learning_rate": 0.00011132840371019004, - "loss": 0.0099, + "epoch": 0.59, + "learning_rate": 0.00021194989178198987, + "loss": 0.0161, "step": 116350 }, { - "epoch": 1.26, - "learning_rate": 0.00011131218784458714, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021194232408897586, + "loss": 0.0161, "step": 116360 }, { - "epoch": 1.26, - "learning_rate": 0.00011129597197898422, - "loss": 0.0073, + "epoch": 0.59, + "learning_rate": 0.00021193475639596184, + "loss": 0.0153, "step": 116370 }, { - "epoch": 1.26, - "learning_rate": 0.00011127975611338133, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021192718870294785, + "loss": 0.0137, "step": 116380 }, { - "epoch": 1.26, - "learning_rate": 0.0001112635402477784, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.00021191962100993383, + "loss": 0.0154, "step": 116390 }, { - "epoch": 1.26, - "learning_rate": 0.00011124732438217551, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.0002119120533169198, + "loss": 0.0126, "step": 116400 }, { - "epoch": 1.26, - "learning_rate": 0.00011123110851657259, - "loss": 0.0074, + "epoch": 0.59, + "learning_rate": 0.00021190448562390582, + "loss": 0.014, "step": 116410 }, { - "epoch": 1.26, - "learning_rate": 0.0001112148926509697, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.0002118969179308918, + "loss": 0.0166, "step": 116420 }, { - "epoch": 1.26, - "learning_rate": 0.00011119867678536679, - "loss": 0.0106, + "epoch": 0.59, + "learning_rate": 0.00021188935023787778, + "loss": 0.0128, "step": 116430 }, { - "epoch": 1.26, - "learning_rate": 0.00011118246091976388, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.0002118817825448638, + "loss": 0.0144, "step": 116440 }, { - "epoch": 1.26, - "learning_rate": 0.00011116624505416098, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.00021187421485184977, + "loss": 0.0169, "step": 116450 }, { - "epoch": 1.26, - "learning_rate": 0.00011115002918855808, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.00021186664715883575, + "loss": 0.0134, "step": 116460 }, { - "epoch": 1.26, - "learning_rate": 0.00011113381332295516, - "loss": 0.0074, + "epoch": 0.59, + "learning_rate": 0.00021185907946582176, + "loss": 0.0123, "step": 116470 }, { - "epoch": 1.26, - "learning_rate": 0.00011111759745735227, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021185151177280774, + "loss": 0.0149, "step": 116480 }, { - "epoch": 1.26, - "learning_rate": 0.00011110138159174935, - "loss": 0.0076, + "epoch": 0.59, + "learning_rate": 0.00021184394407979372, + "loss": 0.0131, "step": 116490 }, { - "epoch": 1.26, - "learning_rate": 0.00011108516572614645, - "loss": 0.0106, + "epoch": 0.59, + "learning_rate": 0.0002118363763867797, + "loss": 0.0142, "step": 116500 }, { - "epoch": 1.26, - "learning_rate": 0.00011106894986054353, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.0002118288086937657, + "loss": 0.015, "step": 116510 }, { - "epoch": 1.26, - "learning_rate": 0.00011105273399494064, - "loss": 0.0078, + "epoch": 0.59, + "learning_rate": 0.0002118212410007517, + "loss": 0.0177, "step": 116520 }, { - "epoch": 1.26, - "learning_rate": 0.00011103651812933775, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.00021181367330773768, + "loss": 0.0133, "step": 116530 }, { - "epoch": 1.26, - "learning_rate": 0.00011102030226373482, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.00021180610561472368, + "loss": 0.0179, "step": 116540 }, { - "epoch": 1.26, - "learning_rate": 0.00011100408639813193, - "loss": 0.0106, + "epoch": 0.59, + "learning_rate": 0.00021179853792170967, + "loss": 0.0136, "step": 116550 }, { - "epoch": 1.26, - "learning_rate": 0.00011098787053252901, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021179097022869565, + "loss": 0.0138, "step": 116560 }, { - "epoch": 1.26, - "learning_rate": 0.00011097165466692612, - "loss": 0.0113, + "epoch": 0.59, + "learning_rate": 0.00021178340253568166, + "loss": 0.0141, "step": 116570 }, { - "epoch": 1.26, - "learning_rate": 0.00011095543880132321, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.00021177583484266764, + "loss": 0.0142, "step": 116580 }, { - "epoch": 1.26, - "learning_rate": 0.0001109392229357203, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.00021176826714965362, + "loss": 0.013, "step": 116590 }, { - "epoch": 1.26, - "learning_rate": 0.0001109230070701174, - "loss": 0.0117, + "epoch": 0.59, + "learning_rate": 0.00021176069945663963, + "loss": 0.0142, "step": 116600 }, { - "epoch": 1.26, - "learning_rate": 0.0001109067912045145, - "loss": 0.0112, + "epoch": 0.59, + "learning_rate": 0.0002117531317636256, + "loss": 0.0128, "step": 116610 }, { - "epoch": 1.26, - "learning_rate": 0.00011089057533891158, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.0002117455640706116, + "loss": 0.0121, "step": 116620 }, { - "epoch": 1.26, - "learning_rate": 0.00011087435947330869, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.0002117379963775976, + "loss": 0.0155, "step": 116630 }, { - "epoch": 1.26, - "learning_rate": 0.00011085814360770577, - "loss": 0.012, + "epoch": 0.59, + "learning_rate": 0.00021173042868458358, + "loss": 0.014, "step": 116640 }, { - "epoch": 1.26, - "learning_rate": 0.00011084192774210287, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021172286099156956, + "loss": 0.0132, "step": 116650 }, { - "epoch": 1.26, - "learning_rate": 0.00011082571187649995, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.00021171529329855554, + "loss": 0.0128, "step": 116660 }, { - "epoch": 1.26, - "learning_rate": 0.00011080949601089706, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.00021170772560554155, + "loss": 0.0166, "step": 116670 }, { - "epoch": 1.26, - "learning_rate": 0.00011079328014529415, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.00021170015791252753, + "loss": 0.0124, "step": 116680 }, { - "epoch": 1.26, - "learning_rate": 0.00011077706427969124, - "loss": 0.0081, + "epoch": 0.59, + "learning_rate": 0.00021169259021951351, + "loss": 0.0136, "step": 116690 }, { - "epoch": 1.26, - "learning_rate": 0.00011076084841408834, - "loss": 0.0102, + "epoch": 0.59, + "learning_rate": 0.00021168502252649952, + "loss": 0.012, "step": 116700 }, { - "epoch": 1.26, - "learning_rate": 0.00011074463254848543, - "loss": 0.0097, + "epoch": 0.59, + "learning_rate": 0.0002116774548334855, + "loss": 0.0143, "step": 116710 }, { - "epoch": 1.26, - "learning_rate": 0.00011072841668288252, - "loss": 0.0108, + "epoch": 0.59, + "learning_rate": 0.00021166988714047149, + "loss": 0.0139, "step": 116720 }, { - "epoch": 1.26, - "learning_rate": 0.00011071220081727963, - "loss": 0.0119, + "epoch": 0.59, + "learning_rate": 0.0002116623194474575, + "loss": 0.014, "step": 116730 }, { - "epoch": 1.26, - "learning_rate": 0.00011069598495167671, - "loss": 0.0154, + "epoch": 0.59, + "learning_rate": 0.00021165475175444348, + "loss": 0.0128, "step": 116740 }, { - "epoch": 1.26, - "learning_rate": 0.00011067976908607381, - "loss": 0.0102, + "epoch": 0.59, + "learning_rate": 0.00021164718406142946, + "loss": 0.0136, "step": 116750 }, { - "epoch": 1.26, - "learning_rate": 0.00011066355322047089, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.00021163961636841547, + "loss": 0.0155, "step": 116760 }, { - "epoch": 1.26, - "learning_rate": 0.000110647337354868, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021163204867540145, + "loss": 0.0214, "step": 116770 }, { - "epoch": 1.26, - "learning_rate": 0.00011063112148926508, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021162448098238743, + "loss": 0.013, "step": 116780 }, { - "epoch": 1.26, - "learning_rate": 0.00011061490562366218, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021161691328937344, + "loss": 0.016, "step": 116790 }, { - "epoch": 1.26, - "learning_rate": 0.00011059868975805928, - "loss": 0.0123, + "epoch": 0.59, + "learning_rate": 0.00021160934559635942, + "loss": 0.0156, "step": 116800 }, { - "epoch": 1.26, - "learning_rate": 0.00011058247389245637, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.0002116017779033454, + "loss": 0.0171, "step": 116810 }, { - "epoch": 1.26, - "learning_rate": 0.00011056625802685346, - "loss": 0.0107, + "epoch": 0.59, + "learning_rate": 0.00021159421021033138, + "loss": 0.0151, "step": 116820 }, { - "epoch": 1.26, - "learning_rate": 0.00011055004216125057, - "loss": 0.0121, + "epoch": 0.59, + "learning_rate": 0.0002115866425173174, + "loss": 0.013, "step": 116830 }, { - "epoch": 1.26, - "learning_rate": 0.00011053382629564765, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.00021157907482430337, + "loss": 0.0132, "step": 116840 }, { - "epoch": 1.26, - "learning_rate": 0.00011051761043004475, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021157150713128935, + "loss": 0.0106, "step": 116850 }, { - "epoch": 1.26, - "learning_rate": 0.00011050139456444183, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021156393943827536, + "loss": 0.014, "step": 116860 }, { - "epoch": 1.26, - "learning_rate": 0.00011048517869883894, - "loss": 0.0097, + "epoch": 0.59, + "learning_rate": 0.00021155637174526134, + "loss": 0.0123, "step": 116870 }, { - "epoch": 1.26, - "learning_rate": 0.00011046896283323602, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021154880405224732, + "loss": 0.0143, "step": 116880 }, { - "epoch": 1.26, - "learning_rate": 0.00011045274696763313, - "loss": 0.0127, + "epoch": 0.59, + "learning_rate": 0.00021154123635923333, + "loss": 0.0156, "step": 116890 }, { - "epoch": 1.26, - "learning_rate": 0.00011043653110203022, - "loss": 0.0114, + "epoch": 0.59, + "learning_rate": 0.00021153366866621931, + "loss": 0.0136, "step": 116900 }, { - "epoch": 1.26, - "learning_rate": 0.00011042031523642731, - "loss": 0.008, + "epoch": 0.59, + "learning_rate": 0.0002115261009732053, + "loss": 0.0118, "step": 116910 }, { - "epoch": 1.26, - "learning_rate": 0.0001104040993708244, - "loss": 0.0097, + "epoch": 0.59, + "learning_rate": 0.0002115185332801913, + "loss": 0.0154, "step": 116920 }, { - "epoch": 1.26, - "learning_rate": 0.0001103878835052215, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021151096558717729, + "loss": 0.0148, "step": 116930 }, { - "epoch": 1.26, - "learning_rate": 0.00011037166763961859, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021150339789416327, + "loss": 0.0103, "step": 116940 }, { - "epoch": 1.26, - "learning_rate": 0.0001103554517740157, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.00021149583020114928, + "loss": 0.0173, "step": 116950 }, { - "epoch": 1.26, - "learning_rate": 0.00011033923590841277, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021148826250813526, + "loss": 0.0185, "step": 116960 }, { - "epoch": 1.26, - "learning_rate": 0.00011032302004280988, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021148069481512124, + "loss": 0.0136, "step": 116970 }, { - "epoch": 1.26, - "learning_rate": 0.00011030680417720696, - "loss": 0.0067, + "epoch": 0.59, + "learning_rate": 0.00021147312712210725, + "loss": 0.017, "step": 116980 }, { - "epoch": 1.26, - "learning_rate": 0.00011029058831160407, - "loss": 0.0111, + "epoch": 0.59, + "learning_rate": 0.00021146555942909323, + "loss": 0.0213, "step": 116990 }, { - "epoch": 1.26, - "learning_rate": 0.00011027437244600116, - "loss": 0.0118, + "epoch": 0.59, + "learning_rate": 0.0002114579917360792, + "loss": 0.0164, "step": 117000 }, { - "epoch": 1.26, - "eval_cer": 0.9215373577445508, - "eval_loss": 0.007613795343786478, - "eval_runtime": 121.1129, - "eval_samples_per_second": 16.514, - "eval_steps_per_second": 4.128, + "epoch": 0.59, + "eval_cer": 0.9145207165016832, + "eval_loss": 0.01061397697776556, + "eval_runtime": 116.746, + "eval_samples_per_second": 17.131, + "eval_steps_per_second": 4.283, "step": 117000 }, { - "epoch": 1.26, - "learning_rate": 0.00011025815658039825, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.0002114504240430652, + "loss": 0.0129, "step": 117010 }, { - "epoch": 1.27, - "learning_rate": 0.00011024194071479534, - "loss": 0.011, + "epoch": 0.59, + "learning_rate": 0.0002114428563500512, + "loss": 0.0133, "step": 117020 }, { - "epoch": 1.27, - "learning_rate": 0.00011022572484919244, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021143528865703718, + "loss": 0.0135, "step": 117030 }, { - "epoch": 1.27, - "learning_rate": 0.00011020950898358953, - "loss": 0.013, + "epoch": 0.59, + "learning_rate": 0.00021142772096402316, + "loss": 0.0175, "step": 117040 }, { - "epoch": 1.27, - "learning_rate": 0.00011019329311798664, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.00021142015327100917, + "loss": 0.0157, "step": 117050 }, { - "epoch": 1.27, - "learning_rate": 0.00011017707725238372, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021141258557799515, + "loss": 0.0138, "step": 117060 }, { - "epoch": 1.27, - "learning_rate": 0.00011016086138678082, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.00021140501788498113, + "loss": 0.0155, "step": 117070 }, { - "epoch": 1.27, - "learning_rate": 0.0001101446455211779, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021139745019196714, + "loss": 0.0141, "step": 117080 }, { - "epoch": 1.27, - "learning_rate": 0.00011012842965557501, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021138988249895312, + "loss": 0.0133, "step": 117090 }, { - "epoch": 1.27, - "learning_rate": 0.00011011221378997209, - "loss": 0.0076, + "epoch": 0.59, + "learning_rate": 0.0002113823148059391, + "loss": 0.0151, "step": 117100 }, { - "epoch": 1.27, - "learning_rate": 0.00011009599792436919, - "loss": 0.0108, + "epoch": 0.59, + "learning_rate": 0.00021137474711292511, + "loss": 0.0157, "step": 117110 }, { - "epoch": 1.27, - "learning_rate": 0.00011007978205876629, - "loss": 0.0106, + "epoch": 0.59, + "learning_rate": 0.0002113671794199111, + "loss": 0.0164, "step": 117120 }, { - "epoch": 1.27, - "learning_rate": 0.00011006356619316338, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021135961172689708, + "loss": 0.016, "step": 117130 }, { - "epoch": 1.27, - "learning_rate": 0.00011004735032756047, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021135204403388309, + "loss": 0.0148, "step": 117140 }, { - "epoch": 1.27, - "learning_rate": 0.00011003113446195758, - "loss": 0.0078, + "epoch": 0.59, + "learning_rate": 0.00021134447634086907, + "loss": 0.0135, "step": 117150 }, { - "epoch": 1.27, - "learning_rate": 0.00011001491859635466, - "loss": 0.0074, + "epoch": 0.59, + "learning_rate": 0.00021133690864785505, + "loss": 0.0131, "step": 117160 }, { - "epoch": 1.27, - "learning_rate": 0.00010999870273075176, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021132934095484103, + "loss": 0.0162, "step": 117170 }, { - "epoch": 1.27, - "learning_rate": 0.00010998248686514884, - "loss": 0.008, + "epoch": 0.59, + "learning_rate": 0.00021132177326182704, + "loss": 0.0168, "step": 117180 }, { - "epoch": 1.27, - "learning_rate": 0.00010996627099954595, - "loss": 0.011, + "epoch": 0.59, + "learning_rate": 0.00021131420556881302, + "loss": 0.0176, "step": 117190 }, { - "epoch": 1.27, - "learning_rate": 0.00010995005513394303, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.000211306637875799, + "loss": 0.0166, "step": 117200 }, { - "epoch": 1.27, - "learning_rate": 0.00010993383926834013, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.000211299070182785, + "loss": 0.0153, "step": 117210 }, { - "epoch": 1.27, - "learning_rate": 0.00010991762340273723, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.000211291502489771, + "loss": 0.0149, "step": 117220 }, { - "epoch": 1.27, - "learning_rate": 0.00010990140753713432, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021128393479675697, + "loss": 0.0152, "step": 117230 }, { - "epoch": 1.27, - "learning_rate": 0.00010988519167153141, - "loss": 0.0081, + "epoch": 0.59, + "learning_rate": 0.00021127636710374298, + "loss": 0.0146, "step": 117240 }, { - "epoch": 1.27, - "learning_rate": 0.0001098689758059285, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021126879941072896, + "loss": 0.0129, "step": 117250 }, { - "epoch": 1.27, - "learning_rate": 0.00010985275994032561, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.00021126123171771494, + "loss": 0.0137, "step": 117260 }, { - "epoch": 1.27, - "learning_rate": 0.0001098365440747227, - "loss": 0.0106, + "epoch": 0.59, + "learning_rate": 0.00021125366402470095, + "loss": 0.013, "step": 117270 }, { - "epoch": 1.27, - "learning_rate": 0.0001098203282091198, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.00021124609633168693, + "loss": 0.0134, "step": 117280 }, { - "epoch": 1.27, - "learning_rate": 0.00010980411234351689, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021123852863867292, + "loss": 0.0115, "step": 117290 }, { - "epoch": 1.27, - "learning_rate": 0.000109787896477914, - "loss": 0.0102, + "epoch": 0.59, + "learning_rate": 0.00021123096094565892, + "loss": 0.0174, "step": 117300 }, { - "epoch": 1.27, - "learning_rate": 0.00010977168061231107, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.0002112233932526449, + "loss": 0.0155, "step": 117310 }, { - "epoch": 1.27, - "learning_rate": 0.00010975546474670818, - "loss": 0.0111, + "epoch": 0.59, + "learning_rate": 0.0002112158255596309, + "loss": 0.0114, "step": 117320 }, { - "epoch": 1.27, - "learning_rate": 0.00010973924888110526, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.00021120825786661687, + "loss": 0.0146, "step": 117330 }, { - "epoch": 1.27, - "learning_rate": 0.00010972303301550237, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021120069017360288, + "loss": 0.0154, "step": 117340 }, { - "epoch": 1.27, - "learning_rate": 0.00010970681714989945, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021119312248058886, + "loss": 0.0151, "step": 117350 }, { - "epoch": 1.27, - "learning_rate": 0.00010969060128429655, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021118555478757484, + "loss": 0.0113, "step": 117360 }, { - "epoch": 1.27, - "learning_rate": 0.00010967438541869364, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021117798709456085, + "loss": 0.0131, "step": 117370 }, { - "epoch": 1.27, - "learning_rate": 0.00010965816955309074, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.00021117041940154683, + "loss": 0.0129, "step": 117380 }, { - "epoch": 1.27, - "learning_rate": 0.00010964195368748783, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.0002111628517085328, + "loss": 0.0139, "step": 117390 }, { - "epoch": 1.27, - "learning_rate": 0.00010962573782188492, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021115528401551882, + "loss": 0.0163, "step": 117400 }, { - "epoch": 1.27, - "learning_rate": 0.00010960952195628202, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.0002111477163225048, + "loss": 0.016, "step": 117410 }, { - "epoch": 1.27, - "learning_rate": 0.00010959330609067912, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021114014862949078, + "loss": 0.018, "step": 117420 }, { - "epoch": 1.27, - "learning_rate": 0.0001095770902250762, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.0002111325809364768, + "loss": 0.0146, "step": 117430 }, { - "epoch": 1.27, - "learning_rate": 0.00010956087435947331, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021112501324346277, + "loss": 0.0153, "step": 117440 }, { - "epoch": 1.27, - "learning_rate": 0.00010954465849387039, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021111744555044875, + "loss": 0.0147, "step": 117450 }, { - "epoch": 1.27, - "learning_rate": 0.00010952844262826749, - "loss": 0.0099, + "epoch": 0.59, + "learning_rate": 0.00021110987785743476, + "loss": 0.0149, "step": 117460 }, { - "epoch": 1.27, - "learning_rate": 0.00010951222676266459, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021110231016442074, + "loss": 0.0228, "step": 117470 }, { - "epoch": 1.27, - "learning_rate": 0.00010949601089706168, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021109474247140673, + "loss": 0.0154, "step": 117480 }, { - "epoch": 1.27, - "learning_rate": 0.00010947979503145877, - "loss": 0.0111, + "epoch": 0.59, + "learning_rate": 0.0002110871747783927, + "loss": 0.0123, "step": 117490 }, { - "epoch": 1.27, - "learning_rate": 0.00010946357916585586, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.00021107960708537872, + "loss": 0.0124, "step": 117500 }, { - "epoch": 1.27, - "learning_rate": 0.00010944736330025296, - "loss": 0.0123, + "epoch": 0.59, + "learning_rate": 0.0002110720393923647, + "loss": 0.0125, "step": 117510 }, { - "epoch": 1.27, - "learning_rate": 0.00010943114743465006, - "loss": 0.0107, + "epoch": 0.59, + "learning_rate": 0.00021106447169935065, + "loss": 0.0151, "step": 117520 }, { - "epoch": 1.27, - "learning_rate": 0.00010941493156904714, - "loss": 0.0081, + "epoch": 0.59, + "learning_rate": 0.00021105690400633666, + "loss": 0.0168, "step": 117530 }, { - "epoch": 1.27, - "learning_rate": 0.00010939871570344425, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.00021104933631332264, + "loss": 0.0157, "step": 117540 }, { - "epoch": 1.27, - "learning_rate": 0.00010938249983784133, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.00021104176862030862, + "loss": 0.0147, "step": 117550 }, { - "epoch": 1.27, - "learning_rate": 0.00010936628397223843, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.0002110342009272946, + "loss": 0.0121, "step": 117560 }, { - "epoch": 1.27, - "learning_rate": 0.00010935006810663551, - "loss": 0.012, + "epoch": 0.59, + "learning_rate": 0.0002110266332342806, + "loss": 0.0139, "step": 117570 }, { - "epoch": 1.27, - "learning_rate": 0.00010933385224103262, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.0002110190655412666, + "loss": 0.0167, "step": 117580 }, { - "epoch": 1.27, - "learning_rate": 0.00010931763637542971, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.00021101149784825258, + "loss": 0.0138, "step": 117590 }, { - "epoch": 1.27, - "learning_rate": 0.0001093014205098268, - "loss": 0.0102, + "epoch": 0.59, + "learning_rate": 0.00021100393015523858, + "loss": 0.0147, "step": 117600 }, { - "epoch": 1.27, - "learning_rate": 0.0001092852046442239, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.00021099636246222457, + "loss": 0.0164, "step": 117610 }, { - "epoch": 1.27, - "learning_rate": 0.000109268988778621, - "loss": 0.0099, + "epoch": 0.59, + "learning_rate": 0.00021098879476921055, + "loss": 0.0148, "step": 117620 }, { - "epoch": 1.27, - "learning_rate": 0.00010925277291301808, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021098122707619656, + "loss": 0.0139, "step": 117630 }, { - "epoch": 1.27, - "learning_rate": 0.00010923655704741519, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.00021097365938318254, + "loss": 0.0129, "step": 117640 }, { - "epoch": 1.27, - "learning_rate": 0.00010922034118181227, - "loss": 0.0119, + "epoch": 0.59, + "learning_rate": 0.00021096609169016852, + "loss": 0.0179, "step": 117650 }, { - "epoch": 1.27, - "learning_rate": 0.00010920412531620937, - "loss": 0.008, + "epoch": 0.59, + "learning_rate": 0.00021095852399715453, + "loss": 0.0141, "step": 117660 }, { - "epoch": 1.27, - "learning_rate": 0.00010918790945060645, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.0002109509563041405, + "loss": 0.0157, "step": 117670 }, { - "epoch": 1.27, - "learning_rate": 0.00010917169358500356, - "loss": 0.0117, + "epoch": 0.59, + "learning_rate": 0.0002109433886111265, + "loss": 0.0187, "step": 117680 }, { - "epoch": 1.27, - "learning_rate": 0.00010915547771940065, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.0002109358209181125, + "loss": 0.012, "step": 117690 }, { - "epoch": 1.27, - "learning_rate": 0.00010913926185379775, - "loss": 0.0107, + "epoch": 0.59, + "learning_rate": 0.00021092825322509848, + "loss": 0.0166, "step": 117700 }, { - "epoch": 1.27, - "learning_rate": 0.00010912304598819484, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.00021092068553208446, + "loss": 0.0137, "step": 117710 }, { - "epoch": 1.27, - "learning_rate": 0.00010910683012259193, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021091311783907044, + "loss": 0.0173, "step": 117720 }, { - "epoch": 1.27, - "learning_rate": 0.00010909061425698902, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.00021090555014605645, + "loss": 0.0204, "step": 117730 }, { - "epoch": 1.27, - "learning_rate": 0.00010907439839138613, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.00021089798245304243, + "loss": 0.0173, "step": 117740 }, { - "epoch": 1.27, - "learning_rate": 0.00010905818252578321, - "loss": 0.0078, + "epoch": 0.59, + "learning_rate": 0.00021089041476002841, + "loss": 0.0138, "step": 117750 }, { - "epoch": 1.27, - "learning_rate": 0.00010904196666018032, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.00021088284706701442, + "loss": 0.0163, "step": 117760 }, { - "epoch": 1.27, - "learning_rate": 0.0001090257507945774, - "loss": 0.0106, + "epoch": 0.59, + "learning_rate": 0.0002108752793740004, + "loss": 0.0114, "step": 117770 }, { - "epoch": 1.27, - "learning_rate": 0.0001090095349289745, - "loss": 0.0074, + "epoch": 0.59, + "learning_rate": 0.00021086771168098639, + "loss": 0.0162, "step": 117780 }, { - "epoch": 1.27, - "learning_rate": 0.00010899331906337158, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.0002108601439879724, + "loss": 0.0134, "step": 117790 }, { - "epoch": 1.27, - "learning_rate": 0.00010897710319776869, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.00021085257629495838, + "loss": 0.0261, "step": 117800 }, { - "epoch": 1.27, - "learning_rate": 0.00010896088733216578, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.00021084500860194436, + "loss": 0.0144, "step": 117810 }, { - "epoch": 1.27, - "learning_rate": 0.00010894467146656287, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021083744090893037, + "loss": 0.0159, "step": 117820 }, { - "epoch": 1.27, - "learning_rate": 0.00010892845560095997, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021082987321591635, + "loss": 0.0143, "step": 117830 }, { - "epoch": 1.27, - "learning_rate": 0.00010891223973535707, - "loss": 0.0099, + "epoch": 0.59, + "learning_rate": 0.00021082230552290233, + "loss": 0.0158, "step": 117840 }, { - "epoch": 1.27, - "learning_rate": 0.00010889602386975415, - "loss": 0.0109, + "epoch": 0.59, + "learning_rate": 0.00021081473782988834, + "loss": 0.018, "step": 117850 }, { - "epoch": 1.27, - "learning_rate": 0.00010887980800415126, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021080717013687432, + "loss": 0.0162, "step": 117860 }, { - "epoch": 1.27, - "learning_rate": 0.00010886359213854834, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.0002107996024438603, + "loss": 0.0135, "step": 117870 }, { - "epoch": 1.27, - "learning_rate": 0.00010884737627294544, - "loss": 0.0102, + "epoch": 0.59, + "learning_rate": 0.00021079203475084628, + "loss": 0.0147, "step": 117880 }, { - "epoch": 1.27, - "learning_rate": 0.00010883116040734252, - "loss": 0.0099, + "epoch": 0.59, + "learning_rate": 0.0002107844670578323, + "loss": 0.0208, "step": 117890 }, { - "epoch": 1.27, - "learning_rate": 0.00010881494454173963, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.00021077689936481827, + "loss": 0.0149, "step": 117900 }, { - "epoch": 1.27, - "learning_rate": 0.00010879872867613672, - "loss": 0.0072, + "epoch": 0.59, + "learning_rate": 0.00021076933167180425, + "loss": 0.0127, "step": 117910 }, { - "epoch": 1.27, - "learning_rate": 0.00010878251281053381, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021076176397879026, + "loss": 0.0122, "step": 117920 }, { - "epoch": 1.27, - "learning_rate": 0.0001087662969449309, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021075419628577624, + "loss": 0.0154, "step": 117930 }, { - "epoch": 1.27, - "learning_rate": 0.000108750081079328, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00021074662859276222, + "loss": 0.0141, "step": 117940 }, { - "epoch": 1.28, - "learning_rate": 0.00010873386521372509, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00021073906089974823, + "loss": 0.0142, "step": 117950 }, { - "epoch": 1.28, - "learning_rate": 0.0001087176493481222, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00021073149320673421, + "loss": 0.0141, "step": 117960 }, { - "epoch": 1.28, - "learning_rate": 0.00010870143348251929, - "loss": 0.0069, + "epoch": 0.6, + "learning_rate": 0.0002107239255137202, + "loss": 0.0135, "step": 117970 }, { - "epoch": 1.28, - "learning_rate": 0.00010868521761691638, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.0002107163578207062, + "loss": 0.0156, "step": 117980 }, { - "epoch": 1.28, - "learning_rate": 0.00010866900175131349, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00021070879012769219, + "loss": 0.0186, "step": 117990 }, { - "epoch": 1.28, - "learning_rate": 0.00010865278588571057, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00021070122243467817, + "loss": 0.0162, "step": 118000 }, { - "epoch": 1.28, - "eval_cer": 0.9215364891415945, - "eval_loss": 0.00760659808292985, - "eval_runtime": 121.2431, - "eval_samples_per_second": 16.496, - "eval_steps_per_second": 4.124, + "epoch": 0.6, + "eval_cer": 0.9144702559031622, + "eval_loss": 0.011005792766809464, + "eval_runtime": 116.812, + "eval_samples_per_second": 17.122, + "eval_steps_per_second": 4.28, "step": 118000 }, { - "epoch": 1.28, - "learning_rate": 0.00010863657002010768, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.00021069365474166418, + "loss": 0.0166, "step": 118010 }, { - "epoch": 1.28, - "learning_rate": 0.00010862035415450475, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00021068608704865016, + "loss": 0.018, "step": 118020 }, { - "epoch": 1.28, - "learning_rate": 0.00010860413828890186, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00021067851935563614, + "loss": 0.0176, "step": 118030 }, { - "epoch": 1.28, - "learning_rate": 0.00010858792242329894, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00021067095166262215, + "loss": 0.015, "step": 118040 }, { - "epoch": 1.28, - "learning_rate": 0.00010857170655769605, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00021066338396960813, + "loss": 0.0209, "step": 118050 }, { - "epoch": 1.28, - "learning_rate": 0.00010855549069209314, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.0002106558162765941, + "loss": 0.0169, "step": 118060 }, { - "epoch": 1.28, - "learning_rate": 0.00010853927482649023, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.0002106482485835801, + "loss": 0.0283, "step": 118070 }, { - "epoch": 1.28, - "learning_rate": 0.00010852305896088732, - "loss": 0.0084, + "epoch": 0.6, + "learning_rate": 0.0002106406808905661, + "loss": 0.0113, "step": 118080 }, { - "epoch": 1.28, - "learning_rate": 0.00010850684309528442, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00021063311319755208, + "loss": 0.0216, "step": 118090 }, { - "epoch": 1.28, - "learning_rate": 0.00010849062722968151, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00021062554550453806, + "loss": 0.0129, "step": 118100 }, { - "epoch": 1.28, - "learning_rate": 0.00010847441136407862, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00021061797781152407, + "loss": 0.0196, "step": 118110 }, { - "epoch": 1.28, - "learning_rate": 0.0001084581954984757, - "loss": 0.0103, + "epoch": 0.6, + "learning_rate": 0.00021061041011851005, + "loss": 0.0197, "step": 118120 }, { - "epoch": 1.28, - "learning_rate": 0.0001084419796328728, - "loss": 0.0093, + "epoch": 0.6, + "learning_rate": 0.00021060284242549603, + "loss": 0.0173, "step": 118130 }, { - "epoch": 1.28, - "learning_rate": 0.00010842576376726988, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00021059527473248204, + "loss": 0.015, "step": 118140 }, { - "epoch": 1.28, - "learning_rate": 0.00010840954790166699, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00021058770703946802, + "loss": 0.0151, "step": 118150 }, { - "epoch": 1.28, - "learning_rate": 0.00010839333203606408, - "loss": 0.0073, + "epoch": 0.6, + "learning_rate": 0.000210580139346454, + "loss": 0.0157, "step": 118160 }, { - "epoch": 1.28, - "learning_rate": 0.00010837711617046117, - "loss": 0.0093, + "epoch": 0.6, + "learning_rate": 0.00021057257165344001, + "loss": 0.0123, "step": 118170 }, { - "epoch": 1.28, - "learning_rate": 0.00010836090030485827, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.000210565003960426, + "loss": 0.0149, "step": 118180 }, { - "epoch": 1.28, - "learning_rate": 0.00010834468443925536, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00021055743626741198, + "loss": 0.0152, "step": 118190 }, { - "epoch": 1.28, - "learning_rate": 0.00010832846857365245, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00021054986857439799, + "loss": 0.0126, "step": 118200 }, { - "epoch": 1.28, - "learning_rate": 0.00010831225270804956, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00021054230088138397, + "loss": 0.0138, "step": 118210 }, { - "epoch": 1.28, - "learning_rate": 0.00010829603684244664, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00021053473318836995, + "loss": 0.0186, "step": 118220 }, { - "epoch": 1.28, - "learning_rate": 0.00010827982097684374, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.00021052716549535593, + "loss": 0.0178, "step": 118230 }, { - "epoch": 1.28, - "learning_rate": 0.00010826360511124082, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00021051959780234194, + "loss": 0.0149, "step": 118240 }, { - "epoch": 1.28, - "learning_rate": 0.00010824738924563793, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00021051203010932792, + "loss": 0.0153, "step": 118250 }, { - "epoch": 1.28, - "learning_rate": 0.00010823117338003501, - "loss": 0.0079, + "epoch": 0.6, + "learning_rate": 0.0002105044624163139, + "loss": 0.0157, "step": 118260 }, { - "epoch": 1.28, - "learning_rate": 0.00010821495751443211, - "loss": 0.0105, + "epoch": 0.6, + "learning_rate": 0.0002104968947232999, + "loss": 0.0161, "step": 118270 }, { - "epoch": 1.28, - "learning_rate": 0.0001081987416488292, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.0002104893270302859, + "loss": 0.0169, "step": 118280 }, { - "epoch": 1.28, - "learning_rate": 0.0001081825257832263, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.00021048175933727187, + "loss": 0.0169, "step": 118290 }, { - "epoch": 1.28, - "learning_rate": 0.00010816630991762339, - "loss": 0.0071, + "epoch": 0.6, + "learning_rate": 0.00021047419164425788, + "loss": 0.0122, "step": 118300 }, { - "epoch": 1.28, - "learning_rate": 0.0001081500940520205, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00021046662395124386, + "loss": 0.0108, "step": 118310 }, { - "epoch": 1.28, - "learning_rate": 0.00010813387818641758, - "loss": 0.0104, + "epoch": 0.6, + "learning_rate": 0.00021045905625822984, + "loss": 0.0183, "step": 118320 }, { - "epoch": 1.28, - "learning_rate": 0.00010811766232081468, - "loss": 0.0075, + "epoch": 0.6, + "learning_rate": 0.00021045148856521585, + "loss": 0.0128, "step": 118330 }, { - "epoch": 1.28, - "learning_rate": 0.00010810144645521176, - "loss": 0.0082, + "epoch": 0.6, + "learning_rate": 0.00021044392087220183, + "loss": 0.0144, "step": 118340 }, { - "epoch": 1.28, - "learning_rate": 0.00010808523058960887, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00021043635317918782, + "loss": 0.0143, "step": 118350 }, { - "epoch": 1.28, - "learning_rate": 0.00010806901472400595, - "loss": 0.0095, + "epoch": 0.6, + "learning_rate": 0.00021042878548617382, + "loss": 0.0145, "step": 118360 }, { - "epoch": 1.28, - "learning_rate": 0.00010805279885840305, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.0002104212177931598, + "loss": 0.0146, "step": 118370 }, { - "epoch": 1.28, - "learning_rate": 0.00010803658299280015, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.0002104136501001458, + "loss": 0.014, "step": 118380 }, { - "epoch": 1.28, - "learning_rate": 0.00010802036712719724, - "loss": 0.0095, + "epoch": 0.6, + "learning_rate": 0.00021040608240713177, + "loss": 0.0197, "step": 118390 }, { - "epoch": 1.28, - "learning_rate": 0.00010800415126159433, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.00021039851471411778, + "loss": 0.014, "step": 118400 }, { - "epoch": 1.28, - "learning_rate": 0.00010798793539599143, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00021039094702110376, + "loss": 0.0142, "step": 118410 }, { - "epoch": 1.28, - "learning_rate": 0.00010797171953038852, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00021038337932808974, + "loss": 0.0147, "step": 118420 }, { - "epoch": 1.28, - "learning_rate": 0.00010795550366478562, - "loss": 0.0076, + "epoch": 0.6, + "learning_rate": 0.00021037581163507575, + "loss": 0.0132, "step": 118430 }, { - "epoch": 1.28, - "learning_rate": 0.0001079392877991827, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00021036824394206173, + "loss": 0.0125, "step": 118440 }, { - "epoch": 1.28, - "learning_rate": 0.00010792307193357981, - "loss": 0.0082, + "epoch": 0.6, + "learning_rate": 0.0002103606762490477, + "loss": 0.0166, "step": 118450 }, { - "epoch": 1.28, - "learning_rate": 0.00010790685606797689, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00021035310855603372, + "loss": 0.0163, "step": 118460 }, { - "epoch": 1.28, - "learning_rate": 0.000107890640202374, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.0002103455408630197, + "loss": 0.0156, "step": 118470 }, { - "epoch": 1.28, - "learning_rate": 0.00010787442433677107, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00021033797317000568, + "loss": 0.0151, "step": 118480 }, { - "epoch": 1.28, - "learning_rate": 0.00010785820847116818, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.0002103304054769917, + "loss": 0.0129, "step": 118490 }, { - "epoch": 1.28, - "learning_rate": 0.00010784199260556527, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00021032283778397767, + "loss": 0.0152, "step": 118500 }, { - "epoch": 1.28, - "learning_rate": 0.00010782577673996237, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00021031527009096365, + "loss": 0.0148, "step": 118510 }, { - "epoch": 1.28, - "learning_rate": 0.00010780956087435946, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00021030770239794966, + "loss": 0.0142, "step": 118520 }, { - "epoch": 1.28, - "learning_rate": 0.00010779334500875657, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00021030013470493564, + "loss": 0.013, "step": 118530 }, { - "epoch": 1.28, - "learning_rate": 0.00010777712914315364, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00021029256701192163, + "loss": 0.018, "step": 118540 }, { - "epoch": 1.28, - "learning_rate": 0.00010776091327755075, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00021028499931890763, + "loss": 0.0146, "step": 118550 }, { - "epoch": 1.28, - "learning_rate": 0.00010774469741194783, - "loss": 0.0107, + "epoch": 0.6, + "learning_rate": 0.00021027743162589362, + "loss": 0.0125, "step": 118560 }, { - "epoch": 1.28, - "learning_rate": 0.00010772848154634494, - "loss": 0.0082, + "epoch": 0.6, + "learning_rate": 0.0002102698639328796, + "loss": 0.0145, "step": 118570 }, { - "epoch": 1.28, - "learning_rate": 0.00010771226568074202, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00021026229623986558, + "loss": 0.0133, "step": 118580 }, { - "epoch": 1.28, - "learning_rate": 0.00010769604981513912, - "loss": 0.011, + "epoch": 0.6, + "learning_rate": 0.0002102547285468516, + "loss": 0.0145, "step": 118590 }, { - "epoch": 1.28, - "learning_rate": 0.00010767983394953621, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00021024716085383757, + "loss": 0.0142, "step": 118600 }, { - "epoch": 1.28, - "learning_rate": 0.00010766361808393331, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00021023959316082355, + "loss": 0.0131, "step": 118610 }, { - "epoch": 1.28, - "learning_rate": 0.0001076474022183304, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.00021023202546780956, + "loss": 0.0132, "step": 118620 }, { - "epoch": 1.28, - "learning_rate": 0.0001076311863527275, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00021022445777479554, + "loss": 0.0149, "step": 118630 }, { - "epoch": 1.28, - "learning_rate": 0.00010761497048712459, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00021021689008178152, + "loss": 0.0152, "step": 118640 }, { - "epoch": 1.28, - "learning_rate": 0.00010759875462152169, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00021020932238876753, + "loss": 0.0163, "step": 118650 }, { - "epoch": 1.28, - "learning_rate": 0.00010758253875591877, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.0002102017546957535, + "loss": 0.016, "step": 118660 }, { - "epoch": 1.28, - "learning_rate": 0.00010756632289031588, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.0002101941870027395, + "loss": 0.016, "step": 118670 }, { - "epoch": 1.28, - "learning_rate": 0.00010755010702471296, - "loss": 0.0075, + "epoch": 0.6, + "learning_rate": 0.0002101866193097255, + "loss": 0.0181, "step": 118680 }, { - "epoch": 1.28, - "learning_rate": 0.00010753389115911006, - "loss": 0.0095, + "epoch": 0.6, + "learning_rate": 0.00021017905161671148, + "loss": 0.0159, "step": 118690 }, { - "epoch": 1.28, - "learning_rate": 0.00010751767529350717, - "loss": 0.0113, + "epoch": 0.6, + "learning_rate": 0.00021017148392369746, + "loss": 0.0128, "step": 118700 }, { - "epoch": 1.28, - "learning_rate": 0.00010750145942790425, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00021016391623068347, + "loss": 0.0137, "step": 118710 }, { - "epoch": 1.28, - "learning_rate": 0.00010748524356230135, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00021015634853766945, + "loss": 0.0132, "step": 118720 }, { - "epoch": 1.28, - "learning_rate": 0.00010746902769669843, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.00021014878084465544, + "loss": 0.0165, "step": 118730 }, { - "epoch": 1.28, - "learning_rate": 0.00010745281183109554, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00021014121315164142, + "loss": 0.0123, "step": 118740 }, { - "epoch": 1.28, - "learning_rate": 0.00010743659596549263, - "loss": 0.0074, + "epoch": 0.6, + "learning_rate": 0.00021013364545862743, + "loss": 0.0131, "step": 118750 }, { - "epoch": 1.28, - "learning_rate": 0.00010742038009988973, - "loss": 0.0078, + "epoch": 0.6, + "learning_rate": 0.0002101260777656134, + "loss": 0.0165, "step": 118760 }, { - "epoch": 1.28, - "learning_rate": 0.00010740416423428682, - "loss": 0.0112, + "epoch": 0.6, + "learning_rate": 0.0002101185100725994, + "loss": 0.0175, "step": 118770 }, { - "epoch": 1.28, - "learning_rate": 0.00010738794836868392, - "loss": 0.0105, + "epoch": 0.6, + "learning_rate": 0.00021011094237958534, + "loss": 0.0118, "step": 118780 }, { - "epoch": 1.28, - "learning_rate": 0.000107371732503081, - "loss": 0.0076, + "epoch": 0.6, + "learning_rate": 0.00021010337468657135, + "loss": 0.013, "step": 118790 }, { - "epoch": 1.28, - "learning_rate": 0.00010735551663747811, - "loss": 0.0118, + "epoch": 0.6, + "learning_rate": 0.00021009580699355733, + "loss": 0.0152, "step": 118800 }, { - "epoch": 1.28, - "learning_rate": 0.00010733930077187519, - "loss": 0.0107, + "epoch": 0.6, + "learning_rate": 0.00021008823930054331, + "loss": 0.0146, "step": 118810 }, { - "epoch": 1.28, - "learning_rate": 0.0001073230849062723, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00021008067160752932, + "loss": 0.0164, "step": 118820 }, { - "epoch": 1.28, - "learning_rate": 0.00010730686904066937, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.0002100731039145153, + "loss": 0.0172, "step": 118830 }, { - "epoch": 1.28, - "learning_rate": 0.00010729065317506648, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00021006553622150129, + "loss": 0.0176, "step": 118840 }, { - "epoch": 1.28, - "learning_rate": 0.00010727443730946357, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.0002100579685284873, + "loss": 0.0167, "step": 118850 }, { - "epoch": 1.28, - "learning_rate": 0.00010725822144386067, - "loss": 0.0101, + "epoch": 0.6, + "learning_rate": 0.00021005040083547328, + "loss": 0.0153, "step": 118860 }, { - "epoch": 1.29, - "learning_rate": 0.00010724200557825776, - "loss": 0.0115, + "epoch": 0.6, + "learning_rate": 0.00021004283314245926, + "loss": 0.0139, "step": 118870 }, { - "epoch": 1.29, - "learning_rate": 0.00010722578971265485, - "loss": 0.0111, + "epoch": 0.6, + "learning_rate": 0.00021003526544944527, + "loss": 0.0144, "step": 118880 }, { - "epoch": 1.29, - "learning_rate": 0.00010720957384705194, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00021002769775643125, + "loss": 0.0157, "step": 118890 }, { - "epoch": 1.29, - "learning_rate": 0.00010719335798144905, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00021002013006341723, + "loss": 0.0137, "step": 118900 }, { - "epoch": 1.29, - "learning_rate": 0.00010717714211584613, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00021001256237040324, + "loss": 0.0106, "step": 118910 }, { - "epoch": 1.29, - "learning_rate": 0.00010716092625024324, - "loss": 0.0069, + "epoch": 0.6, + "learning_rate": 0.00021000499467738922, + "loss": 0.0191, "step": 118920 }, { - "epoch": 1.29, - "learning_rate": 0.00010714471038464032, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.0002099974269843752, + "loss": 0.0199, "step": 118930 }, { - "epoch": 1.29, - "learning_rate": 0.00010712849451903742, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.0002099898592913612, + "loss": 0.0165, "step": 118940 }, { - "epoch": 1.29, - "learning_rate": 0.0001071122786534345, - "loss": 0.0113, + "epoch": 0.6, + "learning_rate": 0.0002099822915983472, + "loss": 0.017, "step": 118950 }, { - "epoch": 1.29, - "learning_rate": 0.00010709606278783161, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00020997472390533317, + "loss": 0.0181, "step": 118960 }, { - "epoch": 1.29, - "learning_rate": 0.0001070798469222287, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.00020996715621231915, + "loss": 0.016, "step": 118970 }, { - "epoch": 1.29, - "learning_rate": 0.00010706363105662579, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00020995958851930516, + "loss": 0.0137, "step": 118980 }, { - "epoch": 1.29, - "learning_rate": 0.00010704741519102289, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00020995202082629114, + "loss": 0.0158, "step": 118990 }, { - "epoch": 1.29, - "learning_rate": 0.00010703119932541999, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.00020994445313327712, + "loss": 0.0123, "step": 119000 }, { - "epoch": 1.29, - "eval_cer": 0.9215321461268126, - "eval_loss": 0.007560289464890957, - "eval_runtime": 121.1493, - "eval_samples_per_second": 16.509, - "eval_steps_per_second": 4.127, + "epoch": 0.6, + "eval_cer": 0.9144935454101719, + "eval_loss": 0.010422189719974995, + "eval_runtime": 116.7072, + "eval_samples_per_second": 17.137, + "eval_steps_per_second": 4.284, "step": 119000 }, { - "epoch": 1.29, - "learning_rate": 0.00010701498345981707, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00020993688544026313, + "loss": 0.0139, "step": 119010 }, { - "epoch": 1.29, - "learning_rate": 0.00010699876759421418, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00020992931774724911, + "loss": 0.0162, "step": 119020 }, { - "epoch": 1.29, - "learning_rate": 0.00010698255172861126, - "loss": 0.0078, + "epoch": 0.6, + "learning_rate": 0.0002099217500542351, + "loss": 0.016, "step": 119030 }, { - "epoch": 1.29, - "learning_rate": 0.00010696633586300836, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.0002099141823612211, + "loss": 0.0134, "step": 119040 }, { - "epoch": 1.29, - "learning_rate": 0.00010695011999740544, - "loss": 0.0066, + "epoch": 0.6, + "learning_rate": 0.00020990661466820709, + "loss": 0.0138, "step": 119050 }, { - "epoch": 1.29, - "learning_rate": 0.00010693390413180255, - "loss": 0.0113, + "epoch": 0.6, + "learning_rate": 0.00020989904697519307, + "loss": 0.0166, "step": 119060 }, { - "epoch": 1.29, - "learning_rate": 0.00010691768826619964, - "loss": 0.0108, + "epoch": 0.6, + "learning_rate": 0.00020989147928217908, + "loss": 0.0143, "step": 119070 }, { - "epoch": 1.29, - "learning_rate": 0.00010690147240059673, - "loss": 0.0105, + "epoch": 0.6, + "learning_rate": 0.00020988391158916506, + "loss": 0.0137, "step": 119080 }, { - "epoch": 1.29, - "learning_rate": 0.00010688525653499383, - "loss": 0.0095, + "epoch": 0.6, + "learning_rate": 0.00020987634389615104, + "loss": 0.0136, "step": 119090 }, { - "epoch": 1.29, - "learning_rate": 0.00010686904066939092, - "loss": 0.007, + "epoch": 0.6, + "learning_rate": 0.00020986877620313705, + "loss": 0.015, "step": 119100 }, { - "epoch": 1.29, - "learning_rate": 0.00010685282480378801, - "loss": 0.0121, + "epoch": 0.6, + "learning_rate": 0.00020986120851012303, + "loss": 0.012, "step": 119110 }, { - "epoch": 1.29, - "learning_rate": 0.00010683660893818512, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.000209853640817109, + "loss": 0.0143, "step": 119120 }, { - "epoch": 1.29, - "learning_rate": 0.0001068203930725822, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.000209846073124095, + "loss": 0.0157, "step": 119130 }, { - "epoch": 1.29, - "learning_rate": 0.0001068041772069793, - "loss": 0.0105, + "epoch": 0.6, + "learning_rate": 0.000209838505431081, + "loss": 0.0152, "step": 119140 }, { - "epoch": 1.29, - "learning_rate": 0.00010678796134137638, - "loss": 0.0138, + "epoch": 0.6, + "learning_rate": 0.00020983093773806698, + "loss": 0.0142, "step": 119150 }, { - "epoch": 1.29, - "learning_rate": 0.00010677174547577349, - "loss": 0.0078, + "epoch": 0.6, + "learning_rate": 0.00020982337004505296, + "loss": 0.0145, "step": 119160 }, { - "epoch": 1.29, - "learning_rate": 0.00010675552961017058, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00020981580235203897, + "loss": 0.0181, "step": 119170 }, { - "epoch": 1.29, - "learning_rate": 0.00010673931374456768, - "loss": 0.0101, + "epoch": 0.6, + "learning_rate": 0.00020980823465902495, + "loss": 0.0142, "step": 119180 }, { - "epoch": 1.29, - "learning_rate": 0.00010672309787896477, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00020980066696601093, + "loss": 0.014, "step": 119190 }, { - "epoch": 1.29, - "learning_rate": 0.00010670688201336186, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00020979309927299694, + "loss": 0.0137, "step": 119200 }, { - "epoch": 1.29, - "learning_rate": 0.00010669066614775895, - "loss": 0.0103, + "epoch": 0.6, + "learning_rate": 0.00020978553157998292, + "loss": 0.0153, "step": 119210 }, { - "epoch": 1.29, - "learning_rate": 0.00010667445028215606, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.0002097779638869689, + "loss": 0.0161, "step": 119220 }, { - "epoch": 1.29, - "learning_rate": 0.00010665823441655314, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00020977039619395491, + "loss": 0.0139, "step": 119230 }, { - "epoch": 1.29, - "learning_rate": 0.00010664201855095025, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.0002097628285009409, + "loss": 0.0143, "step": 119240 }, { - "epoch": 1.29, - "learning_rate": 0.00010662580268534732, - "loss": 0.0118, + "epoch": 0.6, + "learning_rate": 0.00020975526080792688, + "loss": 0.0138, "step": 119250 }, { - "epoch": 1.29, - "learning_rate": 0.00010660958681974443, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00020974769311491289, + "loss": 0.0141, "step": 119260 }, { - "epoch": 1.29, - "learning_rate": 0.00010659337095414151, - "loss": 0.0104, + "epoch": 0.6, + "learning_rate": 0.00020974012542189887, + "loss": 0.0148, "step": 119270 }, { - "epoch": 1.29, - "learning_rate": 0.00010657715508853862, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00020973255772888485, + "loss": 0.013, "step": 119280 }, { - "epoch": 1.29, - "learning_rate": 0.00010656093922293571, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00020972499003587083, + "loss": 0.0177, "step": 119290 }, { - "epoch": 1.29, - "learning_rate": 0.0001065447233573328, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.00020971742234285684, + "loss": 0.015, "step": 119300 }, { - "epoch": 1.29, - "learning_rate": 0.0001065285074917299, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00020970985464984282, + "loss": 0.0168, "step": 119310 }, { - "epoch": 1.29, - "learning_rate": 0.000106512291626127, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.0002097022869568288, + "loss": 0.0153, "step": 119320 }, { - "epoch": 1.29, - "learning_rate": 0.00010649607576052408, - "loss": 0.0108, + "epoch": 0.6, + "learning_rate": 0.0002096947192638148, + "loss": 0.0144, "step": 119330 }, { - "epoch": 1.29, - "learning_rate": 0.00010647985989492119, - "loss": 0.0118, + "epoch": 0.6, + "learning_rate": 0.0002096871515708008, + "loss": 0.0113, "step": 119340 }, { - "epoch": 1.29, - "learning_rate": 0.00010646364402931827, - "loss": 0.0119, + "epoch": 0.6, + "learning_rate": 0.00020967958387778677, + "loss": 0.0135, "step": 119350 }, { - "epoch": 1.29, - "learning_rate": 0.00010644742816371537, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.00020967201618477278, + "loss": 0.0132, "step": 119360 }, { - "epoch": 1.29, - "learning_rate": 0.00010643121229811245, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.00020966444849175876, + "loss": 0.0178, "step": 119370 }, { - "epoch": 1.29, - "learning_rate": 0.00010641499643250956, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00020965688079874474, + "loss": 0.0146, "step": 119380 }, { - "epoch": 1.29, - "learning_rate": 0.00010639878056690665, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00020964931310573075, + "loss": 0.0147, "step": 119390 }, { - "epoch": 1.29, - "learning_rate": 0.00010638256470130374, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00020964174541271673, + "loss": 0.0146, "step": 119400 }, { - "epoch": 1.29, - "learning_rate": 0.00010636634883570085, - "loss": 0.0104, + "epoch": 0.6, + "learning_rate": 0.00020963417771970272, + "loss": 0.013, "step": 119410 }, { - "epoch": 1.29, - "learning_rate": 0.00010635013297009793, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00020962661002668872, + "loss": 0.0134, "step": 119420 }, { - "epoch": 1.29, - "learning_rate": 0.00010633391710449503, - "loss": 0.0103, + "epoch": 0.6, + "learning_rate": 0.0002096190423336747, + "loss": 0.0145, "step": 119430 }, { - "epoch": 1.29, - "learning_rate": 0.00010631770123889213, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.0002096114746406607, + "loss": 0.0144, "step": 119440 }, { - "epoch": 1.29, - "learning_rate": 0.00010630148537328922, - "loss": 0.0117, + "epoch": 0.6, + "learning_rate": 0.0002096039069476467, + "loss": 0.0127, "step": 119450 }, { - "epoch": 1.29, - "learning_rate": 0.00010628526950768631, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.00020959633925463268, + "loss": 0.0136, "step": 119460 }, { - "epoch": 1.29, - "learning_rate": 0.00010626905364208342, - "loss": 0.0074, + "epoch": 0.6, + "learning_rate": 0.00020958877156161866, + "loss": 0.0143, "step": 119470 }, { - "epoch": 1.29, - "learning_rate": 0.0001062528377764805, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00020958120386860464, + "loss": 0.0137, "step": 119480 }, { - "epoch": 1.29, - "learning_rate": 0.0001062366219108776, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00020957363617559065, + "loss": 0.0142, "step": 119490 }, { - "epoch": 1.29, - "learning_rate": 0.00010622040604527468, - "loss": 0.0101, + "epoch": 0.6, + "learning_rate": 0.00020956606848257663, + "loss": 0.0145, "step": 119500 }, { - "epoch": 1.29, - "learning_rate": 0.00010620419017967179, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.0002095585007895626, + "loss": 0.0122, "step": 119510 }, { - "epoch": 1.29, - "learning_rate": 0.00010618797431406887, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00020955093309654862, + "loss": 0.011, "step": 119520 }, { - "epoch": 1.29, - "learning_rate": 0.00010617175844846598, - "loss": 0.0119, + "epoch": 0.6, + "learning_rate": 0.0002095433654035346, + "loss": 0.0145, "step": 119530 }, { - "epoch": 1.29, - "learning_rate": 0.00010615554258286307, - "loss": 0.0108, + "epoch": 0.6, + "learning_rate": 0.00020953579771052058, + "loss": 0.0115, "step": 119540 }, { - "epoch": 1.29, - "learning_rate": 0.00010613932671726016, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.0002095282300175066, + "loss": 0.0141, "step": 119550 }, { - "epoch": 1.29, - "learning_rate": 0.00010612311085165725, - "loss": 0.0093, + "epoch": 0.6, + "learning_rate": 0.00020952066232449257, + "loss": 0.013, "step": 119560 }, { - "epoch": 1.29, - "learning_rate": 0.00010610689498605435, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00020951309463147855, + "loss": 0.0167, "step": 119570 }, { - "epoch": 1.29, - "learning_rate": 0.00010609067912045144, - "loss": 0.0063, + "epoch": 0.6, + "learning_rate": 0.00020950552693846456, + "loss": 0.014, "step": 119580 }, { - "epoch": 1.29, - "learning_rate": 0.00010607446325484855, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.00020949795924545054, + "loss": 0.0142, "step": 119590 }, { - "epoch": 1.29, - "learning_rate": 0.00010605824738924562, - "loss": 0.0125, + "epoch": 0.6, + "learning_rate": 0.00020949039155243653, + "loss": 0.0164, "step": 119600 }, { - "epoch": 1.29, - "learning_rate": 0.00010604203152364273, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00020948282385942253, + "loss": 0.0139, "step": 119610 }, { - "epoch": 1.29, - "learning_rate": 0.00010602581565803981, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00020947525616640852, + "loss": 0.0117, "step": 119620 }, { - "epoch": 1.29, - "learning_rate": 0.00010600959979243692, - "loss": 0.0106, + "epoch": 0.6, + "learning_rate": 0.0002094676884733945, + "loss": 0.013, "step": 119630 }, { - "epoch": 1.29, - "learning_rate": 0.00010599338392683401, - "loss": 0.0084, + "epoch": 0.6, + "learning_rate": 0.00020946012078038048, + "loss": 0.0174, "step": 119640 }, { - "epoch": 1.29, - "learning_rate": 0.0001059771680612311, - "loss": 0.007, + "epoch": 0.6, + "learning_rate": 0.0002094525530873665, + "loss": 0.016, "step": 119650 }, { - "epoch": 1.29, - "learning_rate": 0.0001059609521956282, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00020944498539435247, + "loss": 0.0191, "step": 119660 }, { - "epoch": 1.29, - "learning_rate": 0.00010594473633002529, - "loss": 0.0106, + "epoch": 0.6, + "learning_rate": 0.00020943741770133845, + "loss": 0.0144, "step": 119670 }, { - "epoch": 1.29, - "learning_rate": 0.00010592852046442238, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00020942985000832446, + "loss": 0.0164, "step": 119680 }, { - "epoch": 1.29, - "learning_rate": 0.00010591230459881949, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00020942228231531044, + "loss": 0.0128, "step": 119690 }, { - "epoch": 1.29, - "learning_rate": 0.00010589608873321657, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00020941471462229642, + "loss": 0.0169, "step": 119700 }, { - "epoch": 1.29, - "learning_rate": 0.00010587987286761367, - "loss": 0.0071, + "epoch": 0.6, + "learning_rate": 0.00020940714692928243, + "loss": 0.0163, "step": 119710 }, { - "epoch": 1.29, - "learning_rate": 0.00010586365700201075, - "loss": 0.0103, + "epoch": 0.6, + "learning_rate": 0.0002093995792362684, + "loss": 0.021, "step": 119720 }, { - "epoch": 1.29, - "learning_rate": 0.00010584744113640786, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.0002093920115432544, + "loss": 0.0151, "step": 119730 }, { - "epoch": 1.29, - "learning_rate": 0.00010583122527080494, - "loss": 0.0084, + "epoch": 0.6, + "learning_rate": 0.0002093844438502404, + "loss": 0.017, "step": 119740 }, { - "epoch": 1.29, - "learning_rate": 0.00010581500940520204, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00020937687615722638, + "loss": 0.0143, "step": 119750 }, { - "epoch": 1.29, - "learning_rate": 0.00010579879353959914, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00020936930846421236, + "loss": 0.0155, "step": 119760 }, { - "epoch": 1.29, - "learning_rate": 0.00010578257767399623, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00020936174077119837, + "loss": 0.0139, "step": 119770 }, { - "epoch": 1.29, - "learning_rate": 0.00010576636180839332, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.00020935417307818435, + "loss": 0.0162, "step": 119780 }, { - "epoch": 1.29, - "learning_rate": 0.00010575014594279043, - "loss": 0.0107, + "epoch": 0.6, + "learning_rate": 0.00020934660538517034, + "loss": 0.0112, "step": 119790 }, { - "epoch": 1.3, - "learning_rate": 0.0001057339300771875, - "loss": 0.0093, + "epoch": 0.6, + "learning_rate": 0.00020933903769215632, + "loss": 0.0147, "step": 119800 }, { - "epoch": 1.3, - "learning_rate": 0.00010571771421158461, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00020933146999914233, + "loss": 0.0165, "step": 119810 }, { - "epoch": 1.3, - "learning_rate": 0.00010570149834598169, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.0002093239023061283, + "loss": 0.0204, "step": 119820 }, { - "epoch": 1.3, - "learning_rate": 0.0001056852824803788, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.0002093163346131143, + "loss": 0.0165, "step": 119830 }, { - "epoch": 1.3, - "learning_rate": 0.00010566906661477588, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.0002093087669201003, + "loss": 0.0146, "step": 119840 }, { - "epoch": 1.3, - "learning_rate": 0.00010565285074917298, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00020930119922708628, + "loss": 0.0148, "step": 119850 }, { - "epoch": 1.3, - "learning_rate": 0.00010563663488357008, - "loss": 0.0075, + "epoch": 0.6, + "learning_rate": 0.00020929363153407226, + "loss": 0.0122, "step": 119860 }, { - "epoch": 1.3, - "learning_rate": 0.00010562041901796717, - "loss": 0.0121, + "epoch": 0.6, + "learning_rate": 0.00020928606384105827, + "loss": 0.0138, "step": 119870 }, { - "epoch": 1.3, - "learning_rate": 0.00010560420315236426, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00020927849614804425, + "loss": 0.0156, "step": 119880 }, { - "epoch": 1.3, - "learning_rate": 0.00010558798728676135, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00020927092845503023, + "loss": 0.0138, "step": 119890 }, { - "epoch": 1.3, - "learning_rate": 0.00010557177142115845, - "loss": 0.0121, + "epoch": 0.6, + "learning_rate": 0.00020926336076201624, + "loss": 0.0159, "step": 119900 }, { - "epoch": 1.3, - "learning_rate": 0.00010555555555555555, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.00020925579306900222, + "loss": 0.0143, "step": 119910 }, { - "epoch": 1.3, - "learning_rate": 0.00010553933968995263, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.0002092482253759882, + "loss": 0.0155, "step": 119920 }, { - "epoch": 1.3, - "learning_rate": 0.00010552312382434974, - "loss": 0.0121, + "epoch": 0.61, + "learning_rate": 0.0002092406576829742, + "loss": 0.0276, "step": 119930 }, { - "epoch": 1.3, - "learning_rate": 0.00010550690795874682, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.0002092330899899602, + "loss": 0.0167, "step": 119940 }, { - "epoch": 1.3, - "learning_rate": 0.00010549069209314392, - "loss": 0.0097, + "epoch": 0.61, + "learning_rate": 0.00020922552229694617, + "loss": 0.019, "step": 119950 }, { - "epoch": 1.3, - "learning_rate": 0.000105474476227541, - "loss": 0.0117, + "epoch": 0.61, + "learning_rate": 0.00020921795460393218, + "loss": 0.0149, "step": 119960 }, { - "epoch": 1.3, - "learning_rate": 0.00010545826036193811, - "loss": 0.0067, + "epoch": 0.61, + "learning_rate": 0.00020921038691091816, + "loss": 0.0166, "step": 119970 }, { - "epoch": 1.3, - "learning_rate": 0.0001054420444963352, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020920281921790415, + "loss": 0.0147, "step": 119980 }, { - "epoch": 1.3, - "learning_rate": 0.0001054258286307323, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.00020919525152489013, + "loss": 0.013, "step": 119990 }, { - "epoch": 1.3, - "learning_rate": 0.00010540961276512939, - "loss": 0.0102, + "epoch": 0.61, + "learning_rate": 0.00020918768383187614, + "loss": 0.0134, "step": 120000 }, { - "epoch": 1.3, - "eval_cer": 0.921546912377071, - "eval_loss": 0.007600127719342709, - "eval_runtime": 121.3753, - "eval_samples_per_second": 16.478, - "eval_steps_per_second": 4.119, + "epoch": 0.61, + "eval_cer": 0.9144925750140465, + "eval_loss": 0.0107016796246171, + "eval_runtime": 116.8152, + "eval_samples_per_second": 17.121, + "eval_steps_per_second": 4.28, "step": 120000 }, { - "epoch": 1.3, - "learning_rate": 0.0001053933968995265, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.00020918011613886212, + "loss": 0.0128, "step": 120010 }, { - "epoch": 1.3, - "learning_rate": 0.00010537718103392357, - "loss": 0.0109, + "epoch": 0.61, + "learning_rate": 0.0002091725484458481, + "loss": 0.0138, "step": 120020 }, { - "epoch": 1.3, - "learning_rate": 0.00010536096516832068, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.0002091649807528341, + "loss": 0.0138, "step": 120030 }, { - "epoch": 1.3, - "learning_rate": 0.00010534474930271776, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.00020915741305982006, + "loss": 0.0128, "step": 120040 }, { - "epoch": 1.3, - "learning_rate": 0.00010532853343711487, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020914984536680604, + "loss": 0.0164, "step": 120050 }, { - "epoch": 1.3, - "learning_rate": 0.00010531231757151194, - "loss": 0.0074, + "epoch": 0.61, + "learning_rate": 0.00020914227767379202, + "loss": 0.0129, "step": 120060 }, { - "epoch": 1.3, - "learning_rate": 0.00010529610170590905, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.00020913470998077803, + "loss": 0.0156, "step": 120070 }, { - "epoch": 1.3, - "learning_rate": 0.00010527988584030614, - "loss": 0.0094, + "epoch": 0.61, + "learning_rate": 0.00020912714228776401, + "loss": 0.0199, "step": 120080 }, { - "epoch": 1.3, - "learning_rate": 0.00010526366997470324, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.00020911957459475, + "loss": 0.0168, "step": 120090 }, { - "epoch": 1.3, - "learning_rate": 0.00010524745410910033, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.000209112006901736, + "loss": 0.0181, "step": 120100 }, { - "epoch": 1.3, - "learning_rate": 0.00010523123824349742, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.00020910443920872199, + "loss": 0.0154, "step": 120110 }, { - "epoch": 1.3, - "learning_rate": 0.00010521502237789452, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.00020909687151570797, + "loss": 0.0125, "step": 120120 }, { - "epoch": 1.3, - "learning_rate": 0.00010519880651229162, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.00020908930382269398, + "loss": 0.0178, "step": 120130 }, { - "epoch": 1.3, - "learning_rate": 0.00010518259064668871, - "loss": 0.0055, + "epoch": 0.61, + "learning_rate": 0.00020908173612967996, + "loss": 0.0169, "step": 120140 }, { - "epoch": 1.3, - "learning_rate": 0.00010516637478108581, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020907416843666594, + "loss": 0.0147, "step": 120150 }, { - "epoch": 1.3, - "learning_rate": 0.00010515015891548291, - "loss": 0.0112, + "epoch": 0.61, + "learning_rate": 0.00020906660074365195, + "loss": 0.0131, "step": 120160 }, { - "epoch": 1.3, - "learning_rate": 0.00010513394304987999, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.00020905903305063793, + "loss": 0.0128, "step": 120170 }, { - "epoch": 1.3, - "learning_rate": 0.0001051177271842771, - "loss": 0.0072, + "epoch": 0.61, + "learning_rate": 0.0002090514653576239, + "loss": 0.0131, "step": 120180 }, { - "epoch": 1.3, - "learning_rate": 0.00010510151131867418, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.0002090438976646099, + "loss": 0.0158, "step": 120190 }, { - "epoch": 1.3, - "learning_rate": 0.00010508529545307128, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.0002090363299715959, + "loss": 0.0133, "step": 120200 }, { - "epoch": 1.3, - "learning_rate": 0.00010506907958746836, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.00020902876227858188, + "loss": 0.0129, "step": 120210 }, { - "epoch": 1.3, - "learning_rate": 0.00010505286372186547, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020902119458556786, + "loss": 0.0143, "step": 120220 }, { - "epoch": 1.3, - "learning_rate": 0.00010503664785626256, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.00020901362689255387, + "loss": 0.0149, "step": 120230 }, { - "epoch": 1.3, - "learning_rate": 0.00010502043199065966, - "loss": 0.0132, + "epoch": 0.61, + "learning_rate": 0.00020900605919953985, + "loss": 0.0151, "step": 120240 }, { - "epoch": 1.3, - "learning_rate": 0.00010500421612505675, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.00020899849150652583, + "loss": 0.0167, "step": 120250 }, { - "epoch": 1.3, - "learning_rate": 0.00010498800025945384, - "loss": 0.0109, + "epoch": 0.61, + "learning_rate": 0.00020899092381351184, + "loss": 0.0139, "step": 120260 }, { - "epoch": 1.3, - "learning_rate": 0.00010497178439385093, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.00020898335612049782, + "loss": 0.0131, "step": 120270 }, { - "epoch": 1.3, - "learning_rate": 0.00010495556852824804, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.0002089757884274838, + "loss": 0.0173, "step": 120280 }, { - "epoch": 1.3, - "learning_rate": 0.00010493935266264512, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020896822073446981, + "loss": 0.0135, "step": 120290 }, { - "epoch": 1.3, - "learning_rate": 0.00010492313679704223, - "loss": 0.0102, + "epoch": 0.61, + "learning_rate": 0.0002089606530414558, + "loss": 0.0149, "step": 120300 }, { - "epoch": 1.3, - "learning_rate": 0.0001049069209314393, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.00020895308534844178, + "loss": 0.0184, "step": 120310 }, { - "epoch": 1.3, - "learning_rate": 0.00010489070506583641, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.00020894551765542779, + "loss": 0.0142, "step": 120320 }, { - "epoch": 1.3, - "learning_rate": 0.0001048744892002335, - "loss": 0.0104, + "epoch": 0.61, + "learning_rate": 0.00020893794996241377, + "loss": 0.0196, "step": 120330 }, { - "epoch": 1.3, - "learning_rate": 0.0001048582733346306, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.00020893038226939975, + "loss": 0.0188, "step": 120340 }, { - "epoch": 1.3, - "learning_rate": 0.00010484205746902769, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020892281457638576, + "loss": 0.0132, "step": 120350 }, { - "epoch": 1.3, - "learning_rate": 0.00010482584160342478, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020891524688337174, + "loss": 0.0193, "step": 120360 }, { - "epoch": 1.3, - "learning_rate": 0.00010480962573782187, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020890767919035772, + "loss": 0.0121, "step": 120370 }, { - "epoch": 1.3, - "learning_rate": 0.00010479340987221898, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.0002089001114973437, + "loss": 0.0174, "step": 120380 }, { - "epoch": 1.3, - "learning_rate": 0.00010477719400661606, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.0002088925438043297, + "loss": 0.0142, "step": 120390 }, { - "epoch": 1.3, - "learning_rate": 0.00010476097814101317, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.0002088849761113157, + "loss": 0.0119, "step": 120400 }, { - "epoch": 1.3, - "learning_rate": 0.00010474476227541025, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.00020887740841830167, + "loss": 0.0116, "step": 120410 }, { - "epoch": 1.3, - "learning_rate": 0.00010472854640980735, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020886984072528768, + "loss": 0.0146, "step": 120420 }, { - "epoch": 1.3, - "learning_rate": 0.00010471233054420443, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020886227303227366, + "loss": 0.0198, "step": 120430 }, { - "epoch": 1.3, - "learning_rate": 0.00010469611467860154, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.00020885470533925964, + "loss": 0.0147, "step": 120440 }, { - "epoch": 1.3, - "learning_rate": 0.00010467989881299863, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.00020884713764624565, + "loss": 0.0152, "step": 120450 }, { - "epoch": 1.3, - "learning_rate": 0.00010466368294739572, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.00020883956995323163, + "loss": 0.015, "step": 120460 }, { - "epoch": 1.3, - "learning_rate": 0.00010464746708179282, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020883200226021762, + "loss": 0.0122, "step": 120470 }, { - "epoch": 1.3, - "learning_rate": 0.00010463125121618992, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020882443456720362, + "loss": 0.0163, "step": 120480 }, { - "epoch": 1.3, - "learning_rate": 0.000104615035350587, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.0002088168668741896, + "loss": 0.0124, "step": 120490 }, { - "epoch": 1.3, - "learning_rate": 0.00010459881948498411, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.0002088092991811756, + "loss": 0.0133, "step": 120500 }, { - "epoch": 1.3, - "learning_rate": 0.00010458260361938119, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.0002088017314881616, + "loss": 0.0107, "step": 120510 }, { - "epoch": 1.3, - "learning_rate": 0.00010456638775377829, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020879416379514758, + "loss": 0.0141, "step": 120520 }, { - "epoch": 1.3, - "learning_rate": 0.00010455017188817537, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.00020878659610213356, + "loss": 0.0142, "step": 120530 }, { - "epoch": 1.3, - "learning_rate": 0.00010453395602257248, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.00020877902840911954, + "loss": 0.0169, "step": 120540 }, { - "epoch": 1.3, - "learning_rate": 0.00010451774015696957, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.00020877146071610555, + "loss": 0.016, "step": 120550 }, { - "epoch": 1.3, - "learning_rate": 0.00010450152429136666, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.00020876389302309153, + "loss": 0.0174, "step": 120560 }, { - "epoch": 1.3, - "learning_rate": 0.00010448530842576376, - "loss": 0.0104, + "epoch": 0.61, + "learning_rate": 0.0002087563253300775, + "loss": 0.0186, "step": 120570 }, { - "epoch": 1.3, - "learning_rate": 0.00010446909256016085, - "loss": 0.0071, + "epoch": 0.61, + "learning_rate": 0.00020874875763706352, + "loss": 0.0281, "step": 120580 }, { - "epoch": 1.3, - "learning_rate": 0.00010445287669455794, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.0002087411899440495, + "loss": 0.014, "step": 120590 }, { - "epoch": 1.3, - "learning_rate": 0.00010443666082895505, - "loss": 0.0102, + "epoch": 0.61, + "learning_rate": 0.00020873362225103548, + "loss": 0.0112, "step": 120600 }, { - "epoch": 1.3, - "learning_rate": 0.00010442044496335213, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.0002087260545580215, + "loss": 0.018, "step": 120610 }, { - "epoch": 1.3, - "learning_rate": 0.00010440422909774923, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.00020871848686500747, + "loss": 0.0143, "step": 120620 }, { - "epoch": 1.3, - "learning_rate": 0.00010438801323214631, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020871091917199345, + "loss": 0.0158, "step": 120630 }, { - "epoch": 1.3, - "learning_rate": 0.00010437179736654342, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.00020870335147897946, + "loss": 0.0145, "step": 120640 }, { - "epoch": 1.3, - "learning_rate": 0.00010435558150094051, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020869578378596544, + "loss": 0.0171, "step": 120650 }, { - "epoch": 1.3, - "learning_rate": 0.0001043393656353376, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.00020868821609295143, + "loss": 0.0136, "step": 120660 }, { - "epoch": 1.3, - "learning_rate": 0.0001043231497697347, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020868064839993743, + "loss": 0.0166, "step": 120670 }, { - "epoch": 1.3, - "learning_rate": 0.00010430693390413179, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020867308070692342, + "loss": 0.0151, "step": 120680 }, { - "epoch": 1.3, - "learning_rate": 0.00010429071803852888, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.0002086655130139094, + "loss": 0.0136, "step": 120690 }, { - "epoch": 1.3, - "learning_rate": 0.00010427450217292599, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020865794532089538, + "loss": 0.0127, "step": 120700 }, { - "epoch": 1.3, - "learning_rate": 0.00010425828630732307, - "loss": 0.011, + "epoch": 0.61, + "learning_rate": 0.0002086503776278814, + "loss": 0.0199, "step": 120710 }, { - "epoch": 1.31, - "learning_rate": 0.00010424207044172017, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020864280993486737, + "loss": 0.0166, "step": 120720 }, { - "epoch": 1.31, - "learning_rate": 0.00010422585457611725, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.00020863524224185335, + "loss": 0.0137, "step": 120730 }, { - "epoch": 1.31, - "learning_rate": 0.00010420963871051436, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020862767454883936, + "loss": 0.0138, "step": 120740 }, { - "epoch": 1.31, - "learning_rate": 0.00010419342284491144, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.00020862010685582534, + "loss": 0.015, "step": 120750 }, { - "epoch": 1.31, - "learning_rate": 0.00010417720697930855, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020861253916281132, + "loss": 0.0144, "step": 120760 }, { - "epoch": 1.31, - "learning_rate": 0.00010416099111370564, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.00020860497146979733, + "loss": 0.0176, "step": 120770 }, { - "epoch": 1.31, - "learning_rate": 0.00010414477524810273, - "loss": 0.0071, + "epoch": 0.61, + "learning_rate": 0.0002085974037767833, + "loss": 0.0132, "step": 120780 }, { - "epoch": 1.31, - "learning_rate": 0.00010412855938249982, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.0002085898360837693, + "loss": 0.0153, "step": 120790 }, { - "epoch": 1.31, - "learning_rate": 0.00010411234351689693, - "loss": 0.0079, + "epoch": 0.61, + "learning_rate": 0.0002085822683907553, + "loss": 0.0152, "step": 120800 }, { - "epoch": 1.31, - "learning_rate": 0.00010409612765129401, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.00020857470069774128, + "loss": 0.0111, "step": 120810 }, { - "epoch": 1.31, - "learning_rate": 0.00010407991178569112, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020856713300472726, + "loss": 0.014, "step": 120820 }, { - "epoch": 1.31, - "learning_rate": 0.0001040636959200882, - "loss": 0.0107, + "epoch": 0.61, + "learning_rate": 0.00020855956531171327, + "loss": 0.014, "step": 120830 }, { - "epoch": 1.31, - "learning_rate": 0.0001040474800544853, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020855199761869925, + "loss": 0.0146, "step": 120840 }, { - "epoch": 1.31, - "learning_rate": 0.00010403126418888241, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.00020854442992568524, + "loss": 0.0185, "step": 120850 }, { - "epoch": 1.31, - "learning_rate": 0.00010401504832327949, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020853686223267124, + "loss": 0.0151, "step": 120860 }, { - "epoch": 1.31, - "learning_rate": 0.00010399883245767659, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020852929453965723, + "loss": 0.0157, "step": 120870 }, { - "epoch": 1.31, - "learning_rate": 0.00010398261659207367, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.0002085217268466432, + "loss": 0.0119, "step": 120880 }, { - "epoch": 1.31, - "learning_rate": 0.00010396640072647078, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.0002085141591536292, + "loss": 0.0171, "step": 120890 }, { - "epoch": 1.31, - "learning_rate": 0.00010395018486086786, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.0002085065914606152, + "loss": 0.017, "step": 120900 }, { - "epoch": 1.31, - "learning_rate": 0.00010393396899526496, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.00020849902376760118, + "loss": 0.0143, "step": 120910 }, { - "epoch": 1.31, - "learning_rate": 0.00010391775312966206, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020849145607458716, + "loss": 0.013, "step": 120920 }, { - "epoch": 1.31, - "learning_rate": 0.00010390153726405915, - "loss": 0.0114, + "epoch": 0.61, + "learning_rate": 0.00020848388838157317, + "loss": 0.0156, "step": 120930 }, { - "epoch": 1.31, - "learning_rate": 0.00010388532139845624, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020847632068855915, + "loss": 0.0149, "step": 120940 }, { - "epoch": 1.31, - "learning_rate": 0.00010386910553285335, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.00020846875299554513, + "loss": 0.015, "step": 120950 }, { - "epoch": 1.31, - "learning_rate": 0.00010385288966725043, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020846118530253114, + "loss": 0.0135, "step": 120960 }, { - "epoch": 1.31, - "learning_rate": 0.00010383667380164753, - "loss": 0.0135, + "epoch": 0.61, + "learning_rate": 0.00020845361760951712, + "loss": 0.0167, "step": 120970 }, { - "epoch": 1.31, - "learning_rate": 0.00010382045793604461, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.0002084460499165031, + "loss": 0.0149, "step": 120980 }, { - "epoch": 1.31, - "learning_rate": 0.00010380424207044172, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.0002084384822234891, + "loss": 0.0136, "step": 120990 }, { - "epoch": 1.31, - "learning_rate": 0.0001037880262048388, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.0002084309145304751, + "loss": 0.0164, "step": 121000 }, { - "epoch": 1.31, - "eval_cer": 0.9215330147297689, - "eval_loss": 0.007609688676893711, - "eval_runtime": 121.1646, - "eval_samples_per_second": 16.506, - "eval_steps_per_second": 4.127, + "epoch": 0.61, + "eval_cer": 0.9144799598644162, + "eval_loss": 0.010320211760699749, + "eval_runtime": 116.7947, + "eval_samples_per_second": 17.124, + "eval_steps_per_second": 4.281, "step": 121000 }, { - "epoch": 1.31, - "learning_rate": 0.0001037718103392359, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020842334683746107, + "loss": 0.0171, "step": 121010 }, { - "epoch": 1.31, - "learning_rate": 0.000103755594473633, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020841577914444708, + "loss": 0.0128, "step": 121020 }, { - "epoch": 1.31, - "learning_rate": 0.00010373937860803009, - "loss": 0.0074, + "epoch": 0.61, + "learning_rate": 0.00020840821145143306, + "loss": 0.0111, "step": 121030 }, { - "epoch": 1.31, - "learning_rate": 0.00010372316274242718, - "loss": 0.0067, + "epoch": 0.61, + "learning_rate": 0.00020840064375841905, + "loss": 0.0125, "step": 121040 }, { - "epoch": 1.31, - "learning_rate": 0.00010370694687682428, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.00020839307606540503, + "loss": 0.0127, "step": 121050 }, { - "epoch": 1.31, - "learning_rate": 0.00010369073101122137, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.00020838550837239104, + "loss": 0.0125, "step": 121060 }, { - "epoch": 1.31, - "learning_rate": 0.00010367451514561847, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.00020837794067937702, + "loss": 0.0152, "step": 121070 }, { - "epoch": 1.31, - "learning_rate": 0.00010365829928001555, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.000208370372986363, + "loss": 0.0127, "step": 121080 }, { - "epoch": 1.31, - "learning_rate": 0.00010364208341441266, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.000208362805293349, + "loss": 0.015, "step": 121090 }, { - "epoch": 1.31, - "learning_rate": 0.00010362586754880974, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.000208355237600335, + "loss": 0.0185, "step": 121100 }, { - "epoch": 1.31, - "learning_rate": 0.00010360965168320685, - "loss": 0.0113, + "epoch": 0.61, + "learning_rate": 0.00020834766990732097, + "loss": 0.013, "step": 121110 }, { - "epoch": 1.31, - "learning_rate": 0.00010359343581760392, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020834010221430698, + "loss": 0.0158, "step": 121120 }, { - "epoch": 1.31, - "learning_rate": 0.00010357721995200103, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.00020833253452129296, + "loss": 0.013, "step": 121130 }, { - "epoch": 1.31, - "learning_rate": 0.00010356100408639812, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020832496682827894, + "loss": 0.0131, "step": 121140 }, { - "epoch": 1.31, - "learning_rate": 0.00010354478822079522, - "loss": 0.0125, + "epoch": 0.61, + "learning_rate": 0.00020831739913526495, + "loss": 0.0155, "step": 121150 }, { - "epoch": 1.31, - "learning_rate": 0.00010352857235519231, - "loss": 0.0112, + "epoch": 0.61, + "learning_rate": 0.00020830983144225093, + "loss": 0.0147, "step": 121160 }, { - "epoch": 1.31, - "learning_rate": 0.00010351235648958942, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.0002083022637492369, + "loss": 0.0139, "step": 121170 }, { - "epoch": 1.31, - "learning_rate": 0.0001034961406239865, - "loss": 0.0074, + "epoch": 0.61, + "learning_rate": 0.00020829469605622292, + "loss": 0.0123, "step": 121180 }, { - "epoch": 1.31, - "learning_rate": 0.0001034799247583836, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.0002082871283632089, + "loss": 0.0152, "step": 121190 }, { - "epoch": 1.31, - "learning_rate": 0.00010346370889278068, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.00020827956067019488, + "loss": 0.0135, "step": 121200 }, { - "epoch": 1.31, - "learning_rate": 0.00010344749302717779, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.00020827199297718087, + "loss": 0.014, "step": 121210 }, { - "epoch": 1.31, - "learning_rate": 0.00010343127716157487, - "loss": 0.0072, + "epoch": 0.61, + "learning_rate": 0.00020826442528416687, + "loss": 0.0158, "step": 121220 }, { - "epoch": 1.31, - "learning_rate": 0.00010341506129597197, - "loss": 0.0074, + "epoch": 0.61, + "learning_rate": 0.00020825685759115286, + "loss": 0.0178, "step": 121230 }, { - "epoch": 1.31, - "learning_rate": 0.00010339884543036906, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020824928989813884, + "loss": 0.013, "step": 121240 }, { - "epoch": 1.31, - "learning_rate": 0.00010338262956476616, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.00020824172220512485, + "loss": 0.012, "step": 121250 }, { - "epoch": 1.31, - "learning_rate": 0.00010336641369916325, - "loss": 0.0121, + "epoch": 0.61, + "learning_rate": 0.00020823415451211083, + "loss": 0.0182, "step": 121260 }, { - "epoch": 1.31, - "learning_rate": 0.00010335019783356034, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.0002082265868190968, + "loss": 0.0134, "step": 121270 }, { - "epoch": 1.31, - "learning_rate": 0.00010333398196795744, - "loss": 0.0107, + "epoch": 0.61, + "learning_rate": 0.00020821901912608282, + "loss": 0.0131, "step": 121280 }, { - "epoch": 1.31, - "learning_rate": 0.00010331776610235454, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020821145143306877, + "loss": 0.0132, "step": 121290 }, { - "epoch": 1.31, - "learning_rate": 0.00010330155023675162, - "loss": 0.0068, + "epoch": 0.61, + "learning_rate": 0.00020820388374005475, + "loss": 0.0175, "step": 121300 }, { - "epoch": 1.31, - "learning_rate": 0.00010328533437114873, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.00020819631604704073, + "loss": 0.014, "step": 121310 }, { - "epoch": 1.31, - "learning_rate": 0.00010326911850554581, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.00020818874835402674, + "loss": 0.0147, "step": 121320 }, { - "epoch": 1.31, - "learning_rate": 0.00010325290263994291, - "loss": 0.011, + "epoch": 0.61, + "learning_rate": 0.00020818118066101272, + "loss": 0.0177, "step": 121330 }, { - "epoch": 1.31, - "learning_rate": 0.00010323668677434, - "loss": 0.011, + "epoch": 0.61, + "learning_rate": 0.0002081736129679987, + "loss": 0.0204, "step": 121340 }, { - "epoch": 1.31, - "learning_rate": 0.0001032204709087371, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.00020816604527498471, + "loss": 0.0134, "step": 121350 }, { - "epoch": 1.31, - "learning_rate": 0.00010320425504313419, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.0002081584775819707, + "loss": 0.0176, "step": 121360 }, { - "epoch": 1.31, - "learning_rate": 0.00010318803917753128, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.00020815090988895668, + "loss": 0.0171, "step": 121370 }, { - "epoch": 1.31, - "learning_rate": 0.00010317182331192838, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.00020814334219594269, + "loss": 0.0166, "step": 121380 }, { - "epoch": 1.31, - "learning_rate": 0.00010315560744632548, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020813577450292867, + "loss": 0.0158, "step": 121390 }, { - "epoch": 1.31, - "learning_rate": 0.00010313939158072256, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.00020812820680991465, + "loss": 0.0142, "step": 121400 }, { - "epoch": 1.31, - "learning_rate": 0.00010312317571511967, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020812063911690066, + "loss": 0.0157, "step": 121410 }, { - "epoch": 1.31, - "learning_rate": 0.00010310695984951675, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.00020811307142388664, + "loss": 0.0127, "step": 121420 }, { - "epoch": 1.31, - "learning_rate": 0.00010309074398391385, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.00020810550373087262, + "loss": 0.0142, "step": 121430 }, { - "epoch": 1.31, - "learning_rate": 0.00010307452811831093, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.0002080979360378586, + "loss": 0.0117, "step": 121440 }, { - "epoch": 1.31, - "learning_rate": 0.00010305831225270804, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.0002080903683448446, + "loss": 0.0126, "step": 121450 }, { - "epoch": 1.31, - "learning_rate": 0.00010304209638710513, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.0002080828006518306, + "loss": 0.0128, "step": 121460 }, { - "epoch": 1.31, - "learning_rate": 0.00010302588052150223, - "loss": 0.0119, + "epoch": 0.61, + "learning_rate": 0.00020807523295881657, + "loss": 0.0128, "step": 121470 }, { - "epoch": 1.31, - "learning_rate": 0.00010300966465589932, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020806766526580258, + "loss": 0.0146, "step": 121480 }, { - "epoch": 1.31, - "learning_rate": 0.00010299344879029642, - "loss": 0.0112, + "epoch": 0.61, + "learning_rate": 0.00020806009757278856, + "loss": 0.0152, "step": 121490 }, { - "epoch": 1.31, - "learning_rate": 0.0001029772329246935, - "loss": 0.0119, + "epoch": 0.61, + "learning_rate": 0.00020805252987977455, + "loss": 0.0143, "step": 121500 }, { - "epoch": 1.31, - "learning_rate": 0.00010296101705909061, - "loss": 0.0079, + "epoch": 0.61, + "learning_rate": 0.00020804496218676055, + "loss": 0.0154, "step": 121510 }, { - "epoch": 1.31, - "learning_rate": 0.00010294480119348769, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.00020803739449374654, + "loss": 0.0153, "step": 121520 }, { - "epoch": 1.31, - "learning_rate": 0.0001029285853278848, - "loss": 0.0109, + "epoch": 0.61, + "learning_rate": 0.00020802982680073252, + "loss": 0.0131, "step": 121530 }, { - "epoch": 1.31, - "learning_rate": 0.00010291236946228187, - "loss": 0.0104, + "epoch": 0.61, + "learning_rate": 0.00020802225910771853, + "loss": 0.0113, "step": 121540 }, { - "epoch": 1.31, - "learning_rate": 0.00010289615359667898, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.0002080146914147045, + "loss": 0.0138, "step": 121550 }, { - "epoch": 1.31, - "learning_rate": 0.00010287993773107607, - "loss": 0.0111, + "epoch": 0.61, + "learning_rate": 0.0002080071237216905, + "loss": 0.015, "step": 121560 }, { - "epoch": 1.31, - "learning_rate": 0.00010286372186547317, - "loss": 0.0069, + "epoch": 0.61, + "learning_rate": 0.0002079995560286765, + "loss": 0.0168, "step": 121570 }, { - "epoch": 1.31, - "learning_rate": 0.00010284750599987027, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020799198833566248, + "loss": 0.0139, "step": 121580 }, { - "epoch": 1.31, - "learning_rate": 0.00010283129013426735, - "loss": 0.0102, + "epoch": 0.61, + "learning_rate": 0.00020798442064264846, + "loss": 0.0132, "step": 121590 }, { - "epoch": 1.31, - "learning_rate": 0.00010281507426866446, - "loss": 0.0109, + "epoch": 0.61, + "learning_rate": 0.00020797685294963444, + "loss": 0.0164, "step": 121600 }, { - "epoch": 1.31, - "learning_rate": 0.00010279885840306155, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.00020796928525662045, + "loss": 0.0167, "step": 121610 }, { - "epoch": 1.31, - "learning_rate": 0.00010278264253745864, - "loss": 0.0097, + "epoch": 0.61, + "learning_rate": 0.00020796171756360643, + "loss": 0.0149, "step": 121620 }, { - "epoch": 1.31, - "learning_rate": 0.00010276642667185574, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.0002079541498705924, + "loss": 0.0126, "step": 121630 }, { - "epoch": 1.31, - "learning_rate": 0.00010275021080625284, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.00020794658217757842, + "loss": 0.0148, "step": 121640 }, { - "epoch": 1.32, - "learning_rate": 0.00010273399494064992, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.0002079390144845644, + "loss": 0.0133, "step": 121650 }, { - "epoch": 1.32, - "learning_rate": 0.00010271777907504703, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.00020793144679155038, + "loss": 0.0149, "step": 121660 }, { - "epoch": 1.32, - "learning_rate": 0.00010270156320944411, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.0002079238790985364, + "loss": 0.015, "step": 121670 }, { - "epoch": 1.32, - "learning_rate": 0.00010268534734384121, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020791631140552237, + "loss": 0.0141, "step": 121680 }, { - "epoch": 1.32, - "learning_rate": 0.00010266913147823829, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020790874371250836, + "loss": 0.0146, "step": 121690 }, { - "epoch": 1.32, - "learning_rate": 0.0001026529156126354, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.00020790117601949436, + "loss": 0.0159, "step": 121700 }, { - "epoch": 1.32, - "learning_rate": 0.00010263669974703249, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.00020789360832648035, + "loss": 0.0128, "step": 121710 }, { - "epoch": 1.32, - "learning_rate": 0.00010262048388142958, - "loss": 0.0079, + "epoch": 0.61, + "learning_rate": 0.00020788604063346633, + "loss": 0.012, "step": 121720 }, { - "epoch": 1.32, - "learning_rate": 0.00010260426801582668, - "loss": 0.0065, + "epoch": 0.61, + "learning_rate": 0.00020787847294045234, + "loss": 0.0172, "step": 121730 }, { - "epoch": 1.32, - "learning_rate": 0.00010258805215022377, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020787090524743832, + "loss": 0.0151, "step": 121740 }, { - "epoch": 1.32, - "learning_rate": 0.00010257183628462086, - "loss": 0.0125, + "epoch": 0.61, + "learning_rate": 0.0002078633375544243, + "loss": 0.0109, "step": 121750 }, { - "epoch": 1.32, - "learning_rate": 0.00010255562041901797, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020785576986141028, + "loss": 0.0139, "step": 121760 }, { - "epoch": 1.32, - "learning_rate": 0.00010253940455341505, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.0002078482021683963, + "loss": 0.0149, "step": 121770 }, { - "epoch": 1.32, - "learning_rate": 0.00010252318868781215, - "loss": 0.0105, + "epoch": 0.61, + "learning_rate": 0.00020784063447538227, + "loss": 0.0122, "step": 121780 }, { - "epoch": 1.32, - "learning_rate": 0.00010250697282220923, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020783306678236825, + "loss": 0.012, "step": 121790 }, { - "epoch": 1.32, - "learning_rate": 0.00010249075695660634, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020782549908935426, + "loss": 0.0131, "step": 121800 }, { - "epoch": 1.32, - "learning_rate": 0.00010247454109100343, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.00020781793139634024, + "loss": 0.0137, "step": 121810 }, { - "epoch": 1.32, - "learning_rate": 0.00010245832522540053, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.00020781036370332622, + "loss": 0.0151, "step": 121820 }, { - "epoch": 1.32, - "learning_rate": 0.00010244210935979762, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.00020780279601031223, + "loss": 0.015, "step": 121830 }, { - "epoch": 1.32, - "learning_rate": 0.00010242589349419471, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.0002077952283172982, + "loss": 0.0129, "step": 121840 }, { - "epoch": 1.32, - "learning_rate": 0.0001024096776285918, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.0002077876606242842, + "loss": 0.0156, "step": 121850 }, { - "epoch": 1.32, - "learning_rate": 0.00010239346176298891, - "loss": 0.0069, + "epoch": 0.61, + "learning_rate": 0.0002077800929312702, + "loss": 0.0112, "step": 121860 }, { - "epoch": 1.32, - "learning_rate": 0.00010237724589738599, - "loss": 0.0116, + "epoch": 0.61, + "learning_rate": 0.00020777252523825618, + "loss": 0.0146, "step": 121870 }, { - "epoch": 1.32, - "learning_rate": 0.0001023610300317831, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020776495754524217, + "loss": 0.0176, "step": 121880 }, { - "epoch": 1.32, - "learning_rate": 0.00010234481416618017, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020775738985222817, + "loss": 0.0188, "step": 121890 }, { - "epoch": 1.32, - "learning_rate": 0.00010232859830057728, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.00020774982215921416, + "loss": 0.0149, "step": 121900 }, { - "epoch": 1.32, - "learning_rate": 0.00010231238243497436, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020774225446620014, + "loss": 0.0143, "step": 121910 }, { - "epoch": 1.32, - "learning_rate": 0.00010229616656937147, - "loss": 0.012, + "epoch": 0.62, + "learning_rate": 0.00020773468677318615, + "loss": 0.0137, "step": 121920 }, { - "epoch": 1.32, - "learning_rate": 0.00010227995070376856, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020772711908017213, + "loss": 0.0125, "step": 121930 }, { - "epoch": 1.32, - "learning_rate": 0.00010226373483816565, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.0002077195513871581, + "loss": 0.0152, "step": 121940 }, { - "epoch": 1.32, - "learning_rate": 0.00010224751897256274, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.0002077119836941441, + "loss": 0.0134, "step": 121950 }, { - "epoch": 1.32, - "learning_rate": 0.00010223130310695985, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.0002077044160011301, + "loss": 0.0138, "step": 121960 }, { - "epoch": 1.32, - "learning_rate": 0.00010221508724135693, - "loss": 0.0108, + "epoch": 0.62, + "learning_rate": 0.00020769684830811608, + "loss": 0.0137, "step": 121970 }, { - "epoch": 1.32, - "learning_rate": 0.00010219887137575404, - "loss": 0.0103, + "epoch": 0.62, + "learning_rate": 0.00020768928061510206, + "loss": 0.0126, "step": 121980 }, { - "epoch": 1.32, - "learning_rate": 0.00010218265551015112, - "loss": 0.0097, + "epoch": 0.62, + "learning_rate": 0.00020768171292208807, + "loss": 0.0138, "step": 121990 }, { - "epoch": 1.32, - "learning_rate": 0.00010216643964454822, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.00020767414522907405, + "loss": 0.0116, "step": 122000 }, { - "epoch": 1.32, - "eval_cer": 0.9215382263475072, - "eval_loss": 0.007727743126451969, - "eval_runtime": 121.0265, - "eval_samples_per_second": 16.525, - "eval_steps_per_second": 4.131, + "epoch": 0.62, + "eval_cer": 0.9145071309559275, + "eval_loss": 0.010251490399241447, + "eval_runtime": 116.7533, + "eval_samples_per_second": 17.13, + "eval_steps_per_second": 4.283, "step": 122000 }, { - "epoch": 1.32, - "learning_rate": 0.0001021502237789453, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020766657753606003, + "loss": 0.0127, "step": 122010 }, { - "epoch": 1.32, - "learning_rate": 0.00010213400791334241, - "loss": 0.0106, + "epoch": 0.62, + "learning_rate": 0.00020765900984304604, + "loss": 0.0129, "step": 122020 }, { - "epoch": 1.32, - "learning_rate": 0.0001021177920477395, - "loss": 0.0115, + "epoch": 0.62, + "learning_rate": 0.00020765144215003202, + "loss": 0.0125, "step": 122030 }, { - "epoch": 1.32, - "learning_rate": 0.00010210157618213659, - "loss": 0.0096, + "epoch": 0.62, + "learning_rate": 0.000207643874457018, + "loss": 0.0144, "step": 122040 }, { - "epoch": 1.32, - "learning_rate": 0.00010208536031653369, - "loss": 0.0069, + "epoch": 0.62, + "learning_rate": 0.000207636306764004, + "loss": 0.0132, "step": 122050 }, { - "epoch": 1.32, - "learning_rate": 0.00010206914445093078, - "loss": 0.013, + "epoch": 0.62, + "learning_rate": 0.00020762873907099, + "loss": 0.0163, "step": 122060 }, { - "epoch": 1.32, - "learning_rate": 0.00010205292858532787, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020762117137797598, + "loss": 0.0123, "step": 122070 }, { - "epoch": 1.32, - "learning_rate": 0.00010203671271972498, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020761360368496198, + "loss": 0.0163, "step": 122080 }, { - "epoch": 1.32, - "learning_rate": 0.00010202049685412206, - "loss": 0.0107, + "epoch": 0.62, + "learning_rate": 0.00020760603599194797, + "loss": 0.0137, "step": 122090 }, { - "epoch": 1.32, - "learning_rate": 0.00010200428098851916, - "loss": 0.0108, + "epoch": 0.62, + "learning_rate": 0.00020759846829893395, + "loss": 0.0135, "step": 122100 }, { - "epoch": 1.32, - "learning_rate": 0.00010198806512291624, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020759090060591993, + "loss": 0.0141, "step": 122110 }, { - "epoch": 1.32, - "learning_rate": 0.00010197184925731335, - "loss": 0.0098, + "epoch": 0.62, + "learning_rate": 0.00020758333291290594, + "loss": 0.0157, "step": 122120 }, { - "epoch": 1.32, - "learning_rate": 0.00010195563339171043, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020757576521989192, + "loss": 0.0123, "step": 122130 }, { - "epoch": 1.32, - "learning_rate": 0.00010193941752610753, - "loss": 0.0097, + "epoch": 0.62, + "learning_rate": 0.0002075681975268779, + "loss": 0.0138, "step": 122140 }, { - "epoch": 1.32, - "learning_rate": 0.00010192320166050463, - "loss": 0.0078, + "epoch": 0.62, + "learning_rate": 0.0002075606298338639, + "loss": 0.0136, "step": 122150 }, { - "epoch": 1.32, - "learning_rate": 0.00010190698579490172, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.0002075530621408499, + "loss": 0.0135, "step": 122160 }, { - "epoch": 1.32, - "learning_rate": 0.00010189076992929881, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020754549444783587, + "loss": 0.0155, "step": 122170 }, { - "epoch": 1.32, - "learning_rate": 0.00010187455406369592, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020753792675482188, + "loss": 0.0187, "step": 122180 }, { - "epoch": 1.32, - "learning_rate": 0.000101858338198093, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020753035906180786, + "loss": 0.0157, "step": 122190 }, { - "epoch": 1.32, - "learning_rate": 0.0001018421223324901, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.00020752279136879384, + "loss": 0.0145, "step": 122200 }, { - "epoch": 1.32, - "learning_rate": 0.00010182590646688718, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020751522367577985, + "loss": 0.0169, "step": 122210 }, { - "epoch": 1.32, - "learning_rate": 0.00010180969060128429, - "loss": 0.0114, + "epoch": 0.62, + "learning_rate": 0.00020750765598276583, + "loss": 0.0125, "step": 122220 }, { - "epoch": 1.32, - "learning_rate": 0.00010179347473568137, - "loss": 0.0118, + "epoch": 0.62, + "learning_rate": 0.00020750008828975181, + "loss": 0.0133, "step": 122230 }, { - "epoch": 1.32, - "learning_rate": 0.00010177725887007847, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.00020749252059673782, + "loss": 0.0157, "step": 122240 }, { - "epoch": 1.32, - "learning_rate": 0.00010176104300447557, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.0002074849529037238, + "loss": 0.0152, "step": 122250 }, { - "epoch": 1.32, - "learning_rate": 0.00010174482713887266, - "loss": 0.0106, + "epoch": 0.62, + "learning_rate": 0.00020747738521070979, + "loss": 0.0164, "step": 122260 }, { - "epoch": 1.32, - "learning_rate": 0.00010172861127326975, - "loss": 0.0078, + "epoch": 0.62, + "learning_rate": 0.00020746981751769577, + "loss": 0.014, "step": 122270 }, { - "epoch": 1.32, - "learning_rate": 0.00010171239540766685, - "loss": 0.0107, + "epoch": 0.62, + "learning_rate": 0.00020746224982468178, + "loss": 0.0145, "step": 122280 }, { - "epoch": 1.32, - "learning_rate": 0.00010169617954206395, - "loss": 0.0071, + "epoch": 0.62, + "learning_rate": 0.00020745468213166776, + "loss": 0.0139, "step": 122290 }, { - "epoch": 1.32, - "learning_rate": 0.00010167996367646104, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.00020744711443865374, + "loss": 0.0148, "step": 122300 }, { - "epoch": 1.32, - "learning_rate": 0.00010166374781085814, - "loss": 0.0068, + "epoch": 0.62, + "learning_rate": 0.00020743954674563975, + "loss": 0.0156, "step": 122310 }, { - "epoch": 1.32, - "learning_rate": 0.00010164753194525523, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020743197905262573, + "loss": 0.0123, "step": 122320 }, { - "epoch": 1.32, - "learning_rate": 0.00010163131607965234, - "loss": 0.0074, + "epoch": 0.62, + "learning_rate": 0.0002074244113596117, + "loss": 0.0146, "step": 122330 }, { - "epoch": 1.32, - "learning_rate": 0.00010161510021404942, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.00020741684366659772, + "loss": 0.011, "step": 122340 }, { - "epoch": 1.32, - "learning_rate": 0.00010159888434844652, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.0002074092759735837, + "loss": 0.012, "step": 122350 }, { - "epoch": 1.32, - "learning_rate": 0.0001015826684828436, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020740170828056968, + "loss": 0.0123, "step": 122360 }, { - "epoch": 1.32, - "learning_rate": 0.00010156645261724071, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.0002073941405875557, + "loss": 0.0145, "step": 122370 }, { - "epoch": 1.32, - "learning_rate": 0.00010155023675163779, - "loss": 0.0072, + "epoch": 0.62, + "learning_rate": 0.00020738657289454167, + "loss": 0.0435, "step": 122380 }, { - "epoch": 1.32, - "learning_rate": 0.00010153402088603489, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.00020737900520152765, + "loss": 0.0144, "step": 122390 }, { - "epoch": 1.32, - "learning_rate": 0.00010151780502043199, - "loss": 0.0101, + "epoch": 0.62, + "learning_rate": 0.00020737143750851366, + "loss": 0.015, "step": 122400 }, { - "epoch": 1.32, - "learning_rate": 0.00010150158915482908, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.00020736386981549964, + "loss": 0.0163, "step": 122410 }, { - "epoch": 1.32, - "learning_rate": 0.00010148537328922617, - "loss": 0.011, + "epoch": 0.62, + "learning_rate": 0.00020735630212248562, + "loss": 0.0156, "step": 122420 }, { - "epoch": 1.32, - "learning_rate": 0.00010146915742362326, - "loss": 0.0124, + "epoch": 0.62, + "learning_rate": 0.00020734873442947163, + "loss": 0.0174, "step": 122430 }, { - "epoch": 1.32, - "learning_rate": 0.00010145294155802036, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020734116673645761, + "loss": 0.0168, "step": 122440 }, { - "epoch": 1.32, - "learning_rate": 0.00010143672569241746, - "loss": 0.0101, + "epoch": 0.62, + "learning_rate": 0.0002073335990434436, + "loss": 0.0173, "step": 122450 }, { - "epoch": 1.32, - "learning_rate": 0.00010142050982681454, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020732603135042958, + "loss": 0.0157, "step": 122460 }, { - "epoch": 1.32, - "learning_rate": 0.00010140429396121165, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020731846365741559, + "loss": 0.013, "step": 122470 }, { - "epoch": 1.32, - "learning_rate": 0.00010138807809560873, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.00020731089596440157, + "loss": 0.0131, "step": 122480 }, { - "epoch": 1.32, - "learning_rate": 0.00010137186223000583, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020730332827138755, + "loss": 0.0142, "step": 122490 }, { - "epoch": 1.32, - "learning_rate": 0.00010135564636440293, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020729576057837356, + "loss": 0.0159, "step": 122500 }, { - "epoch": 1.32, - "learning_rate": 0.00010133943049880002, - "loss": 0.0072, + "epoch": 0.62, + "learning_rate": 0.00020728819288535954, + "loss": 0.0119, "step": 122510 }, { - "epoch": 1.32, - "learning_rate": 0.00010132321463319711, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020728062519234552, + "loss": 0.0148, "step": 122520 }, { - "epoch": 1.32, - "learning_rate": 0.0001013069987675942, - "loss": 0.0111, + "epoch": 0.62, + "learning_rate": 0.00020727305749933153, + "loss": 0.0173, "step": 122530 }, { - "epoch": 1.32, - "learning_rate": 0.0001012907829019913, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.0002072654898063175, + "loss": 0.0134, "step": 122540 }, { - "epoch": 1.32, - "learning_rate": 0.0001012745670363884, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020725792211330346, + "loss": 0.0196, "step": 122550 }, { - "epoch": 1.32, - "learning_rate": 0.00010125835117078548, - "loss": 0.0124, + "epoch": 0.62, + "learning_rate": 0.00020725035442028945, + "loss": 0.0138, "step": 122560 }, { - "epoch": 1.33, - "learning_rate": 0.00010124213530518259, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.00020724278672727545, + "loss": 0.014, "step": 122570 }, { - "epoch": 1.33, - "learning_rate": 0.00010122591943957967, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020723521903426144, + "loss": 0.0147, "step": 122580 }, { - "epoch": 1.33, - "learning_rate": 0.00010120970357397678, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020722765134124742, + "loss": 0.0126, "step": 122590 }, { - "epoch": 1.33, - "learning_rate": 0.00010119348770837385, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.00020722008364823343, + "loss": 0.013, "step": 122600 }, { - "epoch": 1.33, - "learning_rate": 0.00010117727184277096, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.0002072125159552194, + "loss": 0.0132, "step": 122610 }, { - "epoch": 1.33, - "learning_rate": 0.00010116105597716805, - "loss": 0.0109, + "epoch": 0.62, + "learning_rate": 0.0002072049482622054, + "loss": 0.0158, "step": 122620 }, { - "epoch": 1.33, - "learning_rate": 0.00010114484011156515, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.0002071973805691914, + "loss": 0.0161, "step": 122630 }, { - "epoch": 1.33, - "learning_rate": 0.00010112862424596224, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.00020718981287617738, + "loss": 0.0117, "step": 122640 }, { - "epoch": 1.33, - "learning_rate": 0.00010111240838035935, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020718224518316336, + "loss": 0.0157, "step": 122650 }, { - "epoch": 1.33, - "learning_rate": 0.00010109619251475642, - "loss": 0.0135, + "epoch": 0.62, + "learning_rate": 0.00020717467749014934, + "loss": 0.0152, "step": 122660 }, { - "epoch": 1.33, - "learning_rate": 0.00010107997664915353, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020716710979713535, + "loss": 0.0143, "step": 122670 }, { - "epoch": 1.33, - "learning_rate": 0.00010106376078355061, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020715954210412133, + "loss": 0.0175, "step": 122680 }, { - "epoch": 1.33, - "learning_rate": 0.00010104754491794772, - "loss": 0.0118, + "epoch": 0.62, + "learning_rate": 0.0002071519744111073, + "loss": 0.0141, "step": 122690 }, { - "epoch": 1.33, - "learning_rate": 0.0001010313290523448, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.00020714440671809332, + "loss": 0.0143, "step": 122700 }, { - "epoch": 1.33, - "learning_rate": 0.0001010151131867419, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.0002071368390250793, + "loss": 0.0162, "step": 122710 }, { - "epoch": 1.33, - "learning_rate": 0.000100998897321139, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020712927133206528, + "loss": 0.018, "step": 122720 }, { - "epoch": 1.33, - "learning_rate": 0.00010098268145553609, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.0002071217036390513, + "loss": 0.013, "step": 122730 }, { - "epoch": 1.33, - "learning_rate": 0.00010096646558993318, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.00020711413594603727, + "loss": 0.017, "step": 122740 }, { - "epoch": 1.33, - "learning_rate": 0.00010095024972433027, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.00020710656825302326, + "loss": 0.0204, "step": 122750 }, { - "epoch": 1.33, - "learning_rate": 0.00010093403385872737, - "loss": 0.0112, + "epoch": 0.62, + "learning_rate": 0.00020709900056000926, + "loss": 0.0187, "step": 122760 }, { - "epoch": 1.33, - "learning_rate": 0.00010091781799312447, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020709143286699525, + "loss": 0.0143, "step": 122770 }, { - "epoch": 1.33, - "learning_rate": 0.00010090160212752155, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020708386517398123, + "loss": 0.0157, "step": 122780 }, { - "epoch": 1.33, - "learning_rate": 0.00010088538626191866, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020707629748096724, + "loss": 0.014, "step": 122790 }, { - "epoch": 1.33, - "learning_rate": 0.00010086917039631574, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.00020706872978795322, + "loss": 0.0141, "step": 122800 }, { - "epoch": 1.33, - "learning_rate": 0.00010085295453071284, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.0002070611620949392, + "loss": 0.0142, "step": 122810 }, { - "epoch": 1.33, - "learning_rate": 0.00010083673866510994, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.0002070535944019252, + "loss": 0.0147, "step": 122820 }, { - "epoch": 1.33, - "learning_rate": 0.00010082052279950703, - "loss": 0.0083, + "epoch": 0.62, + "learning_rate": 0.0002070460267089112, + "loss": 0.0161, "step": 122830 }, { - "epoch": 1.33, - "learning_rate": 0.00010080430693390412, - "loss": 0.0104, + "epoch": 0.62, + "learning_rate": 0.00020703845901589717, + "loss": 0.0122, "step": 122840 }, { - "epoch": 1.33, - "learning_rate": 0.00010078809106830121, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020703089132288315, + "loss": 0.0147, "step": 122850 }, { - "epoch": 1.33, - "learning_rate": 0.0001007718752026983, - "loss": 0.0104, + "epoch": 0.62, + "learning_rate": 0.00020702332362986916, + "loss": 0.0143, "step": 122860 }, { - "epoch": 1.33, - "learning_rate": 0.00010075565933709541, - "loss": 0.0105, + "epoch": 0.62, + "learning_rate": 0.00020701575593685514, + "loss": 0.0124, "step": 122870 }, { - "epoch": 1.33, - "learning_rate": 0.00010073944347149249, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020700818824384112, + "loss": 0.0143, "step": 122880 }, { - "epoch": 1.33, - "learning_rate": 0.0001007232276058896, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020700062055082713, + "loss": 0.0104, "step": 122890 }, { - "epoch": 1.33, - "learning_rate": 0.00010070701174028668, - "loss": 0.0102, + "epoch": 0.62, + "learning_rate": 0.0002069930528578131, + "loss": 0.014, "step": 122900 }, { - "epoch": 1.33, - "learning_rate": 0.00010069079587468378, - "loss": 0.0116, + "epoch": 0.62, + "learning_rate": 0.0002069854851647991, + "loss": 0.0162, "step": 122910 }, { - "epoch": 1.33, - "learning_rate": 0.00010067458000908086, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.0002069779174717851, + "loss": 0.017, "step": 122920 }, { - "epoch": 1.33, - "learning_rate": 0.00010065836414347797, - "loss": 0.0104, + "epoch": 0.62, + "learning_rate": 0.00020697034977877108, + "loss": 0.0131, "step": 122930 }, { - "epoch": 1.33, - "learning_rate": 0.00010064214827787506, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020696278208575707, + "loss": 0.0142, "step": 122940 }, { - "epoch": 1.33, - "learning_rate": 0.00010062593241227215, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020695521439274307, + "loss": 0.0143, "step": 122950 }, { - "epoch": 1.33, - "learning_rate": 0.00010060971654666925, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020694764669972906, + "loss": 0.0151, "step": 122960 }, { - "epoch": 1.33, - "learning_rate": 0.00010059350068106635, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020694007900671504, + "loss": 0.0127, "step": 122970 }, { - "epoch": 1.33, - "learning_rate": 0.00010057728481546343, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.00020693251131370105, + "loss": 0.0159, "step": 122980 }, { - "epoch": 1.33, - "learning_rate": 0.00010056106894986054, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.00020692494362068703, + "loss": 0.0124, "step": 122990 }, { - "epoch": 1.33, - "learning_rate": 0.00010054485308425762, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.000206917375927673, + "loss": 0.0134, "step": 123000 }, { - "epoch": 1.33, - "eval_cer": 0.9215703646568931, - "eval_loss": 0.007654594257473946, - "eval_runtime": 121.0821, - "eval_samples_per_second": 16.518, - "eval_steps_per_second": 4.129, + "epoch": 0.62, + "eval_cer": 0.9144566703574066, + "eval_loss": 0.010365525260567665, + "eval_runtime": 116.8218, + "eval_samples_per_second": 17.12, + "eval_steps_per_second": 4.28, "step": 123000 }, { - "epoch": 1.33, - "learning_rate": 0.00010052863721865472, - "loss": 0.0111, + "epoch": 0.62, + "learning_rate": 0.000206909808234659, + "loss": 0.0145, "step": 123010 }, { - "epoch": 1.33, - "learning_rate": 0.00010051242135305183, - "loss": 0.0112, + "epoch": 0.62, + "learning_rate": 0.000206902240541645, + "loss": 0.0131, "step": 123020 }, { - "epoch": 1.33, - "learning_rate": 0.00010049620548744891, - "loss": 0.0136, + "epoch": 0.62, + "learning_rate": 0.00020689467284863098, + "loss": 0.0168, "step": 123030 }, { - "epoch": 1.33, - "learning_rate": 0.00010047998962184602, - "loss": 0.0105, + "epoch": 0.62, + "learning_rate": 0.00020688710515561696, + "loss": 0.016, "step": 123040 }, { - "epoch": 1.33, - "learning_rate": 0.0001004637737562431, - "loss": 0.006, + "epoch": 0.62, + "learning_rate": 0.00020687953746260297, + "loss": 0.0169, "step": 123050 }, { - "epoch": 1.33, - "learning_rate": 0.0001004475578906402, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.00020687196976958895, + "loss": 0.0119, "step": 123060 }, { - "epoch": 1.33, - "learning_rate": 0.00010043134202503728, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.00020686440207657493, + "loss": 0.0143, "step": 123070 }, { - "epoch": 1.33, - "learning_rate": 0.00010041512615943439, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020685683438356094, + "loss": 0.0136, "step": 123080 }, { - "epoch": 1.33, - "learning_rate": 0.00010039891029383148, - "loss": 0.0114, + "epoch": 0.62, + "learning_rate": 0.00020684926669054692, + "loss": 0.0125, "step": 123090 }, { - "epoch": 1.33, - "learning_rate": 0.00010038269442822857, - "loss": 0.0102, + "epoch": 0.62, + "learning_rate": 0.0002068416989975329, + "loss": 0.0148, "step": 123100 }, { - "epoch": 1.33, - "learning_rate": 0.00010036647856262567, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.0002068341313045189, + "loss": 0.0182, "step": 123110 }, { - "epoch": 1.33, - "learning_rate": 0.00010035026269702277, - "loss": 0.0066, + "epoch": 0.62, + "learning_rate": 0.0002068265636115049, + "loss": 0.0126, "step": 123120 }, { - "epoch": 1.33, - "learning_rate": 0.00010033404683141985, - "loss": 0.0091, + "epoch": 0.62, + "learning_rate": 0.00020681899591849088, + "loss": 0.0186, "step": 123130 }, { - "epoch": 1.33, - "learning_rate": 0.00010031783096581696, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.00020681142822547688, + "loss": 0.015, "step": 123140 }, { - "epoch": 1.33, - "learning_rate": 0.00010030161510021404, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.00020680386053246287, + "loss": 0.0183, "step": 123150 }, { - "epoch": 1.33, - "learning_rate": 0.00010028539923461114, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020679629283944885, + "loss": 0.0152, "step": 123160 }, { - "epoch": 1.33, - "learning_rate": 0.00010026918336900822, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.00020678872514643483, + "loss": 0.0167, "step": 123170 }, { - "epoch": 1.33, - "learning_rate": 0.00010025296750340533, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020678115745342084, + "loss": 0.0172, "step": 123180 }, { - "epoch": 1.33, - "learning_rate": 0.00010023675163780242, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020677358976040682, + "loss": 0.0158, "step": 123190 }, { - "epoch": 1.33, - "learning_rate": 0.00010022053577219951, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.0002067660220673928, + "loss": 0.0166, "step": 123200 }, { - "epoch": 1.33, - "learning_rate": 0.0001002043199065966, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.0002067584543743788, + "loss": 0.0189, "step": 123210 }, { - "epoch": 1.33, - "learning_rate": 0.0001001881040409937, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.0002067508866813648, + "loss": 0.0145, "step": 123220 }, { - "epoch": 1.33, - "learning_rate": 0.00010017188817539079, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.00020674331898835077, + "loss": 0.0174, "step": 123230 }, { - "epoch": 1.33, - "learning_rate": 0.0001001556723097879, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.00020673575129533678, + "loss": 0.0134, "step": 123240 }, { - "epoch": 1.33, - "learning_rate": 0.00010013945644418498, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.00020672818360232276, + "loss": 0.0143, "step": 123250 }, { - "epoch": 1.33, - "learning_rate": 0.00010012324057858208, - "loss": 0.0112, + "epoch": 0.62, + "learning_rate": 0.00020672061590930874, + "loss": 0.0149, "step": 123260 }, { - "epoch": 1.33, - "learning_rate": 0.00010010702471297916, - "loss": 0.0068, + "epoch": 0.62, + "learning_rate": 0.00020671304821629475, + "loss": 0.0132, "step": 123270 }, { - "epoch": 1.33, - "learning_rate": 0.00010009080884737627, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020670548052328073, + "loss": 0.0122, "step": 123280 }, { - "epoch": 1.33, - "learning_rate": 0.00010007459298177335, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.00020669791283026671, + "loss": 0.0134, "step": 123290 }, { - "epoch": 1.33, - "learning_rate": 0.00010005837711617045, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.00020669034513725272, + "loss": 0.0132, "step": 123300 }, { - "epoch": 1.33, - "learning_rate": 0.00010004216125056755, - "loss": 0.0101, + "epoch": 0.62, + "learning_rate": 0.0002066827774442387, + "loss": 0.0129, "step": 123310 }, { - "epoch": 1.33, - "learning_rate": 0.00010002594538496464, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.00020667520975122469, + "loss": 0.0147, "step": 123320 }, { - "epoch": 1.33, - "learning_rate": 0.00010000972951936173, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.0002066676420582107, + "loss": 0.0126, "step": 123330 }, { - "epoch": 1.33, - "learning_rate": 9.999351365375884e-05, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020666007436519668, + "loss": 0.0118, "step": 123340 }, { - "epoch": 1.33, - "learning_rate": 9.997729778815592e-05, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.00020665250667218266, + "loss": 0.0151, "step": 123350 }, { - "epoch": 1.33, - "learning_rate": 9.996108192255302e-05, - "loss": 0.0071, + "epoch": 0.62, + "learning_rate": 0.00020664493897916864, + "loss": 0.0155, "step": 123360 }, { - "epoch": 1.33, - "learning_rate": 9.99448660569501e-05, - "loss": 0.0097, + "epoch": 0.62, + "learning_rate": 0.00020663737128615465, + "loss": 0.0147, "step": 123370 }, { - "epoch": 1.33, - "learning_rate": 9.992865019134721e-05, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020662980359314063, + "loss": 0.0131, "step": 123380 }, { - "epoch": 1.33, - "learning_rate": 9.991243432574429e-05, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.0002066222359001266, + "loss": 0.0148, "step": 123390 }, { - "epoch": 1.33, - "learning_rate": 9.98962184601414e-05, - "loss": 0.0107, + "epoch": 0.62, + "learning_rate": 0.00020661466820711262, + "loss": 0.0121, "step": 123400 }, { - "epoch": 1.33, - "learning_rate": 9.988000259453849e-05, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.0002066071005140986, + "loss": 0.0143, "step": 123410 }, { - "epoch": 1.33, - "learning_rate": 9.986378672893558e-05, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.00020659953282108458, + "loss": 0.0121, "step": 123420 }, { - "epoch": 1.33, - "learning_rate": 9.984757086333267e-05, - "loss": 0.0116, + "epoch": 0.62, + "learning_rate": 0.0002065919651280706, + "loss": 0.0118, "step": 123430 }, { - "epoch": 1.33, - "learning_rate": 9.983135499772977e-05, - "loss": 0.0065, + "epoch": 0.62, + "learning_rate": 0.00020658439743505657, + "loss": 0.0133, "step": 123440 }, { - "epoch": 1.33, - "learning_rate": 9.981513913212686e-05, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020657682974204255, + "loss": 0.011, "step": 123450 }, { - "epoch": 1.33, - "learning_rate": 9.979892326652397e-05, - "loss": 0.0102, + "epoch": 0.62, + "learning_rate": 0.00020656926204902856, + "loss": 0.014, "step": 123460 }, { - "epoch": 1.33, - "learning_rate": 9.978270740092104e-05, - "loss": 0.0062, + "epoch": 0.62, + "learning_rate": 0.00020656169435601454, + "loss": 0.0164, "step": 123470 }, { - "epoch": 1.33, - "learning_rate": 9.976649153531815e-05, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020655412666300052, + "loss": 0.0161, "step": 123480 }, { - "epoch": 1.33, - "learning_rate": 9.975027566971523e-05, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020654655896998653, + "loss": 0.015, "step": 123490 }, { - "epoch": 1.34, - "learning_rate": 9.973405980411234e-05, - "loss": 0.0103, + "epoch": 0.62, + "learning_rate": 0.00020653899127697251, + "loss": 0.0125, "step": 123500 }, { - "epoch": 1.34, - "learning_rate": 9.971784393850943e-05, - "loss": 0.0078, + "epoch": 0.62, + "learning_rate": 0.0002065314235839585, + "loss": 0.0124, "step": 123510 }, { - "epoch": 1.34, - "learning_rate": 9.970162807290652e-05, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020652385589094448, + "loss": 0.014, "step": 123520 }, { - "epoch": 1.34, - "learning_rate": 9.968541220730361e-05, - "loss": 0.0103, + "epoch": 0.62, + "learning_rate": 0.00020651628819793049, + "loss": 0.0137, "step": 123530 }, { - "epoch": 1.34, - "learning_rate": 9.966919634170071e-05, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020650872050491647, + "loss": 0.0161, "step": 123540 }, { - "epoch": 1.34, - "learning_rate": 9.96529804760978e-05, - "loss": 0.0097, + "epoch": 0.62, + "learning_rate": 0.00020650115281190245, + "loss": 0.0128, "step": 123550 }, { - "epoch": 1.34, - "learning_rate": 9.96367646104949e-05, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020649358511888846, + "loss": 0.0125, "step": 123560 }, { - "epoch": 1.34, - "learning_rate": 9.962054874489199e-05, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.00020648601742587444, + "loss": 0.0125, "step": 123570 }, { - "epoch": 1.34, - "learning_rate": 9.960433287928909e-05, - "loss": 0.0097, + "epoch": 0.62, + "learning_rate": 0.00020647844973286042, + "loss": 0.0165, "step": 123580 }, { - "epoch": 1.34, - "learning_rate": 9.958811701368617e-05, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.00020647088203984643, + "loss": 0.0129, "step": 123590 }, { - "epoch": 1.34, - "learning_rate": 9.957190114808328e-05, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.0002064633143468324, + "loss": 0.0127, "step": 123600 }, { - "epoch": 1.34, - "learning_rate": 9.955568528248036e-05, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.0002064557466538184, + "loss": 0.0133, "step": 123610 }, { - "epoch": 1.34, - "learning_rate": 9.953946941687746e-05, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.0002064481789608044, + "loss": 0.0152, "step": 123620 }, { - "epoch": 1.34, - "learning_rate": 9.952325355127456e-05, - "loss": 0.0106, + "epoch": 0.62, + "learning_rate": 0.00020644061126779038, + "loss": 0.0143, "step": 123630 }, { - "epoch": 1.34, - "learning_rate": 9.950703768567165e-05, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020643304357477636, + "loss": 0.0128, "step": 123640 }, { - "epoch": 1.34, - "learning_rate": 9.949082182006874e-05, - "loss": 0.0105, + "epoch": 0.62, + "learning_rate": 0.00020642547588176237, + "loss": 0.0133, "step": 123650 }, { - "epoch": 1.34, - "learning_rate": 9.947460595446585e-05, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020641790818874835, + "loss": 0.0152, "step": 123660 }, { - "epoch": 1.34, - "learning_rate": 9.945839008886293e-05, - "loss": 0.0083, + "epoch": 0.62, + "learning_rate": 0.00020641034049573433, + "loss": 0.0143, "step": 123670 }, { - "epoch": 1.34, - "learning_rate": 9.944217422326003e-05, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020640277280272032, + "loss": 0.014, "step": 123680 }, { - "epoch": 1.34, - "learning_rate": 9.942595835765711e-05, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020639520510970632, + "loss": 0.0123, "step": 123690 }, { - "epoch": 1.34, - "learning_rate": 9.940974249205422e-05, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.0002063876374166923, + "loss": 0.0147, "step": 123700 }, { - "epoch": 1.34, - "learning_rate": 9.93935266264513e-05, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.0002063800697236783, + "loss": 0.016, "step": 123710 }, { - "epoch": 1.34, - "learning_rate": 9.93773107608484e-05, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.0002063725020306643, + "loss": 0.0119, "step": 123720 }, { - "epoch": 1.34, - "learning_rate": 9.936109489524551e-05, - "loss": 0.0104, + "epoch": 0.62, + "learning_rate": 0.00020636493433765028, + "loss": 0.015, "step": 123730 }, { - "epoch": 1.34, - "learning_rate": 9.934487902964259e-05, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.00020635736664463626, + "loss": 0.0141, "step": 123740 }, { - "epoch": 1.34, - "learning_rate": 9.93286631640397e-05, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.00020634979895162227, + "loss": 0.0183, "step": 123750 }, { - "epoch": 1.34, - "learning_rate": 9.931244729843678e-05, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.00020634223125860825, + "loss": 0.0192, "step": 123760 }, { - "epoch": 1.34, - "learning_rate": 9.929623143283388e-05, - "loss": 0.007, + "epoch": 0.62, + "learning_rate": 0.00020633466356559423, + "loss": 0.0139, "step": 123770 }, { - "epoch": 1.34, - "learning_rate": 9.928001556723097e-05, - "loss": 0.0102, + "epoch": 0.62, + "learning_rate": 0.00020632709587258024, + "loss": 0.0143, "step": 123780 }, { - "epoch": 1.34, - "learning_rate": 9.926379970162807e-05, - "loss": 0.0074, + "epoch": 0.62, + "learning_rate": 0.00020631952817956622, + "loss": 0.0165, "step": 123790 }, { - "epoch": 1.34, - "learning_rate": 9.924758383602516e-05, - "loss": 0.0136, + "epoch": 0.62, + "learning_rate": 0.0002063119604865522, + "loss": 0.0146, "step": 123800 }, { - "epoch": 1.34, - "learning_rate": 9.923136797042227e-05, - "loss": 0.0096, + "epoch": 0.62, + "learning_rate": 0.00020630439279353816, + "loss": 0.0111, "step": 123810 }, { - "epoch": 1.34, - "learning_rate": 9.921515210481935e-05, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020629682510052416, + "loss": 0.0121, "step": 123820 }, { - "epoch": 1.34, - "learning_rate": 9.919893623921645e-05, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.00020628925740751015, + "loss": 0.0158, "step": 123830 }, { - "epoch": 1.34, - "learning_rate": 9.918272037361353e-05, - "loss": 0.0119, + "epoch": 0.62, + "learning_rate": 0.00020628168971449613, + "loss": 0.0139, "step": 123840 }, { - "epoch": 1.34, - "learning_rate": 9.916650450801064e-05, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020627412202148214, + "loss": 0.0149, "step": 123850 }, { - "epoch": 1.34, - "learning_rate": 9.915028864240772e-05, - "loss": 0.0107, + "epoch": 0.62, + "learning_rate": 0.00020626655432846812, + "loss": 0.0138, "step": 123860 }, { - "epoch": 1.34, - "learning_rate": 9.913407277680482e-05, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.0002062589866354541, + "loss": 0.0158, "step": 123870 }, { - "epoch": 1.34, - "learning_rate": 9.911785691120192e-05, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.0002062514189424401, + "loss": 0.0114, "step": 123880 }, { - "epoch": 1.34, - "learning_rate": 9.910164104559901e-05, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.0002062438512494261, + "loss": 0.0118, "step": 123890 }, { - "epoch": 1.34, - "learning_rate": 9.90854251799961e-05, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020623628355641207, + "loss": 0.0163, "step": 123900 }, { - "epoch": 1.34, - "learning_rate": 9.90692093143932e-05, - "loss": 0.0073, + "epoch": 0.63, + "learning_rate": 0.00020622871586339805, + "loss": 0.0161, "step": 123910 }, { - "epoch": 1.34, - "learning_rate": 9.905299344879029e-05, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020622114817038406, + "loss": 0.0138, "step": 123920 }, { - "epoch": 1.34, - "learning_rate": 9.903677758318739e-05, - "loss": 0.0109, + "epoch": 0.63, + "learning_rate": 0.00020621358047737004, + "loss": 0.0166, "step": 123930 }, { - "epoch": 1.34, - "learning_rate": 9.902056171758447e-05, - "loss": 0.0109, + "epoch": 0.63, + "learning_rate": 0.00020620601278435602, + "loss": 0.0141, "step": 123940 }, { - "epoch": 1.34, - "learning_rate": 9.900434585198158e-05, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.00020619844509134203, + "loss": 0.0147, "step": 123950 }, { - "epoch": 1.34, - "learning_rate": 9.898812998637866e-05, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.000206190877398328, + "loss": 0.0161, "step": 123960 }, { - "epoch": 1.34, - "learning_rate": 9.897191412077576e-05, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.000206183309705314, + "loss": 0.0162, "step": 123970 }, { - "epoch": 1.34, - "learning_rate": 9.895569825517286e-05, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.0002061757420123, + "loss": 0.0101, "step": 123980 }, { - "epoch": 1.34, - "learning_rate": 9.893948238956995e-05, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020616817431928598, + "loss": 0.0125, "step": 123990 }, { - "epoch": 1.34, - "learning_rate": 9.892326652396704e-05, - "loss": 0.0105, + "epoch": 0.63, + "learning_rate": 0.00020616060662627197, + "loss": 0.0134, "step": 124000 }, { - "epoch": 1.34, - "eval_cer": 0.9215547298036784, - "eval_loss": 0.0075076548382639885, - "eval_runtime": 121.2801, - "eval_samples_per_second": 16.491, - "eval_steps_per_second": 4.123, + "epoch": 0.63, + "eval_cer": 0.9144877230334195, + "eval_loss": 0.010582580231130123, + "eval_runtime": 116.7375, + "eval_samples_per_second": 17.132, + "eval_steps_per_second": 4.283, "step": 124000 }, { - "epoch": 1.34, - "learning_rate": 9.890705065836413e-05, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.00020615303893325797, + "loss": 0.0157, "step": 124010 }, { - "epoch": 1.34, - "learning_rate": 9.889083479276123e-05, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020614547124024396, + "loss": 0.0124, "step": 124020 }, { - "epoch": 1.34, - "learning_rate": 9.887461892715833e-05, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.00020613790354722994, + "loss": 0.0161, "step": 124030 }, { - "epoch": 1.34, - "learning_rate": 9.885840306155541e-05, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.00020613033585421595, + "loss": 0.0163, "step": 124040 }, { - "epoch": 1.34, - "learning_rate": 9.884218719595252e-05, - "loss": 0.0071, + "epoch": 0.63, + "learning_rate": 0.00020612276816120193, + "loss": 0.0119, "step": 124050 }, { - "epoch": 1.34, - "learning_rate": 9.88259713303496e-05, - "loss": 0.0106, + "epoch": 0.63, + "learning_rate": 0.0002061152004681879, + "loss": 0.0167, "step": 124060 }, { - "epoch": 1.34, - "learning_rate": 9.88097554647467e-05, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.0002061076327751739, + "loss": 0.0129, "step": 124070 }, { - "epoch": 1.34, - "learning_rate": 9.879353959914378e-05, - "loss": 0.0104, + "epoch": 0.63, + "learning_rate": 0.0002061000650821599, + "loss": 0.0137, "step": 124080 }, { - "epoch": 1.34, - "learning_rate": 9.877732373354089e-05, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.00020609249738914588, + "loss": 0.0138, "step": 124090 }, { - "epoch": 1.34, - "learning_rate": 9.876110786793798e-05, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.00020608492969613186, + "loss": 0.0148, "step": 124100 }, { - "epoch": 1.34, - "learning_rate": 9.874489200233508e-05, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020607736200311787, + "loss": 0.0134, "step": 124110 }, { - "epoch": 1.34, - "learning_rate": 9.872867613673217e-05, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020606979431010385, + "loss": 0.0143, "step": 124120 }, { - "epoch": 1.34, - "learning_rate": 9.871246027112927e-05, - "loss": 0.0097, + "epoch": 0.63, + "learning_rate": 0.00020606222661708983, + "loss": 0.0169, "step": 124130 }, { - "epoch": 1.34, - "learning_rate": 9.869624440552635e-05, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.00020605465892407584, + "loss": 0.0122, "step": 124140 }, { - "epoch": 1.34, - "learning_rate": 9.868002853992346e-05, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020604709123106182, + "loss": 0.0155, "step": 124150 }, { - "epoch": 1.34, - "learning_rate": 9.866381267432054e-05, - "loss": 0.0108, + "epoch": 0.63, + "learning_rate": 0.0002060395235380478, + "loss": 0.0132, "step": 124160 }, { - "epoch": 1.34, - "learning_rate": 9.864759680871765e-05, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.0002060319558450338, + "loss": 0.0157, "step": 124170 }, { - "epoch": 1.34, - "learning_rate": 9.863138094311472e-05, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.0002060243881520198, + "loss": 0.0148, "step": 124180 }, { - "epoch": 1.34, - "learning_rate": 9.861516507751183e-05, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.00020601682045900578, + "loss": 0.0143, "step": 124190 }, { - "epoch": 1.34, - "learning_rate": 9.859894921190892e-05, - "loss": 0.012, + "epoch": 0.63, + "learning_rate": 0.00020600925276599178, + "loss": 0.0121, "step": 124200 }, { - "epoch": 1.34, - "learning_rate": 9.858273334630602e-05, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.00020600168507297777, + "loss": 0.0146, "step": 124210 }, { - "epoch": 1.34, - "learning_rate": 9.856651748070311e-05, - "loss": 0.0119, + "epoch": 0.63, + "learning_rate": 0.00020599411737996375, + "loss": 0.0146, "step": 124220 }, { - "epoch": 1.34, - "learning_rate": 9.85503016151002e-05, - "loss": 0.0124, + "epoch": 0.63, + "learning_rate": 0.00020598654968694976, + "loss": 0.014, "step": 124230 }, { - "epoch": 1.34, - "learning_rate": 9.85340857494973e-05, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.00020597898199393574, + "loss": 0.0173, "step": 124240 }, { - "epoch": 1.34, - "learning_rate": 9.85178698838944e-05, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.00020597141430092172, + "loss": 0.0149, "step": 124250 }, { - "epoch": 1.34, - "learning_rate": 9.850165401829148e-05, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.0002059638466079077, + "loss": 0.0125, "step": 124260 }, { - "epoch": 1.34, - "learning_rate": 9.848543815268859e-05, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.0002059562789148937, + "loss": 0.0131, "step": 124270 }, { - "epoch": 1.34, - "learning_rate": 9.846922228708567e-05, - "loss": 0.0102, + "epoch": 0.63, + "learning_rate": 0.0002059487112218797, + "loss": 0.0132, "step": 124280 }, { - "epoch": 1.34, - "learning_rate": 9.845300642148277e-05, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020594114352886567, + "loss": 0.0145, "step": 124290 }, { - "epoch": 1.34, - "learning_rate": 9.843679055587985e-05, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020593357583585168, + "loss": 0.0133, "step": 124300 }, { - "epoch": 1.34, - "learning_rate": 9.842057469027696e-05, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020592600814283766, + "loss": 0.0132, "step": 124310 }, { - "epoch": 1.34, - "learning_rate": 9.840435882467405e-05, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.00020591844044982364, + "loss": 0.0158, "step": 124320 }, { - "epoch": 1.34, - "learning_rate": 9.838814295907114e-05, - "loss": 0.0081, + "epoch": 0.63, + "learning_rate": 0.00020591087275680965, + "loss": 0.0158, "step": 124330 }, { - "epoch": 1.34, - "learning_rate": 9.837192709346824e-05, - "loss": 0.0066, + "epoch": 0.63, + "learning_rate": 0.00020590330506379563, + "loss": 0.0154, "step": 124340 }, { - "epoch": 1.34, - "learning_rate": 9.835571122786534e-05, - "loss": 0.0072, + "epoch": 0.63, + "learning_rate": 0.00020589573737078161, + "loss": 0.0133, "step": 124350 }, { - "epoch": 1.34, - "learning_rate": 9.833949536226242e-05, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020588816967776762, + "loss": 0.0126, "step": 124360 }, { - "epoch": 1.34, - "learning_rate": 9.832327949665953e-05, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.0002058806019847536, + "loss": 0.016, "step": 124370 }, { - "epoch": 1.34, - "learning_rate": 9.83070636310566e-05, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.00020587303429173959, + "loss": 0.0133, "step": 124380 }, { - "epoch": 1.34, - "learning_rate": 9.829084776545371e-05, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.0002058654665987256, + "loss": 0.0157, "step": 124390 }, { - "epoch": 1.34, - "learning_rate": 9.827463189985079e-05, - "loss": 0.0103, + "epoch": 0.63, + "learning_rate": 0.00020585789890571158, + "loss": 0.0272, "step": 124400 }, { - "epoch": 1.34, - "learning_rate": 9.82584160342479e-05, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020585033121269756, + "loss": 0.0157, "step": 124410 }, { - "epoch": 1.35, - "learning_rate": 9.824220016864499e-05, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.00020584276351968354, + "loss": 0.0145, "step": 124420 }, { - "epoch": 1.35, - "learning_rate": 9.822598430304208e-05, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020583519582666955, + "loss": 0.0132, "step": 124430 }, { - "epoch": 1.35, - "learning_rate": 9.820976843743919e-05, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020582762813365553, + "loss": 0.0104, "step": 124440 }, { - "epoch": 1.35, - "learning_rate": 9.819355257183627e-05, - "loss": 0.007, + "epoch": 0.63, + "learning_rate": 0.0002058200604406415, + "loss": 0.0154, "step": 124450 }, { - "epoch": 1.35, - "learning_rate": 9.817733670623338e-05, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020581249274762752, + "loss": 0.0152, "step": 124460 }, { - "epoch": 1.35, - "learning_rate": 9.816112084063047e-05, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.0002058049250546135, + "loss": 0.0136, "step": 124470 }, { - "epoch": 1.35, - "learning_rate": 9.814490497502756e-05, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020579735736159948, + "loss": 0.013, "step": 124480 }, { - "epoch": 1.35, - "learning_rate": 9.812868910942465e-05, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.0002057897896685855, + "loss": 0.0133, "step": 124490 }, { - "epoch": 1.35, - "learning_rate": 9.811247324382176e-05, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.00020578222197557147, + "loss": 0.0135, "step": 124500 }, { - "epoch": 1.35, - "learning_rate": 9.809625737821884e-05, - "loss": 0.0101, + "epoch": 0.63, + "learning_rate": 0.00020577465428255745, + "loss": 0.014, "step": 124510 }, { - "epoch": 1.35, - "learning_rate": 9.808004151261595e-05, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020576708658954346, + "loss": 0.0176, "step": 124520 }, { - "epoch": 1.35, - "learning_rate": 9.806382564701302e-05, - "loss": 0.0067, + "epoch": 0.63, + "learning_rate": 0.00020575951889652944, + "loss": 0.0134, "step": 124530 }, { - "epoch": 1.35, - "learning_rate": 9.804760978141013e-05, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020575195120351542, + "loss": 0.0143, "step": 124540 }, { - "epoch": 1.35, - "learning_rate": 9.803139391580721e-05, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020574438351050143, + "loss": 0.017, "step": 124550 }, { - "epoch": 1.35, - "learning_rate": 9.801517805020432e-05, - "loss": 0.0071, + "epoch": 0.63, + "learning_rate": 0.00020573681581748741, + "loss": 0.0151, "step": 124560 }, { - "epoch": 1.35, - "learning_rate": 9.799896218460141e-05, - "loss": 0.0097, + "epoch": 0.63, + "learning_rate": 0.0002057292481244734, + "loss": 0.0118, "step": 124570 }, { - "epoch": 1.35, - "learning_rate": 9.79827463189985e-05, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020572168043145938, + "loss": 0.014, "step": 124580 }, { - "epoch": 1.35, - "learning_rate": 9.79665304533956e-05, - "loss": 0.007, + "epoch": 0.63, + "learning_rate": 0.00020571411273844539, + "loss": 0.0118, "step": 124590 }, { - "epoch": 1.35, - "learning_rate": 9.795031458779269e-05, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.00020570654504543137, + "loss": 0.0144, "step": 124600 }, { - "epoch": 1.35, - "learning_rate": 9.793409872218978e-05, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.00020569897735241735, + "loss": 0.0149, "step": 124610 }, { - "epoch": 1.35, - "learning_rate": 9.791788285658689e-05, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.00020569140965940336, + "loss": 0.0164, "step": 124620 }, { - "epoch": 1.35, - "learning_rate": 9.790166699098397e-05, - "loss": 0.0109, + "epoch": 0.63, + "learning_rate": 0.00020568384196638934, + "loss": 0.0174, "step": 124630 }, { - "epoch": 1.35, - "learning_rate": 9.788545112538107e-05, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.00020567627427337532, + "loss": 0.0131, "step": 124640 }, { - "epoch": 1.35, - "learning_rate": 9.786923525977815e-05, - "loss": 0.0126, + "epoch": 0.63, + "learning_rate": 0.00020566870658036133, + "loss": 0.0133, "step": 124650 }, { - "epoch": 1.35, - "learning_rate": 9.785301939417526e-05, - "loss": 0.0113, + "epoch": 0.63, + "learning_rate": 0.0002056611388873473, + "loss": 0.0157, "step": 124660 }, { - "epoch": 1.35, - "learning_rate": 9.783680352857235e-05, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.0002056535711943333, + "loss": 0.0131, "step": 124670 }, { - "epoch": 1.35, - "learning_rate": 9.782058766296944e-05, - "loss": 0.0119, + "epoch": 0.63, + "learning_rate": 0.0002056460035013193, + "loss": 0.0143, "step": 124680 }, { - "epoch": 1.35, - "learning_rate": 9.780437179736654e-05, - "loss": 0.01, + "epoch": 0.63, + "learning_rate": 0.00020563843580830528, + "loss": 0.0127, "step": 124690 }, { - "epoch": 1.35, - "learning_rate": 9.778815593176363e-05, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020563086811529126, + "loss": 0.0128, "step": 124700 }, { - "epoch": 1.35, - "learning_rate": 9.777194006616072e-05, - "loss": 0.0132, + "epoch": 0.63, + "learning_rate": 0.00020562330042227727, + "loss": 0.0173, "step": 124710 }, { - "epoch": 1.35, - "learning_rate": 9.775572420055783e-05, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.00020561573272926325, + "loss": 0.0166, "step": 124720 }, { - "epoch": 1.35, - "learning_rate": 9.77395083349549e-05, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.00020560816503624923, + "loss": 0.0147, "step": 124730 }, { - "epoch": 1.35, - "learning_rate": 9.772329246935201e-05, - "loss": 0.0119, + "epoch": 0.63, + "learning_rate": 0.00020560059734323524, + "loss": 0.0121, "step": 124740 }, { - "epoch": 1.35, - "learning_rate": 9.770707660374909e-05, - "loss": 0.0108, + "epoch": 0.63, + "learning_rate": 0.00020559302965022122, + "loss": 0.0116, "step": 124750 }, { - "epoch": 1.35, - "learning_rate": 9.76908607381462e-05, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.0002055854619572072, + "loss": 0.0155, "step": 124760 }, { - "epoch": 1.35, - "learning_rate": 9.767464487254328e-05, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.0002055778942641932, + "loss": 0.0136, "step": 124770 }, { - "epoch": 1.35, - "learning_rate": 9.765842900694038e-05, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.0002055703265711792, + "loss": 0.013, "step": 124780 }, { - "epoch": 1.35, - "learning_rate": 9.764221314133748e-05, - "loss": 0.0102, + "epoch": 0.63, + "learning_rate": 0.00020556275887816518, + "loss": 0.0167, "step": 124790 }, { - "epoch": 1.35, - "learning_rate": 9.762599727573457e-05, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.00020555519118515116, + "loss": 0.0149, "step": 124800 }, { - "epoch": 1.35, - "learning_rate": 9.760978141013166e-05, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020554762349213717, + "loss": 0.0176, "step": 124810 }, { - "epoch": 1.35, - "learning_rate": 9.759356554452877e-05, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.00020554005579912315, + "loss": 0.0127, "step": 124820 }, { - "epoch": 1.35, - "learning_rate": 9.757734967892585e-05, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.00020553248810610913, + "loss": 0.0127, "step": 124830 }, { - "epoch": 1.35, - "learning_rate": 9.756113381332295e-05, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.00020552492041309514, + "loss": 0.0134, "step": 124840 }, { - "epoch": 1.35, - "learning_rate": 9.754491794772003e-05, - "loss": 0.0072, + "epoch": 0.63, + "learning_rate": 0.00020551735272008112, + "loss": 0.0144, "step": 124850 }, { - "epoch": 1.35, - "learning_rate": 9.752870208211714e-05, - "loss": 0.0119, + "epoch": 0.63, + "learning_rate": 0.0002055097850270671, + "loss": 0.0129, "step": 124860 }, { - "epoch": 1.35, - "learning_rate": 9.751248621651422e-05, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.0002055022173340531, + "loss": 0.0165, "step": 124870 }, { - "epoch": 1.35, - "learning_rate": 9.749627035091132e-05, - "loss": 0.0105, + "epoch": 0.63, + "learning_rate": 0.0002054946496410391, + "loss": 0.0154, "step": 124880 }, { - "epoch": 1.35, - "learning_rate": 9.748005448530842e-05, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020548708194802507, + "loss": 0.0165, "step": 124890 }, { - "epoch": 1.35, - "learning_rate": 9.746383861970551e-05, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.00020547951425501108, + "loss": 0.0141, "step": 124900 }, { - "epoch": 1.35, - "learning_rate": 9.74476227541026e-05, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.00020547194656199706, + "loss": 0.0107, "step": 124910 }, { - "epoch": 1.35, - "learning_rate": 9.74314068884997e-05, - "loss": 0.0081, + "epoch": 0.63, + "learning_rate": 0.00020546437886898304, + "loss": 0.0128, "step": 124920 }, { - "epoch": 1.35, - "learning_rate": 9.741519102289679e-05, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020545681117596903, + "loss": 0.0165, "step": 124930 }, { - "epoch": 1.35, - "learning_rate": 9.73989751572939e-05, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020544924348295503, + "loss": 0.0152, "step": 124940 }, { - "epoch": 1.35, - "learning_rate": 9.738275929169097e-05, - "loss": 0.0151, + "epoch": 0.63, + "learning_rate": 0.00020544167578994102, + "loss": 0.0172, "step": 124950 }, { - "epoch": 1.35, - "learning_rate": 9.736654342608808e-05, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.000205434108096927, + "loss": 0.0126, "step": 124960 }, { - "epoch": 1.35, - "learning_rate": 9.735032756048516e-05, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.000205426540403913, + "loss": 0.0121, "step": 124970 }, { - "epoch": 1.35, - "learning_rate": 9.733411169488227e-05, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.000205418972710899, + "loss": 0.0107, "step": 124980 }, { - "epoch": 1.35, - "learning_rate": 9.731789582927936e-05, - "loss": 0.0104, + "epoch": 0.63, + "learning_rate": 0.00020541140501788497, + "loss": 0.0136, "step": 124990 }, { - "epoch": 1.35, - "learning_rate": 9.730167996367645e-05, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020540383732487098, + "loss": 0.0122, "step": 125000 }, { - "epoch": 1.35, - "eval_cer": 0.9215807878923696, - "eval_loss": 0.007421437185257673, - "eval_runtime": 121.2555, - "eval_samples_per_second": 16.494, - "eval_steps_per_second": 4.124, + "epoch": 0.63, + "eval_cer": 0.9144945158062973, + "eval_loss": 0.010605525225400925, + "eval_runtime": 116.7031, + "eval_samples_per_second": 17.138, + "eval_steps_per_second": 4.284, "step": 125000 }, { - "epoch": 1.35, - "learning_rate": 9.728546409807354e-05, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020539626963185696, + "loss": 0.0155, "step": 125010 }, { - "epoch": 1.35, - "learning_rate": 9.726924823247064e-05, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020538870193884294, + "loss": 0.0101, "step": 125020 }, { - "epoch": 1.35, - "learning_rate": 9.725303236686773e-05, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020538113424582895, + "loss": 0.0155, "step": 125030 }, { - "epoch": 1.35, - "learning_rate": 9.723681650126484e-05, - "loss": 0.0114, + "epoch": 0.63, + "learning_rate": 0.00020537356655281493, + "loss": 0.0162, "step": 125040 }, { - "epoch": 1.35, - "learning_rate": 9.722060063566192e-05, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.0002053659988598009, + "loss": 0.0154, "step": 125050 }, { - "epoch": 1.35, - "learning_rate": 9.720438477005902e-05, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.00020535843116678692, + "loss": 0.013, "step": 125060 }, { - "epoch": 1.35, - "learning_rate": 9.71881689044561e-05, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.00020535086347377287, + "loss": 0.0175, "step": 125070 }, { - "epoch": 1.35, - "learning_rate": 9.717195303885321e-05, - "loss": 0.0113, + "epoch": 0.63, + "learning_rate": 0.00020534329578075886, + "loss": 0.0138, "step": 125080 }, { - "epoch": 1.35, - "learning_rate": 9.715573717325029e-05, - "loss": 0.0081, + "epoch": 0.63, + "learning_rate": 0.00020533572808774484, + "loss": 0.0142, "step": 125090 }, { - "epoch": 1.35, - "learning_rate": 9.713952130764739e-05, - "loss": 0.0097, + "epoch": 0.63, + "learning_rate": 0.00020532816039473085, + "loss": 0.0121, "step": 125100 }, { - "epoch": 1.35, - "learning_rate": 9.712330544204449e-05, - "loss": 0.0097, + "epoch": 0.63, + "learning_rate": 0.00020532059270171683, + "loss": 0.0125, "step": 125110 }, { - "epoch": 1.35, - "learning_rate": 9.710708957644158e-05, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.0002053130250087028, + "loss": 0.0135, "step": 125120 }, { - "epoch": 1.35, - "learning_rate": 9.709087371083867e-05, - "loss": 0.01, + "epoch": 0.63, + "learning_rate": 0.00020530545731568882, + "loss": 0.0145, "step": 125130 }, { - "epoch": 1.35, - "learning_rate": 9.707465784523578e-05, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.0002052978896226748, + "loss": 0.0122, "step": 125140 }, { - "epoch": 1.35, - "learning_rate": 9.705844197963286e-05, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.00020529032192966078, + "loss": 0.0107, "step": 125150 }, { - "epoch": 1.35, - "learning_rate": 9.704222611402996e-05, - "loss": 0.0107, + "epoch": 0.63, + "learning_rate": 0.00020528275423664676, + "loss": 0.0136, "step": 125160 }, { - "epoch": 1.35, - "learning_rate": 9.702601024842706e-05, - "loss": 0.0098, + "epoch": 0.63, + "learning_rate": 0.00020527518654363277, + "loss": 0.0103, "step": 125170 }, { - "epoch": 1.35, - "learning_rate": 9.700979438282415e-05, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020526761885061875, + "loss": 0.0146, "step": 125180 }, { - "epoch": 1.35, - "learning_rate": 9.699357851722125e-05, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020526005115760473, + "loss": 0.0118, "step": 125190 }, { - "epoch": 1.35, - "learning_rate": 9.697736265161833e-05, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.00020525248346459074, + "loss": 0.0113, "step": 125200 }, { - "epoch": 1.35, - "learning_rate": 9.696114678601544e-05, - "loss": 0.0108, + "epoch": 0.63, + "learning_rate": 0.00020524491577157672, + "loss": 0.0166, "step": 125210 }, { - "epoch": 1.35, - "learning_rate": 9.694493092041252e-05, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.0002052373480785627, + "loss": 0.0146, "step": 125220 }, { - "epoch": 1.35, - "learning_rate": 9.692871505480963e-05, - "loss": 0.0126, + "epoch": 0.63, + "learning_rate": 0.0002052297803855487, + "loss": 0.016, "step": 125230 }, { - "epoch": 1.35, - "learning_rate": 9.69124991892067e-05, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.0002052222126925347, + "loss": 0.0173, "step": 125240 }, { - "epoch": 1.35, - "learning_rate": 9.689628332360381e-05, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.00020521464499952068, + "loss": 0.0163, "step": 125250 }, { - "epoch": 1.35, - "learning_rate": 9.68800674580009e-05, - "loss": 0.0071, + "epoch": 0.63, + "learning_rate": 0.00020520707730650668, + "loss": 0.0192, "step": 125260 }, { - "epoch": 1.35, - "learning_rate": 9.6863851592398e-05, - "loss": 0.0123, + "epoch": 0.63, + "learning_rate": 0.00020519950961349267, + "loss": 0.0153, "step": 125270 }, { - "epoch": 1.35, - "learning_rate": 9.684763572679509e-05, - "loss": 0.0108, + "epoch": 0.63, + "learning_rate": 0.00020519194192047865, + "loss": 0.0139, "step": 125280 }, { - "epoch": 1.35, - "learning_rate": 9.68314198611922e-05, - "loss": 0.0067, + "epoch": 0.63, + "learning_rate": 0.00020518437422746466, + "loss": 0.0154, "step": 125290 }, { - "epoch": 1.35, - "learning_rate": 9.681520399558927e-05, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020517680653445064, + "loss": 0.0135, "step": 125300 }, { - "epoch": 1.35, - "learning_rate": 9.679898812998638e-05, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020516923884143662, + "loss": 0.0164, "step": 125310 }, { - "epoch": 1.35, - "learning_rate": 9.678277226438346e-05, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.0002051616711484226, + "loss": 0.0139, "step": 125320 }, { - "epoch": 1.35, - "learning_rate": 9.676655639878057e-05, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.0002051541034554086, + "loss": 0.0178, "step": 125330 }, { - "epoch": 1.35, - "learning_rate": 9.675034053317765e-05, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.0002051465357623946, + "loss": 0.0122, "step": 125340 }, { - "epoch": 1.36, - "learning_rate": 9.673412466757475e-05, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020513896806938057, + "loss": 0.0152, "step": 125350 }, { - "epoch": 1.36, - "learning_rate": 9.671790880197184e-05, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020513140037636658, + "loss": 0.0173, "step": 125360 }, { - "epoch": 1.36, - "learning_rate": 9.670169293636894e-05, - "loss": 0.01, + "epoch": 0.63, + "learning_rate": 0.00020512383268335256, + "loss": 0.0151, "step": 125370 }, { - "epoch": 1.36, - "learning_rate": 9.668547707076603e-05, - "loss": 0.0104, + "epoch": 0.63, + "learning_rate": 0.00020511626499033854, + "loss": 0.0117, "step": 125380 }, { - "epoch": 1.36, - "learning_rate": 9.666926120516312e-05, - "loss": 0.01, + "epoch": 0.63, + "learning_rate": 0.00020510869729732455, + "loss": 0.0149, "step": 125390 }, { - "epoch": 1.36, - "learning_rate": 9.665304533956022e-05, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.00020510112960431053, + "loss": 0.0164, "step": 125400 }, { - "epoch": 1.36, - "learning_rate": 9.663682947395732e-05, - "loss": 0.0098, + "epoch": 0.63, + "learning_rate": 0.00020509356191129651, + "loss": 0.015, "step": 125410 }, { - "epoch": 1.36, - "learning_rate": 9.66206136083544e-05, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020508599421828252, + "loss": 0.0124, "step": 125420 }, { - "epoch": 1.36, - "learning_rate": 9.660439774275151e-05, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.0002050784265252685, + "loss": 0.0146, "step": 125430 }, { - "epoch": 1.36, - "learning_rate": 9.658818187714859e-05, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020507085883225449, + "loss": 0.0131, "step": 125440 }, { - "epoch": 1.36, - "learning_rate": 9.657196601154569e-05, - "loss": 0.0063, + "epoch": 0.63, + "learning_rate": 0.0002050632911392405, + "loss": 0.0147, "step": 125450 }, { - "epoch": 1.36, - "learning_rate": 9.655575014594277e-05, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020505572344622648, + "loss": 0.0165, "step": 125460 }, { - "epoch": 1.36, - "learning_rate": 9.653953428033988e-05, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.00020504815575321246, + "loss": 0.0154, "step": 125470 }, { - "epoch": 1.36, - "learning_rate": 9.652331841473697e-05, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.00020504058806019844, + "loss": 0.0142, "step": 125480 }, { - "epoch": 1.36, - "learning_rate": 9.650710254913406e-05, - "loss": 0.0113, + "epoch": 0.63, + "learning_rate": 0.00020503302036718445, + "loss": 0.0135, "step": 125490 }, { - "epoch": 1.36, - "learning_rate": 9.649088668353116e-05, - "loss": 0.0127, + "epoch": 0.63, + "learning_rate": 0.00020502545267417043, + "loss": 0.0154, "step": 125500 }, { - "epoch": 1.36, - "learning_rate": 9.647467081792826e-05, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.0002050178849811564, + "loss": 0.0153, "step": 125510 }, { - "epoch": 1.36, - "learning_rate": 9.645845495232534e-05, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.00020501031728814242, + "loss": 0.0153, "step": 125520 }, { - "epoch": 1.36, - "learning_rate": 9.644223908672245e-05, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.0002050027495951284, + "loss": 0.012, "step": 125530 }, { - "epoch": 1.36, - "learning_rate": 9.642602322111953e-05, - "loss": 0.0102, + "epoch": 0.63, + "learning_rate": 0.00020499518190211438, + "loss": 0.0141, "step": 125540 }, { - "epoch": 1.36, - "learning_rate": 9.640980735551663e-05, - "loss": 0.0104, + "epoch": 0.63, + "learning_rate": 0.0002049876142091004, + "loss": 0.0155, "step": 125550 }, { - "epoch": 1.36, - "learning_rate": 9.639359148991371e-05, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.00020498004651608637, + "loss": 0.0136, "step": 125560 }, { - "epoch": 1.36, - "learning_rate": 9.637737562431082e-05, - "loss": 0.0097, + "epoch": 0.63, + "learning_rate": 0.00020497247882307235, + "loss": 0.0139, "step": 125570 }, { - "epoch": 1.36, - "learning_rate": 9.636115975870791e-05, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.00020496491113005836, + "loss": 0.0128, "step": 125580 }, { - "epoch": 1.36, - "learning_rate": 9.6344943893105e-05, - "loss": 0.0116, + "epoch": 0.63, + "learning_rate": 0.00020495734343704434, + "loss": 0.0139, "step": 125590 }, { - "epoch": 1.36, - "learning_rate": 9.63287280275021e-05, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020494977574403032, + "loss": 0.0159, "step": 125600 }, { - "epoch": 1.36, - "learning_rate": 9.631251216189919e-05, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.00020494220805101633, + "loss": 0.0131, "step": 125610 }, { - "epoch": 1.36, - "learning_rate": 9.629629629629628e-05, - "loss": 0.0097, + "epoch": 0.63, + "learning_rate": 0.00020493464035800231, + "loss": 0.0133, "step": 125620 }, { - "epoch": 1.36, - "learning_rate": 9.628008043069339e-05, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.0002049270726649883, + "loss": 0.0143, "step": 125630 }, { - "epoch": 1.36, - "learning_rate": 9.626386456509047e-05, - "loss": 0.0145, + "epoch": 0.63, + "learning_rate": 0.00020491950497197428, + "loss": 0.0164, "step": 125640 }, { - "epoch": 1.36, - "learning_rate": 9.624764869948757e-05, - "loss": 0.0106, + "epoch": 0.63, + "learning_rate": 0.00020491193727896029, + "loss": 0.0103, "step": 125650 }, { - "epoch": 1.36, - "learning_rate": 9.623143283388465e-05, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020490436958594627, + "loss": 0.0116, "step": 125660 }, { - "epoch": 1.36, - "learning_rate": 9.621521696828176e-05, - "loss": 0.0102, + "epoch": 0.63, + "learning_rate": 0.00020489680189293225, + "loss": 0.0149, "step": 125670 }, { - "epoch": 1.36, - "learning_rate": 9.619900110267885e-05, - "loss": 0.0103, + "epoch": 0.63, + "learning_rate": 0.00020488923419991826, + "loss": 0.0128, "step": 125680 }, { - "epoch": 1.36, - "learning_rate": 9.618278523707595e-05, - "loss": 0.0081, + "epoch": 0.63, + "learning_rate": 0.00020488166650690424, + "loss": 0.0188, "step": 125690 }, { - "epoch": 1.36, - "learning_rate": 9.616656937147304e-05, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.00020487409881389022, + "loss": 0.014, "step": 125700 }, { - "epoch": 1.36, - "learning_rate": 9.615035350587013e-05, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020486653112087623, + "loss": 0.0131, "step": 125710 }, { - "epoch": 1.36, - "learning_rate": 9.613413764026722e-05, - "loss": 0.0067, + "epoch": 0.63, + "learning_rate": 0.0002048589634278622, + "loss": 0.0123, "step": 125720 }, { - "epoch": 1.36, - "learning_rate": 9.611792177466433e-05, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.0002048513957348482, + "loss": 0.0125, "step": 125730 }, { - "epoch": 1.36, - "learning_rate": 9.610170590906141e-05, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.0002048438280418342, + "loss": 0.0127, "step": 125740 }, { - "epoch": 1.36, - "learning_rate": 9.608549004345852e-05, - "loss": 0.0072, + "epoch": 0.63, + "learning_rate": 0.00020483626034882018, + "loss": 0.019, "step": 125750 }, { - "epoch": 1.36, - "learning_rate": 9.60692741778556e-05, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020482869265580616, + "loss": 0.0151, "step": 125760 }, { - "epoch": 1.36, - "learning_rate": 9.60530583122527e-05, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020482112496279217, + "loss": 0.0157, "step": 125770 }, { - "epoch": 1.36, - "learning_rate": 9.603684244664978e-05, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020481355726977815, + "loss": 0.0133, "step": 125780 }, { - "epoch": 1.36, - "learning_rate": 9.602062658104689e-05, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.00020480598957676413, + "loss": 0.0143, "step": 125790 }, { - "epoch": 1.36, - "learning_rate": 9.600441071544398e-05, - "loss": 0.0098, + "epoch": 0.63, + "learning_rate": 0.00020479842188375014, + "loss": 0.0131, "step": 125800 }, { - "epoch": 1.36, - "learning_rate": 9.598819484984107e-05, - "loss": 0.0073, + "epoch": 0.63, + "learning_rate": 0.00020479085419073612, + "loss": 0.0138, "step": 125810 }, { - "epoch": 1.36, - "learning_rate": 9.597197898423816e-05, - "loss": 0.0102, + "epoch": 0.63, + "learning_rate": 0.0002047832864977221, + "loss": 0.013, "step": 125820 }, { - "epoch": 1.36, - "learning_rate": 9.595576311863527e-05, - "loss": 0.0103, + "epoch": 0.63, + "learning_rate": 0.0002047757188047081, + "loss": 0.0137, "step": 125830 }, { - "epoch": 1.36, - "learning_rate": 9.593954725303235e-05, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.0002047681511116941, + "loss": 0.0138, "step": 125840 }, { - "epoch": 1.36, - "learning_rate": 9.592333138742946e-05, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020476058341868008, + "loss": 0.0178, "step": 125850 }, { - "epoch": 1.36, - "learning_rate": 9.590711552182654e-05, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020475301572566606, + "loss": 0.013, "step": 125860 }, { - "epoch": 1.36, - "learning_rate": 9.589089965622364e-05, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020474544803265207, + "loss": 0.017, "step": 125870 }, { - "epoch": 1.36, - "learning_rate": 9.587468379062075e-05, - "loss": 0.0059, + "epoch": 0.64, + "learning_rate": 0.00020473788033963805, + "loss": 0.0139, "step": 125880 }, { - "epoch": 1.36, - "learning_rate": 9.585846792501783e-05, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.00020473031264662403, + "loss": 0.0129, "step": 125890 }, { - "epoch": 1.36, - "learning_rate": 9.584225205941493e-05, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020472274495361004, + "loss": 0.0113, "step": 125900 }, { - "epoch": 1.36, - "learning_rate": 9.582603619381201e-05, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020471517726059602, + "loss": 0.0142, "step": 125910 }, { - "epoch": 1.36, - "learning_rate": 9.580982032820912e-05, - "loss": 0.0104, + "epoch": 0.64, + "learning_rate": 0.000204707609567582, + "loss": 0.0166, "step": 125920 }, { - "epoch": 1.36, - "learning_rate": 9.57936044626062e-05, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.000204700041874568, + "loss": 0.0154, "step": 125930 }, { - "epoch": 1.36, - "learning_rate": 9.57773885970033e-05, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.000204692474181554, + "loss": 0.0121, "step": 125940 }, { - "epoch": 1.36, - "learning_rate": 9.57611727314004e-05, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020468490648853997, + "loss": 0.0149, "step": 125950 }, { - "epoch": 1.36, - "learning_rate": 9.574495686579749e-05, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.00020467733879552598, + "loss": 0.0165, "step": 125960 }, { - "epoch": 1.36, - "learning_rate": 9.572874100019458e-05, - "loss": 0.012, + "epoch": 0.64, + "learning_rate": 0.00020466977110251196, + "loss": 0.0161, "step": 125970 }, { - "epoch": 1.36, - "learning_rate": 9.571252513459169e-05, - "loss": 0.0101, + "epoch": 0.64, + "learning_rate": 0.00020466220340949794, + "loss": 0.0138, "step": 125980 }, { - "epoch": 1.36, - "learning_rate": 9.569630926898877e-05, - "loss": 0.0113, + "epoch": 0.64, + "learning_rate": 0.00020465463571648393, + "loss": 0.0133, "step": 125990 }, { - "epoch": 1.36, - "learning_rate": 9.568009340338587e-05, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020464706802346993, + "loss": 0.015, "step": 126000 }, { - "epoch": 1.36, - "eval_cer": 0.9215417007593327, - "eval_loss": 0.007199176587164402, - "eval_runtime": 121.2136, - "eval_samples_per_second": 16.5, - "eval_steps_per_second": 4.125, + "epoch": 0.64, + "eval_cer": 0.9145129533326799, + "eval_loss": 0.010170434601604939, + "eval_runtime": 116.6449, + "eval_samples_per_second": 17.146, + "eval_steps_per_second": 4.287, "step": 126000 }, { - "epoch": 1.36, - "learning_rate": 9.566387753778295e-05, - "loss": 0.0101, + "epoch": 0.64, + "learning_rate": 0.00020463950033045592, + "loss": 0.0141, "step": 126010 }, { - "epoch": 1.36, - "learning_rate": 9.564766167218006e-05, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.0002046319326374419, + "loss": 0.0159, "step": 126020 }, { - "epoch": 1.36, - "learning_rate": 9.563144580657714e-05, - "loss": 0.0098, + "epoch": 0.64, + "learning_rate": 0.0002046243649444279, + "loss": 0.0171, "step": 126030 }, { - "epoch": 1.36, - "learning_rate": 9.561522994097425e-05, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.0002046167972514139, + "loss": 0.014, "step": 126040 }, { - "epoch": 1.36, - "learning_rate": 9.559901407537134e-05, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020460922955839987, + "loss": 0.0152, "step": 126050 }, { - "epoch": 1.36, - "learning_rate": 9.558279820976843e-05, - "loss": 0.0103, + "epoch": 0.64, + "learning_rate": 0.00020460166186538588, + "loss": 0.0184, "step": 126060 }, { - "epoch": 1.36, - "learning_rate": 9.556658234416552e-05, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.00020459409417237186, + "loss": 0.0149, "step": 126070 }, { - "epoch": 1.36, - "learning_rate": 9.555036647856262e-05, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.00020458652647935784, + "loss": 0.0139, "step": 126080 }, { - "epoch": 1.36, - "learning_rate": 9.553415061295971e-05, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020457895878634385, + "loss": 0.0134, "step": 126090 }, { - "epoch": 1.36, - "learning_rate": 9.551793474735682e-05, - "loss": 0.0113, + "epoch": 0.64, + "learning_rate": 0.00020457139109332983, + "loss": 0.0206, "step": 126100 }, { - "epoch": 1.36, - "learning_rate": 9.55017188817539e-05, - "loss": 0.0067, + "epoch": 0.64, + "learning_rate": 0.0002045638234003158, + "loss": 0.0154, "step": 126110 }, { - "epoch": 1.36, - "learning_rate": 9.5485503016151e-05, - "loss": 0.0111, + "epoch": 0.64, + "learning_rate": 0.00020455625570730182, + "loss": 0.0186, "step": 126120 }, { - "epoch": 1.36, - "learning_rate": 9.546928715054808e-05, - "loss": 0.01, + "epoch": 0.64, + "learning_rate": 0.0002045486880142878, + "loss": 0.0124, "step": 126130 }, { - "epoch": 1.36, - "learning_rate": 9.545307128494519e-05, - "loss": 0.0098, + "epoch": 0.64, + "learning_rate": 0.00020454112032127378, + "loss": 0.0152, "step": 126140 }, { - "epoch": 1.36, - "learning_rate": 9.543685541934228e-05, - "loss": 0.0391, + "epoch": 0.64, + "learning_rate": 0.00020453355262825976, + "loss": 0.0171, "step": 126150 }, { - "epoch": 1.36, - "learning_rate": 9.542063955373937e-05, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020452598493524577, + "loss": 0.0144, "step": 126160 }, { - "epoch": 1.36, - "learning_rate": 9.540442368813647e-05, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020451841724223175, + "loss": 0.013, "step": 126170 }, { - "epoch": 1.36, - "learning_rate": 9.538820782253356e-05, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020451084954921774, + "loss": 0.0151, "step": 126180 }, { - "epoch": 1.36, - "learning_rate": 9.537199195693065e-05, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020450328185620374, + "loss": 0.0122, "step": 126190 }, { - "epoch": 1.36, - "learning_rate": 9.535577609132776e-05, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.00020449571416318973, + "loss": 0.0144, "step": 126200 }, { - "epoch": 1.36, - "learning_rate": 9.533956022572484e-05, - "loss": 0.0106, + "epoch": 0.64, + "learning_rate": 0.0002044881464701757, + "loss": 0.014, "step": 126210 }, { - "epoch": 1.36, - "learning_rate": 9.532334436012194e-05, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020448057877716172, + "loss": 0.0135, "step": 126220 }, { - "epoch": 1.36, - "learning_rate": 9.530712849451902e-05, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.0002044730110841477, + "loss": 0.0141, "step": 126230 }, { - "epoch": 1.36, - "learning_rate": 9.529091262891613e-05, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020446544339113368, + "loss": 0.015, "step": 126240 }, { - "epoch": 1.36, - "learning_rate": 9.527469676331321e-05, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.0002044578756981197, + "loss": 0.0137, "step": 126250 }, { - "epoch": 1.36, - "learning_rate": 9.525848089771031e-05, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.00020445030800510567, + "loss": 0.0139, "step": 126260 }, { - "epoch": 1.37, - "learning_rate": 9.52422650321074e-05, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020444274031209165, + "loss": 0.0187, "step": 126270 }, { - "epoch": 1.37, - "learning_rate": 9.52260491665045e-05, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020443517261907766, + "loss": 0.0163, "step": 126280 }, { - "epoch": 1.37, - "learning_rate": 9.520983330090159e-05, - "loss": 0.0073, + "epoch": 0.64, + "learning_rate": 0.00020442760492606364, + "loss": 0.0122, "step": 126290 }, { - "epoch": 1.37, - "learning_rate": 9.51936174352987e-05, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.00020442003723304962, + "loss": 0.0123, "step": 126300 }, { - "epoch": 1.37, - "learning_rate": 9.517740156969578e-05, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020441246954003563, + "loss": 0.0142, "step": 126310 }, { - "epoch": 1.37, - "learning_rate": 9.516118570409288e-05, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020440490184702158, + "loss": 0.0132, "step": 126320 }, { - "epoch": 1.37, - "learning_rate": 9.514496983848996e-05, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.00020439733415400757, + "loss": 0.0179, "step": 126330 }, { - "epoch": 1.37, - "learning_rate": 9.512875397288707e-05, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.00020438976646099355, + "loss": 0.0159, "step": 126340 }, { - "epoch": 1.37, - "learning_rate": 9.511253810728415e-05, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020438219876797956, + "loss": 0.0154, "step": 126350 }, { - "epoch": 1.37, - "learning_rate": 9.509632224168125e-05, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020437463107496554, + "loss": 0.0138, "step": 126360 }, { - "epoch": 1.37, - "learning_rate": 9.508010637607835e-05, - "loss": 0.0101, + "epoch": 0.64, + "learning_rate": 0.00020436706338195152, + "loss": 0.0133, "step": 126370 }, { - "epoch": 1.37, - "learning_rate": 9.506389051047544e-05, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.0002043594956889375, + "loss": 0.0143, "step": 126380 }, { - "epoch": 1.37, - "learning_rate": 9.504767464487253e-05, - "loss": 0.01, + "epoch": 0.64, + "learning_rate": 0.0002043519279959235, + "loss": 0.0127, "step": 126390 }, { - "epoch": 1.37, - "learning_rate": 9.503145877926963e-05, - "loss": 0.0066, + "epoch": 0.64, + "learning_rate": 0.0002043443603029095, + "loss": 0.0161, "step": 126400 }, { - "epoch": 1.37, - "learning_rate": 9.501524291366672e-05, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020433679260989547, + "loss": 0.0146, "step": 126410 }, { - "epoch": 1.37, - "learning_rate": 9.499902704806382e-05, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.00020432922491688148, + "loss": 0.0124, "step": 126420 }, { - "epoch": 1.37, - "learning_rate": 9.49828111824609e-05, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.00020432165722386746, + "loss": 0.0115, "step": 126430 }, { - "epoch": 1.37, - "learning_rate": 9.496659531685801e-05, - "loss": 0.0159, + "epoch": 0.64, + "learning_rate": 0.00020431408953085344, + "loss": 0.0145, "step": 126440 }, { - "epoch": 1.37, - "learning_rate": 9.495037945125509e-05, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.00020430652183783945, + "loss": 0.0143, "step": 126450 }, { - "epoch": 1.37, - "learning_rate": 9.49341635856522e-05, - "loss": 0.0116, + "epoch": 0.64, + "learning_rate": 0.00020429895414482543, + "loss": 0.0117, "step": 126460 }, { - "epoch": 1.37, - "learning_rate": 9.491794772004927e-05, - "loss": 0.0091, + "epoch": 0.64, + "learning_rate": 0.00020429138645181141, + "loss": 0.0154, "step": 126470 }, { - "epoch": 1.37, - "learning_rate": 9.490173185444638e-05, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.00020428381875879742, + "loss": 0.0141, "step": 126480 }, { - "epoch": 1.37, - "learning_rate": 9.488551598884347e-05, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.0002042762510657834, + "loss": 0.0148, "step": 126490 }, { - "epoch": 1.37, - "learning_rate": 9.486930012324057e-05, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020426868337276939, + "loss": 0.0143, "step": 126500 }, { - "epoch": 1.37, - "learning_rate": 9.485308425763766e-05, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.0002042611156797554, + "loss": 0.0168, "step": 126510 }, { - "epoch": 1.37, - "learning_rate": 9.483686839203477e-05, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020425354798674138, + "loss": 0.0119, "step": 126520 }, { - "epoch": 1.37, - "learning_rate": 9.482065252643184e-05, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.00020424598029372736, + "loss": 0.0133, "step": 126530 }, { - "epoch": 1.37, - "learning_rate": 9.480443666082895e-05, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020423841260071334, + "loss": 0.0125, "step": 126540 }, { - "epoch": 1.37, - "learning_rate": 9.478822079522603e-05, - "loss": 0.0112, + "epoch": 0.64, + "learning_rate": 0.00020423084490769935, + "loss": 0.0125, "step": 126550 }, { - "epoch": 1.37, - "learning_rate": 9.477200492962314e-05, - "loss": 0.0065, + "epoch": 0.64, + "learning_rate": 0.00020422327721468533, + "loss": 0.0168, "step": 126560 }, { - "epoch": 1.37, - "learning_rate": 9.475578906402022e-05, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.0002042157095216713, + "loss": 0.0127, "step": 126570 }, { - "epoch": 1.37, - "learning_rate": 9.473957319841732e-05, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.00020420814182865732, + "loss": 0.0128, "step": 126580 }, { - "epoch": 1.37, - "learning_rate": 9.472335733281441e-05, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.0002042005741356433, + "loss": 0.0142, "step": 126590 }, { - "epoch": 1.37, - "learning_rate": 9.470714146721151e-05, - "loss": 0.0102, + "epoch": 0.64, + "learning_rate": 0.00020419300644262928, + "loss": 0.0161, "step": 126600 }, { - "epoch": 1.37, - "learning_rate": 9.469092560160861e-05, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.0002041854387496153, + "loss": 0.0128, "step": 126610 }, { - "epoch": 1.37, - "learning_rate": 9.467470973600569e-05, - "loss": 0.0067, + "epoch": 0.64, + "learning_rate": 0.00020417787105660127, + "loss": 0.015, "step": 126620 }, { - "epoch": 1.37, - "learning_rate": 9.46584938704028e-05, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.00020417030336358725, + "loss": 0.0137, "step": 126630 }, { - "epoch": 1.37, - "learning_rate": 9.464227800479989e-05, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020416273567057326, + "loss": 0.0127, "step": 126640 }, { - "epoch": 1.37, - "learning_rate": 9.462606213919698e-05, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.00020415516797755924, + "loss": 0.0119, "step": 126650 }, { - "epoch": 1.37, - "learning_rate": 9.460984627359408e-05, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.00020414760028454522, + "loss": 0.0109, "step": 126660 }, { - "epoch": 1.37, - "learning_rate": 9.459363040799118e-05, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020414003259153123, + "loss": 0.0129, "step": 126670 }, { - "epoch": 1.37, - "learning_rate": 9.457741454238826e-05, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020413246489851721, + "loss": 0.014, "step": 126680 }, { - "epoch": 1.37, - "learning_rate": 9.456119867678537e-05, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.0002041248972055032, + "loss": 0.0144, "step": 126690 }, { - "epoch": 1.37, - "learning_rate": 9.454498281118245e-05, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.0002041173295124892, + "loss": 0.0172, "step": 126700 }, { - "epoch": 1.37, - "learning_rate": 9.452876694557955e-05, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.00020410976181947519, + "loss": 0.0159, "step": 126710 }, { - "epoch": 1.37, - "learning_rate": 9.451255107997663e-05, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020410219412646117, + "loss": 0.0163, "step": 126720 }, { - "epoch": 1.37, - "learning_rate": 9.449633521437374e-05, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.00020409462643344715, + "loss": 0.0143, "step": 126730 }, { - "epoch": 1.37, - "learning_rate": 9.448011934877083e-05, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.00020408705874043316, + "loss": 0.0148, "step": 126740 }, { - "epoch": 1.37, - "learning_rate": 9.446390348316793e-05, - "loss": 0.0091, + "epoch": 0.64, + "learning_rate": 0.00020407949104741914, + "loss": 0.0125, "step": 126750 }, { - "epoch": 1.37, - "learning_rate": 9.444768761756502e-05, - "loss": 0.0098, + "epoch": 0.64, + "learning_rate": 0.00020407192335440512, + "loss": 0.0148, "step": 126760 }, { - "epoch": 1.37, - "learning_rate": 9.443147175196212e-05, - "loss": 0.0116, + "epoch": 0.64, + "learning_rate": 0.00020406435566139113, + "loss": 0.0166, "step": 126770 }, { - "epoch": 1.37, - "learning_rate": 9.44152558863592e-05, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.0002040567879683771, + "loss": 0.0163, "step": 126780 }, { - "epoch": 1.37, - "learning_rate": 9.439904002075631e-05, - "loss": 0.0115, + "epoch": 0.64, + "learning_rate": 0.0002040492202753631, + "loss": 0.0127, "step": 126790 }, { - "epoch": 1.37, - "learning_rate": 9.438282415515339e-05, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.0002040416525823491, + "loss": 0.0124, "step": 126800 }, { - "epoch": 1.37, - "learning_rate": 9.43666082895505e-05, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.00020403408488933508, + "loss": 0.0161, "step": 126810 }, { - "epoch": 1.37, - "learning_rate": 9.435039242394757e-05, - "loss": 0.0056, + "epoch": 0.64, + "learning_rate": 0.00020402651719632106, + "loss": 0.0161, "step": 126820 }, { - "epoch": 1.37, - "learning_rate": 9.433417655834468e-05, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020401894950330707, + "loss": 0.0134, "step": 126830 }, { - "epoch": 1.37, - "learning_rate": 9.431796069274177e-05, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020401138181029305, + "loss": 0.0134, "step": 126840 }, { - "epoch": 1.37, - "learning_rate": 9.430174482713887e-05, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.00020400381411727903, + "loss": 0.0131, "step": 126850 }, { - "epoch": 1.37, - "learning_rate": 9.428552896153596e-05, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.00020399624642426504, + "loss": 0.0145, "step": 126860 }, { - "epoch": 1.37, - "learning_rate": 9.426931309593305e-05, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.00020398867873125102, + "loss": 0.0111, "step": 126870 }, { - "epoch": 1.37, - "learning_rate": 9.425309723033014e-05, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.000203981111038237, + "loss": 0.0137, "step": 126880 }, { - "epoch": 1.37, - "learning_rate": 9.423688136472725e-05, - "loss": 0.0107, + "epoch": 0.64, + "learning_rate": 0.000203973543345223, + "loss": 0.0146, "step": 126890 }, { - "epoch": 1.37, - "learning_rate": 9.422066549912433e-05, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.000203965975652209, + "loss": 0.0117, "step": 126900 }, { - "epoch": 1.37, - "learning_rate": 9.420444963352144e-05, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020395840795919498, + "loss": 0.0152, "step": 126910 }, { - "epoch": 1.37, - "learning_rate": 9.418823376791852e-05, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.00020395084026618096, + "loss": 0.0147, "step": 126920 }, { - "epoch": 1.37, - "learning_rate": 9.417201790231562e-05, - "loss": 0.0091, + "epoch": 0.64, + "learning_rate": 0.00020394327257316697, + "loss": 0.0108, "step": 126930 }, { - "epoch": 1.37, - "learning_rate": 9.41558020367127e-05, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.00020393570488015295, + "loss": 0.0163, "step": 126940 }, { - "epoch": 1.37, - "learning_rate": 9.413958617110981e-05, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.00020392813718713893, + "loss": 0.0122, "step": 126950 }, { - "epoch": 1.37, - "learning_rate": 9.41233703055069e-05, - "loss": 0.0114, + "epoch": 0.64, + "learning_rate": 0.00020392056949412494, + "loss": 0.019, "step": 126960 }, { - "epoch": 1.37, - "learning_rate": 9.410715443990399e-05, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.00020391300180111092, + "loss": 0.0196, "step": 126970 }, { - "epoch": 1.37, - "learning_rate": 9.409093857430109e-05, - "loss": 0.0095, + "epoch": 0.64, + "learning_rate": 0.0002039054341080969, + "loss": 0.0141, "step": 126980 }, { - "epoch": 1.37, - "learning_rate": 9.407472270869819e-05, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.0002038978664150829, + "loss": 0.012, "step": 126990 }, { - "epoch": 1.37, - "learning_rate": 9.405850684309527e-05, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.0002038902987220689, + "loss": 0.0183, "step": 127000 }, { - "epoch": 1.37, - "eval_cer": 0.9215199856854233, - "eval_loss": 0.007032403256744146, - "eval_runtime": 121.345, - "eval_samples_per_second": 16.482, - "eval_steps_per_second": 4.12, + "epoch": 0.64, + "eval_cer": 0.9145129533326799, + "eval_loss": 0.010238048620522022, + "eval_runtime": 116.573, + "eval_samples_per_second": 17.157, + "eval_steps_per_second": 4.289, "step": 127000 }, { - "epoch": 1.37, - "learning_rate": 9.404229097749238e-05, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.00020388273102905487, + "loss": 0.0118, "step": 127010 }, { - "epoch": 1.37, - "learning_rate": 9.402607511188946e-05, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020387516333604088, + "loss": 0.0171, "step": 127020 }, { - "epoch": 1.37, - "learning_rate": 9.400985924628656e-05, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.00020386759564302686, + "loss": 0.0134, "step": 127030 }, { - "epoch": 1.37, - "learning_rate": 9.399364338068364e-05, - "loss": 0.0111, + "epoch": 0.64, + "learning_rate": 0.00020386002795001284, + "loss": 0.0142, "step": 127040 }, { - "epoch": 1.37, - "learning_rate": 9.397742751508075e-05, - "loss": 0.0109, + "epoch": 0.64, + "learning_rate": 0.00020385246025699883, + "loss": 0.0163, "step": 127050 }, { - "epoch": 1.37, - "learning_rate": 9.396121164947784e-05, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020384489256398483, + "loss": 0.0146, "step": 127060 }, { - "epoch": 1.37, - "learning_rate": 9.394499578387493e-05, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.00020383732487097082, + "loss": 0.0149, "step": 127070 }, { - "epoch": 1.37, - "learning_rate": 9.392877991827203e-05, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.0002038297571779568, + "loss": 0.0122, "step": 127080 }, { - "epoch": 1.37, - "learning_rate": 9.391256405266912e-05, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.0002038221894849428, + "loss": 0.0158, "step": 127090 }, { - "epoch": 1.37, - "learning_rate": 9.389634818706621e-05, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.0002038146217919288, + "loss": 0.0139, "step": 127100 }, { - "epoch": 1.37, - "learning_rate": 9.388013232146332e-05, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020380705409891477, + "loss": 0.0133, "step": 127110 }, { - "epoch": 1.37, - "learning_rate": 9.38639164558604e-05, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020379948640590078, + "loss": 0.0113, "step": 127120 }, { - "epoch": 1.37, - "learning_rate": 9.38477005902575e-05, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020379191871288676, + "loss": 0.0169, "step": 127130 }, { - "epoch": 1.37, - "learning_rate": 9.383148472465458e-05, - "loss": 0.011, + "epoch": 0.64, + "learning_rate": 0.00020378435101987274, + "loss": 0.0146, "step": 127140 }, { - "epoch": 1.37, - "learning_rate": 9.381526885905169e-05, - "loss": 0.01, + "epoch": 0.64, + "learning_rate": 0.00020377678332685875, + "loss": 0.0159, "step": 127150 }, { - "epoch": 1.37, - "learning_rate": 9.379905299344878e-05, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020376921563384473, + "loss": 0.0127, "step": 127160 }, { - "epoch": 1.37, - "learning_rate": 9.378283712784587e-05, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.0002037616479408307, + "loss": 0.0113, "step": 127170 }, { - "epoch": 1.37, - "learning_rate": 9.376662126224297e-05, - "loss": 0.0068, + "epoch": 0.64, + "learning_rate": 0.00020375408024781672, + "loss": 0.0157, "step": 127180 }, { - "epoch": 1.37, - "learning_rate": 9.375040539664006e-05, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.0002037465125548027, + "loss": 0.0146, "step": 127190 }, { - "epoch": 1.38, - "learning_rate": 9.373418953103715e-05, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.00020373894486178868, + "loss": 0.0126, "step": 127200 }, { - "epoch": 1.38, - "learning_rate": 9.371797366543426e-05, - "loss": 0.0124, + "epoch": 0.64, + "learning_rate": 0.0002037313771687747, + "loss": 0.0143, "step": 127210 }, { - "epoch": 1.38, - "learning_rate": 9.370175779983134e-05, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020372380947576067, + "loss": 0.0108, "step": 127220 }, { - "epoch": 1.38, - "learning_rate": 9.368554193422844e-05, - "loss": 0.0124, + "epoch": 0.64, + "learning_rate": 0.00020371624178274665, + "loss": 0.0135, "step": 127230 }, { - "epoch": 1.38, - "learning_rate": 9.366932606862552e-05, - "loss": 0.0107, + "epoch": 0.64, + "learning_rate": 0.00020370867408973264, + "loss": 0.0126, "step": 127240 }, { - "epoch": 1.38, - "learning_rate": 9.365311020302263e-05, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.00020370110639671864, + "loss": 0.0116, "step": 127250 }, { - "epoch": 1.38, - "learning_rate": 9.363689433741971e-05, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020369353870370463, + "loss": 0.0129, "step": 127260 }, { - "epoch": 1.38, - "learning_rate": 9.362067847181682e-05, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.0002036859710106906, + "loss": 0.0125, "step": 127270 }, { - "epoch": 1.38, - "learning_rate": 9.360446260621391e-05, - "loss": 0.0103, + "epoch": 0.64, + "learning_rate": 0.00020367840331767662, + "loss": 0.0186, "step": 127280 }, { - "epoch": 1.38, - "learning_rate": 9.3588246740611e-05, - "loss": 0.0059, + "epoch": 0.64, + "learning_rate": 0.0002036708356246626, + "loss": 0.012, "step": 127290 }, { - "epoch": 1.38, - "learning_rate": 9.35720308750081e-05, - "loss": 0.01, + "epoch": 0.64, + "learning_rate": 0.00020366326793164858, + "loss": 0.0162, "step": 127300 }, { - "epoch": 1.38, - "learning_rate": 9.35558150094052e-05, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.0002036557002386346, + "loss": 0.0141, "step": 127310 }, { - "epoch": 1.38, - "learning_rate": 9.353959914380229e-05, - "loss": 0.0104, + "epoch": 0.64, + "learning_rate": 0.00020364813254562057, + "loss": 0.0152, "step": 127320 }, { - "epoch": 1.38, - "learning_rate": 9.352338327819939e-05, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020364056485260655, + "loss": 0.0136, "step": 127330 }, { - "epoch": 1.38, - "learning_rate": 9.350716741259648e-05, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.00020363299715959256, + "loss": 0.0158, "step": 127340 }, { - "epoch": 1.38, - "learning_rate": 9.349095154699357e-05, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020362542946657854, + "loss": 0.0128, "step": 127350 }, { - "epoch": 1.38, - "learning_rate": 9.347473568139068e-05, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.00020361786177356452, + "loss": 0.0141, "step": 127360 }, { - "epoch": 1.38, - "learning_rate": 9.345851981578776e-05, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020361029408055053, + "loss": 0.0118, "step": 127370 }, { - "epoch": 1.38, - "learning_rate": 9.344230395018486e-05, - "loss": 0.0095, + "epoch": 0.64, + "learning_rate": 0.0002036027263875365, + "loss": 0.0121, "step": 127380 }, { - "epoch": 1.38, - "learning_rate": 9.342608808458194e-05, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.0002035951586945225, + "loss": 0.0129, "step": 127390 }, { - "epoch": 1.38, - "learning_rate": 9.340987221897905e-05, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020358759100150848, + "loss": 0.0127, "step": 127400 }, { - "epoch": 1.38, - "learning_rate": 9.339365635337613e-05, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020358002330849448, + "loss": 0.0146, "step": 127410 }, { - "epoch": 1.38, - "learning_rate": 9.337744048777323e-05, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020357245561548047, + "loss": 0.0154, "step": 127420 }, { - "epoch": 1.38, - "learning_rate": 9.336122462217033e-05, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.00020356488792246645, + "loss": 0.0091, "step": 127430 }, { - "epoch": 1.38, - "learning_rate": 9.334500875656742e-05, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.00020355732022945246, + "loss": 0.0132, "step": 127440 }, { - "epoch": 1.38, - "learning_rate": 9.332879289096451e-05, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.00020354975253643844, + "loss": 0.0116, "step": 127450 }, { - "epoch": 1.38, - "learning_rate": 9.331257702536162e-05, - "loss": 0.0064, + "epoch": 0.64, + "learning_rate": 0.00020354218484342442, + "loss": 0.0136, "step": 127460 }, { - "epoch": 1.38, - "learning_rate": 9.32963611597587e-05, - "loss": 0.0113, + "epoch": 0.64, + "learning_rate": 0.00020353461715041043, + "loss": 0.0141, "step": 127470 }, { - "epoch": 1.38, - "learning_rate": 9.32801452941558e-05, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.0002035270494573964, + "loss": 0.0129, "step": 127480 }, { - "epoch": 1.38, - "learning_rate": 9.326392942855288e-05, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.0002035194817643824, + "loss": 0.016, "step": 127490 }, { - "epoch": 1.38, - "learning_rate": 9.324771356294999e-05, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.0002035119140713684, + "loss": 0.0121, "step": 127500 }, { - "epoch": 1.38, - "learning_rate": 9.323149769734707e-05, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.00020350434637835438, + "loss": 0.0146, "step": 127510 }, { - "epoch": 1.38, - "learning_rate": 9.321528183174418e-05, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020349677868534036, + "loss": 0.0117, "step": 127520 }, { - "epoch": 1.38, - "learning_rate": 9.319906596614127e-05, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020348921099232637, + "loss": 0.0141, "step": 127530 }, { - "epoch": 1.38, - "learning_rate": 9.318285010053836e-05, - "loss": 0.0076, + "epoch": 0.64, + "learning_rate": 0.00020348164329931235, + "loss": 0.0107, "step": 127540 }, { - "epoch": 1.38, - "learning_rate": 9.316663423493545e-05, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020347407560629833, + "loss": 0.0138, "step": 127550 }, { - "epoch": 1.38, - "learning_rate": 9.315041836933255e-05, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020346650791328431, + "loss": 0.0116, "step": 127560 }, { - "epoch": 1.38, - "learning_rate": 9.313420250372964e-05, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020345894022027032, + "loss": 0.0131, "step": 127570 }, { - "epoch": 1.38, - "learning_rate": 9.311798663812675e-05, - "loss": 0.0063, + "epoch": 0.64, + "learning_rate": 0.00020345137252725628, + "loss": 0.0171, "step": 127580 }, { - "epoch": 1.38, - "learning_rate": 9.310177077252382e-05, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.00020344380483424226, + "loss": 0.0128, "step": 127590 }, { - "epoch": 1.38, - "learning_rate": 9.308555490692093e-05, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.00020343623714122827, + "loss": 0.0127, "step": 127600 }, { - "epoch": 1.38, - "learning_rate": 9.306933904131801e-05, - "loss": 0.0101, + "epoch": 0.64, + "learning_rate": 0.00020342866944821425, + "loss": 0.0133, "step": 127610 }, { - "epoch": 1.38, - "learning_rate": 9.305312317571512e-05, - "loss": 0.01, + "epoch": 0.64, + "learning_rate": 0.00020342110175520023, + "loss": 0.0124, "step": 127620 }, { - "epoch": 1.38, - "learning_rate": 9.30369073101122e-05, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.0002034135340621862, + "loss": 0.0123, "step": 127630 }, { - "epoch": 1.38, - "learning_rate": 9.30206914445093e-05, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020340596636917222, + "loss": 0.0148, "step": 127640 }, { - "epoch": 1.38, - "learning_rate": 9.30044755789064e-05, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.0002033983986761582, + "loss": 0.0109, "step": 127650 }, { - "epoch": 1.38, - "learning_rate": 9.298825971330349e-05, - "loss": 0.0144, + "epoch": 0.64, + "learning_rate": 0.00020339083098314418, + "loss": 0.013, "step": 127660 }, { - "epoch": 1.38, - "learning_rate": 9.297204384770058e-05, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.0002033832632901302, + "loss": 0.0124, "step": 127670 }, { - "epoch": 1.38, - "learning_rate": 9.295582798209769e-05, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.00020337569559711617, + "loss": 0.0161, "step": 127680 }, { - "epoch": 1.38, - "learning_rate": 9.293961211649477e-05, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.00020336812790410215, + "loss": 0.0146, "step": 127690 }, { - "epoch": 1.38, - "learning_rate": 9.292339625089187e-05, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020336056021108816, + "loss": 0.0156, "step": 127700 }, { - "epoch": 1.38, - "learning_rate": 9.290718038528895e-05, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020335299251807414, + "loss": 0.0141, "step": 127710 }, { - "epoch": 1.38, - "learning_rate": 9.289096451968606e-05, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020334542482506013, + "loss": 0.0164, "step": 127720 }, { - "epoch": 1.38, - "learning_rate": 9.287474865408314e-05, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.00020333785713204613, + "loss": 0.0194, "step": 127730 }, { - "epoch": 1.38, - "learning_rate": 9.285853278848024e-05, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.00020333028943903212, + "loss": 0.0193, "step": 127740 }, { - "epoch": 1.38, - "learning_rate": 9.284231692287734e-05, - "loss": 0.0101, + "epoch": 0.64, + "learning_rate": 0.0002033227217460181, + "loss": 0.0237, "step": 127750 }, { - "epoch": 1.38, - "learning_rate": 9.282610105727443e-05, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.0002033151540530041, + "loss": 0.0147, "step": 127760 }, { - "epoch": 1.38, - "learning_rate": 9.280988519167152e-05, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.0002033075863599901, + "loss": 0.0134, "step": 127770 }, { - "epoch": 1.38, - "learning_rate": 9.279366932606863e-05, - "loss": 0.015, + "epoch": 0.64, + "learning_rate": 0.00020330001866697607, + "loss": 0.0156, "step": 127780 }, { - "epoch": 1.38, - "learning_rate": 9.27774534604657e-05, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.00020329245097396205, + "loss": 0.0145, "step": 127790 }, { - "epoch": 1.38, - "learning_rate": 9.276123759486281e-05, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.00020328488328094806, + "loss": 0.015, "step": 127800 }, { - "epoch": 1.38, - "learning_rate": 9.274502172925989e-05, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020327731558793404, + "loss": 0.0155, "step": 127810 }, { - "epoch": 1.38, - "learning_rate": 9.2728805863657e-05, - "loss": 0.0098, + "epoch": 0.64, + "learning_rate": 0.00020326974789492002, + "loss": 0.0139, "step": 127820 }, { - "epoch": 1.38, - "learning_rate": 9.271258999805408e-05, - "loss": 0.0063, + "epoch": 0.64, + "learning_rate": 0.00020326218020190603, + "loss": 0.015, "step": 127830 }, { - "epoch": 1.38, - "learning_rate": 9.269637413245118e-05, - "loss": 0.0076, + "epoch": 0.64, + "learning_rate": 0.000203254612508892, + "loss": 0.0138, "step": 127840 }, { - "epoch": 1.38, - "learning_rate": 9.268015826684828e-05, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.000203247044815878, + "loss": 0.0129, "step": 127850 }, { - "epoch": 1.38, - "learning_rate": 9.266394240124537e-05, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.000203239477122864, + "loss": 0.0147, "step": 127860 }, { - "epoch": 1.38, - "learning_rate": 9.264772653564246e-05, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020323190942984998, + "loss": 0.0156, "step": 127870 }, { - "epoch": 1.38, - "learning_rate": 9.263151067003955e-05, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020322434173683596, + "loss": 0.0125, "step": 127880 }, { - "epoch": 1.38, - "learning_rate": 9.261529480443665e-05, - "loss": 0.0107, + "epoch": 0.65, + "learning_rate": 0.00020321677404382197, + "loss": 0.0148, "step": 127890 }, { - "epoch": 1.38, - "learning_rate": 9.259907893883375e-05, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020320920635080795, + "loss": 0.0119, "step": 127900 }, { - "epoch": 1.38, - "learning_rate": 9.258286307323083e-05, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020320163865779394, + "loss": 0.0138, "step": 127910 }, { - "epoch": 1.38, - "learning_rate": 9.256664720762794e-05, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.00020319407096477994, + "loss": 0.0157, "step": 127920 }, { - "epoch": 1.38, - "learning_rate": 9.255043134202502e-05, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020318650327176593, + "loss": 0.0142, "step": 127930 }, { - "epoch": 1.38, - "learning_rate": 9.253421547642212e-05, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.0002031789355787519, + "loss": 0.0132, "step": 127940 }, { - "epoch": 1.38, - "learning_rate": 9.25179996108192e-05, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.0002031713678857379, + "loss": 0.0162, "step": 127950 }, { - "epoch": 1.38, - "learning_rate": 9.250178374521631e-05, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.0002031638001927239, + "loss": 0.0149, "step": 127960 }, { - "epoch": 1.38, - "learning_rate": 9.24855678796134e-05, - "loss": 0.0101, + "epoch": 0.65, + "learning_rate": 0.00020315623249970988, + "loss": 0.0151, "step": 127970 }, { - "epoch": 1.38, - "learning_rate": 9.24693520140105e-05, - "loss": 0.0096, + "epoch": 0.65, + "learning_rate": 0.00020314866480669586, + "loss": 0.0128, "step": 127980 }, { - "epoch": 1.38, - "learning_rate": 9.245313614840759e-05, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020314109711368187, + "loss": 0.0151, "step": 127990 }, { - "epoch": 1.38, - "learning_rate": 9.24369202828047e-05, - "loss": 0.0063, + "epoch": 0.65, + "learning_rate": 0.00020313352942066785, + "loss": 0.0139, "step": 128000 }, { - "epoch": 1.38, - "eval_cer": 0.9215738390687187, - "eval_loss": 0.007414136081933975, - "eval_runtime": 121.0821, - "eval_samples_per_second": 16.518, - "eval_steps_per_second": 4.129, + "epoch": 0.65, + "eval_cer": 0.914481900656667, + "eval_loss": 0.01020896527916193, + "eval_runtime": 116.605, + "eval_samples_per_second": 17.152, + "eval_steps_per_second": 4.288, "step": 128000 }, { - "epoch": 1.38, - "learning_rate": 9.242070441720177e-05, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020312596172765383, + "loss": 0.0147, "step": 128010 }, { - "epoch": 1.38, - "learning_rate": 9.240448855159888e-05, - "loss": 0.0094, + "epoch": 0.65, + "learning_rate": 0.00020311839403463984, + "loss": 0.0158, "step": 128020 }, { - "epoch": 1.38, - "learning_rate": 9.238827268599596e-05, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020311082634162582, + "loss": 0.0148, "step": 128030 }, { - "epoch": 1.38, - "learning_rate": 9.237205682039307e-05, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.0002031032586486118, + "loss": 0.0171, "step": 128040 }, { - "epoch": 1.38, - "learning_rate": 9.235584095479017e-05, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.0002030956909555978, + "loss": 0.0156, "step": 128050 }, { - "epoch": 1.38, - "learning_rate": 9.233962508918725e-05, - "loss": 0.0102, + "epoch": 0.65, + "learning_rate": 0.0002030881232625838, + "loss": 0.0135, "step": 128060 }, { - "epoch": 1.38, - "learning_rate": 9.232340922358436e-05, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020308055556956977, + "loss": 0.0196, "step": 128070 }, { - "epoch": 1.38, - "learning_rate": 9.230719335798144e-05, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.00020307298787655578, + "loss": 0.0173, "step": 128080 }, { - "epoch": 1.38, - "learning_rate": 9.229097749237854e-05, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020306542018354176, + "loss": 0.018, "step": 128090 }, { - "epoch": 1.38, - "learning_rate": 9.227476162677562e-05, - "loss": 0.0107, + "epoch": 0.65, + "learning_rate": 0.00020305785249052775, + "loss": 0.0159, "step": 128100 }, { - "epoch": 1.38, - "learning_rate": 9.225854576117273e-05, - "loss": 0.01, + "epoch": 0.65, + "learning_rate": 0.00020305028479751375, + "loss": 0.0195, "step": 128110 }, { - "epoch": 1.39, - "learning_rate": 9.224232989556982e-05, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020304271710449974, + "loss": 0.0158, "step": 128120 }, { - "epoch": 1.39, - "learning_rate": 9.222611402996691e-05, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020303514941148572, + "loss": 0.0177, "step": 128130 }, { - "epoch": 1.39, - "learning_rate": 9.2209898164364e-05, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.0002030275817184717, + "loss": 0.0116, "step": 128140 }, { - "epoch": 1.39, - "learning_rate": 9.219368229876111e-05, - "loss": 0.0096, + "epoch": 0.65, + "learning_rate": 0.0002030200140254577, + "loss": 0.0167, "step": 128150 }, { - "epoch": 1.39, - "learning_rate": 9.217746643315819e-05, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.0002030124463324437, + "loss": 0.0141, "step": 128160 }, { - "epoch": 1.39, - "learning_rate": 9.21612505675553e-05, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020300487863942967, + "loss": 0.0144, "step": 128170 }, { - "epoch": 1.39, - "learning_rate": 9.214503470195238e-05, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020299731094641568, + "loss": 0.0141, "step": 128180 }, { - "epoch": 1.39, - "learning_rate": 9.212881883634948e-05, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020298974325340166, + "loss": 0.013, "step": 128190 }, { - "epoch": 1.39, - "learning_rate": 9.211260297074656e-05, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020298217556038764, + "loss": 0.0141, "step": 128200 }, { - "epoch": 1.39, - "learning_rate": 9.209638710514367e-05, - "loss": 0.0127, + "epoch": 0.65, + "learning_rate": 0.00020297460786737365, + "loss": 0.0165, "step": 128210 }, { - "epoch": 1.39, - "learning_rate": 9.208017123954076e-05, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020296704017435963, + "loss": 0.015, "step": 128220 }, { - "epoch": 1.39, - "learning_rate": 9.206395537393785e-05, - "loss": 0.0064, + "epoch": 0.65, + "learning_rate": 0.0002029594724813456, + "loss": 0.0138, "step": 128230 }, { - "epoch": 1.39, - "learning_rate": 9.204773950833495e-05, - "loss": 0.0077, + "epoch": 0.65, + "learning_rate": 0.00020295190478833162, + "loss": 0.014, "step": 128240 }, { - "epoch": 1.39, - "learning_rate": 9.203152364273204e-05, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.0002029443370953176, + "loss": 0.0146, "step": 128250 }, { - "epoch": 1.39, - "learning_rate": 9.201530777712913e-05, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020293676940230358, + "loss": 0.0154, "step": 128260 }, { - "epoch": 1.39, - "learning_rate": 9.199909191152624e-05, - "loss": 0.0068, + "epoch": 0.65, + "learning_rate": 0.0002029292017092896, + "loss": 0.0186, "step": 128270 }, { - "epoch": 1.39, - "learning_rate": 9.198287604592332e-05, - "loss": 0.0063, + "epoch": 0.65, + "learning_rate": 0.00020292163401627557, + "loss": 0.0147, "step": 128280 }, { - "epoch": 1.39, - "learning_rate": 9.196666018032042e-05, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020291406632326156, + "loss": 0.0123, "step": 128290 }, { - "epoch": 1.39, - "learning_rate": 9.19504443147175e-05, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.00020290649863024754, + "loss": 0.0133, "step": 128300 }, { - "epoch": 1.39, - "learning_rate": 9.193422844911461e-05, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020289893093723355, + "loss": 0.0132, "step": 128310 }, { - "epoch": 1.39, - "learning_rate": 9.19180125835117e-05, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.00020289136324421953, + "loss": 0.0137, "step": 128320 }, { - "epoch": 1.39, - "learning_rate": 9.19017967179088e-05, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.0002028837955512055, + "loss": 0.0127, "step": 128330 }, { - "epoch": 1.39, - "learning_rate": 9.188558085230589e-05, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020287622785819152, + "loss": 0.0156, "step": 128340 }, { - "epoch": 1.39, - "learning_rate": 9.186936498670298e-05, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.0002028686601651775, + "loss": 0.0131, "step": 128350 }, { - "epoch": 1.39, - "learning_rate": 9.185314912110007e-05, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.00020286109247216348, + "loss": 0.0191, "step": 128360 }, { - "epoch": 1.39, - "learning_rate": 9.183693325549718e-05, - "loss": 0.0102, + "epoch": 0.65, + "learning_rate": 0.0002028535247791495, + "loss": 0.0147, "step": 128370 }, { - "epoch": 1.39, - "learning_rate": 9.182071738989426e-05, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020284595708613547, + "loss": 0.0142, "step": 128380 }, { - "epoch": 1.39, - "learning_rate": 9.180450152429137e-05, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020283838939312145, + "loss": 0.0148, "step": 128390 }, { - "epoch": 1.39, - "learning_rate": 9.178828565868844e-05, - "loss": 0.0143, + "epoch": 0.65, + "learning_rate": 0.00020283082170010746, + "loss": 0.0162, "step": 128400 }, { - "epoch": 1.39, - "learning_rate": 9.177206979308555e-05, - "loss": 0.0101, + "epoch": 0.65, + "learning_rate": 0.00020282325400709344, + "loss": 0.01, "step": 128410 }, { - "epoch": 1.39, - "learning_rate": 9.175585392748263e-05, - "loss": 0.0108, + "epoch": 0.65, + "learning_rate": 0.00020281568631407942, + "loss": 0.0144, "step": 128420 }, { - "epoch": 1.39, - "learning_rate": 9.173963806187974e-05, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020280811862106543, + "loss": 0.0126, "step": 128430 }, { - "epoch": 1.39, - "learning_rate": 9.172342219627683e-05, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.0002028005509280514, + "loss": 0.0132, "step": 128440 }, { - "epoch": 1.39, - "learning_rate": 9.170720633067392e-05, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.0002027929832350374, + "loss": 0.0175, "step": 128450 }, { - "epoch": 1.39, - "learning_rate": 9.169099046507102e-05, - "loss": 0.0067, + "epoch": 0.65, + "learning_rate": 0.00020278541554202338, + "loss": 0.0135, "step": 128460 }, { - "epoch": 1.39, - "learning_rate": 9.167477459946812e-05, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020277784784900938, + "loss": 0.0134, "step": 128470 }, { - "epoch": 1.39, - "learning_rate": 9.16585587338652e-05, - "loss": 0.0112, + "epoch": 0.65, + "learning_rate": 0.00020277028015599537, + "loss": 0.0134, "step": 128480 }, { - "epoch": 1.39, - "learning_rate": 9.164234286826231e-05, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.00020276271246298135, + "loss": 0.0131, "step": 128490 }, { - "epoch": 1.39, - "learning_rate": 9.162612700265939e-05, - "loss": 0.0112, + "epoch": 0.65, + "learning_rate": 0.00020275514476996736, + "loss": 0.0153, "step": 128500 }, { - "epoch": 1.39, - "learning_rate": 9.160991113705649e-05, - "loss": 0.0094, + "epoch": 0.65, + "learning_rate": 0.00020274757707695334, + "loss": 0.015, "step": 128510 }, { - "epoch": 1.39, - "learning_rate": 9.159369527145357e-05, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020274000938393932, + "loss": 0.0134, "step": 128520 }, { - "epoch": 1.39, - "learning_rate": 9.157747940585068e-05, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020273244169092533, + "loss": 0.0214, "step": 128530 }, { - "epoch": 1.39, - "learning_rate": 9.156126354024777e-05, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.0002027248739979113, + "loss": 0.0165, "step": 128540 }, { - "epoch": 1.39, - "learning_rate": 9.154504767464486e-05, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.0002027173063048973, + "loss": 0.0131, "step": 128550 }, { - "epoch": 1.39, - "learning_rate": 9.152883180904196e-05, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.0002027097386118833, + "loss": 0.0133, "step": 128560 }, { - "epoch": 1.39, - "learning_rate": 9.151261594343905e-05, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.00020270217091886928, + "loss": 0.0182, "step": 128570 }, { - "epoch": 1.39, - "learning_rate": 9.149640007783614e-05, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020269460322585526, + "loss": 0.0145, "step": 128580 }, { - "epoch": 1.39, - "learning_rate": 9.148018421223325e-05, - "loss": 0.0097, + "epoch": 0.65, + "learning_rate": 0.00020268703553284127, + "loss": 0.0129, "step": 128590 }, { - "epoch": 1.39, - "learning_rate": 9.146396834663033e-05, - "loss": 0.0077, + "epoch": 0.65, + "learning_rate": 0.00020267946783982725, + "loss": 0.0129, "step": 128600 }, { - "epoch": 1.39, - "learning_rate": 9.144775248102743e-05, - "loss": 0.0115, + "epoch": 0.65, + "learning_rate": 0.00020267190014681323, + "loss": 0.0142, "step": 128610 }, { - "epoch": 1.39, - "learning_rate": 9.143153661542451e-05, - "loss": 0.0102, + "epoch": 0.65, + "learning_rate": 0.00020266433245379924, + "loss": 0.0161, "step": 128620 }, { - "epoch": 1.39, - "learning_rate": 9.141532074982162e-05, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020265676476078522, + "loss": 0.0127, "step": 128630 }, { - "epoch": 1.39, - "learning_rate": 9.13991048842187e-05, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.0002026491970677712, + "loss": 0.0149, "step": 128640 }, { - "epoch": 1.39, - "learning_rate": 9.13828890186158e-05, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.00020264162937475719, + "loss": 0.0121, "step": 128650 }, { - "epoch": 1.39, - "learning_rate": 9.13666731530129e-05, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.0002026340616817432, + "loss": 0.0127, "step": 128660 }, { - "epoch": 1.39, - "learning_rate": 9.135045728740999e-05, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.00020262649398872918, + "loss": 0.0126, "step": 128670 }, { - "epoch": 1.39, - "learning_rate": 9.133424142180708e-05, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020261892629571516, + "loss": 0.0126, "step": 128680 }, { - "epoch": 1.39, - "learning_rate": 9.131802555620419e-05, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.00020261135860270117, + "loss": 0.0142, "step": 128690 }, { - "epoch": 1.39, - "learning_rate": 9.130180969060127e-05, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.00020260379090968715, + "loss": 0.0122, "step": 128700 }, { - "epoch": 1.39, - "learning_rate": 9.128559382499837e-05, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020259622321667313, + "loss": 0.0133, "step": 128710 }, { - "epoch": 1.39, - "learning_rate": 9.126937795939545e-05, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.00020258865552365914, + "loss": 0.0155, "step": 128720 }, { - "epoch": 1.39, - "learning_rate": 9.125316209379256e-05, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020258108783064512, + "loss": 0.0134, "step": 128730 }, { - "epoch": 1.39, - "learning_rate": 9.123694622818964e-05, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.0002025735201376311, + "loss": 0.0125, "step": 128740 }, { - "epoch": 1.39, - "learning_rate": 9.122073036258675e-05, - "loss": 0.0092, + "epoch": 0.65, + "learning_rate": 0.0002025659524446171, + "loss": 0.0118, "step": 128750 }, { - "epoch": 1.39, - "learning_rate": 9.120451449698385e-05, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.0002025583847516031, + "loss": 0.0157, "step": 128760 }, { - "epoch": 1.39, - "learning_rate": 9.118829863138093e-05, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020255081705858907, + "loss": 0.0127, "step": 128770 }, { - "epoch": 1.39, - "learning_rate": 9.117208276577804e-05, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020254324936557508, + "loss": 0.0152, "step": 128780 }, { - "epoch": 1.39, - "learning_rate": 9.115586690017512e-05, - "loss": 0.0068, + "epoch": 0.65, + "learning_rate": 0.00020253568167256106, + "loss": 0.0172, "step": 128790 }, { - "epoch": 1.39, - "learning_rate": 9.113965103457222e-05, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020252811397954704, + "loss": 0.0157, "step": 128800 }, { - "epoch": 1.39, - "learning_rate": 9.112343516896932e-05, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.00020252054628653302, + "loss": 0.0136, "step": 128810 }, { - "epoch": 1.39, - "learning_rate": 9.110721930336641e-05, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020251297859351903, + "loss": 0.0129, "step": 128820 }, { - "epoch": 1.39, - "learning_rate": 9.10910034377635e-05, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020250541090050501, + "loss": 0.0151, "step": 128830 }, { - "epoch": 1.39, - "learning_rate": 9.107478757216061e-05, - "loss": 0.0092, + "epoch": 0.65, + "learning_rate": 0.00020249784320749097, + "loss": 0.0163, "step": 128840 }, { - "epoch": 1.39, - "learning_rate": 9.105857170655769e-05, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020249027551447695, + "loss": 0.0118, "step": 128850 }, { - "epoch": 1.39, - "learning_rate": 9.104235584095479e-05, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.00020248270782146296, + "loss": 0.0117, "step": 128860 }, { - "epoch": 1.39, - "learning_rate": 9.102613997535187e-05, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020247514012844894, + "loss": 0.0146, "step": 128870 }, { - "epoch": 1.39, - "learning_rate": 9.100992410974898e-05, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020246757243543492, + "loss": 0.015, "step": 128880 }, { - "epoch": 1.39, - "learning_rate": 9.099370824414606e-05, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020246000474242093, + "loss": 0.0144, "step": 128890 }, { - "epoch": 1.39, - "learning_rate": 9.097749237854316e-05, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.0002024524370494069, + "loss": 0.016, "step": 128900 }, { - "epoch": 1.39, - "learning_rate": 9.096127651294026e-05, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.0002024448693563929, + "loss": 0.0163, "step": 128910 }, { - "epoch": 1.39, - "learning_rate": 9.094506064733735e-05, - "loss": 0.0104, + "epoch": 0.65, + "learning_rate": 0.0002024373016633789, + "loss": 0.0116, "step": 128920 }, { - "epoch": 1.39, - "learning_rate": 9.092884478173444e-05, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020242973397036488, + "loss": 0.0106, "step": 128930 }, { - "epoch": 1.39, - "learning_rate": 9.091262891613155e-05, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.00020242216627735086, + "loss": 0.0153, "step": 128940 }, { - "epoch": 1.39, - "learning_rate": 9.089641305052863e-05, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020241459858433687, + "loss": 0.0124, "step": 128950 }, { - "epoch": 1.39, - "learning_rate": 9.088019718492573e-05, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020240703089132285, + "loss": 0.0128, "step": 128960 }, { - "epoch": 1.39, - "learning_rate": 9.086398131932281e-05, - "loss": 0.0069, + "epoch": 0.65, + "learning_rate": 0.00020239946319830884, + "loss": 0.0117, "step": 128970 }, { - "epoch": 1.39, - "learning_rate": 9.084776545371992e-05, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020239189550529484, + "loss": 0.0112, "step": 128980 }, { - "epoch": 1.39, - "learning_rate": 9.0831549588117e-05, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.00020238432781228083, + "loss": 0.0128, "step": 128990 }, { - "epoch": 1.39, - "learning_rate": 9.08153337225141e-05, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.0002023767601192668, + "loss": 0.0141, "step": 129000 }, { - "epoch": 1.39, - "eval_cer": 0.9215460437741146, - "eval_loss": 0.0069303130730986595, - "eval_runtime": 121.2397, - "eval_samples_per_second": 16.496, - "eval_steps_per_second": 4.124, + "epoch": 0.65, + "eval_cer": 0.9144857822411687, + "eval_loss": 0.009670346975326538, + "eval_runtime": 116.6611, + "eval_samples_per_second": 17.144, + "eval_steps_per_second": 4.286, "step": 129000 }, { - "epoch": 1.39, - "learning_rate": 9.07991178569112e-05, - "loss": 0.0092, + "epoch": 0.65, + "learning_rate": 0.00020236919242625282, + "loss": 0.0127, "step": 129010 }, { - "epoch": 1.39, - "learning_rate": 9.078290199130829e-05, - "loss": 0.0114, + "epoch": 0.65, + "learning_rate": 0.0002023616247332388, + "loss": 0.0134, "step": 129020 }, { - "epoch": 1.39, - "learning_rate": 9.076668612570538e-05, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020235405704022478, + "loss": 0.0115, "step": 129030 }, { - "epoch": 1.39, - "learning_rate": 9.075047026010248e-05, - "loss": 0.0062, + "epoch": 0.65, + "learning_rate": 0.00020234648934721076, + "loss": 0.0146, "step": 129040 }, { - "epoch": 1.4, - "learning_rate": 9.073425439449957e-05, - "loss": 0.0069, + "epoch": 0.65, + "learning_rate": 0.00020233892165419677, + "loss": 0.0119, "step": 129050 }, { - "epoch": 1.4, - "learning_rate": 9.071803852889667e-05, - "loss": 0.0105, + "epoch": 0.65, + "learning_rate": 0.00020233135396118275, + "loss": 0.0129, "step": 129060 }, { - "epoch": 1.4, - "learning_rate": 9.070182266329375e-05, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020232378626816873, + "loss": 0.0137, "step": 129070 }, { - "epoch": 1.4, - "learning_rate": 9.068560679769086e-05, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020231621857515474, + "loss": 0.0115, "step": 129080 }, { - "epoch": 1.4, - "learning_rate": 9.066939093208794e-05, - "loss": 0.0102, + "epoch": 0.65, + "learning_rate": 0.00020230865088214072, + "loss": 0.0122, "step": 129090 }, { - "epoch": 1.4, - "learning_rate": 9.065317506648505e-05, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.0002023010831891267, + "loss": 0.0133, "step": 129100 }, { - "epoch": 1.4, - "learning_rate": 9.063695920088212e-05, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.0002022935154961127, + "loss": 0.0194, "step": 129110 }, { - "epoch": 1.4, - "learning_rate": 9.062074333527923e-05, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.0002022859478030987, + "loss": 0.0124, "step": 129120 }, { - "epoch": 1.4, - "learning_rate": 9.060452746967632e-05, - "loss": 0.0096, + "epoch": 0.65, + "learning_rate": 0.00020227838011008467, + "loss": 0.0149, "step": 129130 }, { - "epoch": 1.4, - "learning_rate": 9.058831160407342e-05, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.00020227081241707068, + "loss": 0.0134, "step": 129140 }, { - "epoch": 1.4, - "learning_rate": 9.057209573847051e-05, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.00020226324472405666, + "loss": 0.0127, "step": 129150 }, { - "epoch": 1.4, - "learning_rate": 9.055587987286762e-05, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.00020225567703104265, + "loss": 0.0111, "step": 129160 }, { - "epoch": 1.4, - "learning_rate": 9.05396640072647e-05, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.00020224810933802865, + "loss": 0.0187, "step": 129170 }, { - "epoch": 1.4, - "learning_rate": 9.05234481416618e-05, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020224054164501464, + "loss": 0.0127, "step": 129180 }, { - "epoch": 1.4, - "learning_rate": 9.050723227605888e-05, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020223297395200062, + "loss": 0.0135, "step": 129190 }, { - "epoch": 1.4, - "learning_rate": 9.049101641045599e-05, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.0002022254062589866, + "loss": 0.0155, "step": 129200 }, { - "epoch": 1.4, - "learning_rate": 9.047480054485307e-05, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.0002022178385659726, + "loss": 0.0159, "step": 129210 }, { - "epoch": 1.4, - "learning_rate": 9.045858467925017e-05, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.0002022102708729586, + "loss": 0.0148, "step": 129220 }, { - "epoch": 1.4, - "learning_rate": 9.044236881364726e-05, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020220270317994457, + "loss": 0.0113, "step": 129230 }, { - "epoch": 1.4, - "learning_rate": 9.042615294804436e-05, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.00020219513548693058, + "loss": 0.0144, "step": 129240 }, { - "epoch": 1.4, - "learning_rate": 9.040993708244145e-05, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020218756779391656, + "loss": 0.015, "step": 129250 }, { - "epoch": 1.4, - "learning_rate": 9.039372121683854e-05, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020218000010090254, + "loss": 0.014, "step": 129260 }, { - "epoch": 1.4, - "learning_rate": 9.037750535123564e-05, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020217243240788855, + "loss": 0.0117, "step": 129270 }, { - "epoch": 1.4, - "learning_rate": 9.036128948563274e-05, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020216486471487453, + "loss": 0.0101, "step": 129280 }, { - "epoch": 1.4, - "learning_rate": 9.034507362002982e-05, - "loss": 0.0077, + "epoch": 0.65, + "learning_rate": 0.0002021572970218605, + "loss": 0.0203, "step": 129290 }, { - "epoch": 1.4, - "learning_rate": 9.032885775442693e-05, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.00020214972932884652, + "loss": 0.0156, "step": 129300 }, { - "epoch": 1.4, - "learning_rate": 9.0312641888824e-05, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.0002021421616358325, + "loss": 0.0155, "step": 129310 }, { - "epoch": 1.4, - "learning_rate": 9.029642602322111e-05, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020213459394281848, + "loss": 0.0165, "step": 129320 }, { - "epoch": 1.4, - "learning_rate": 9.02802101576182e-05, - "loss": 0.0068, + "epoch": 0.65, + "learning_rate": 0.0002021270262498045, + "loss": 0.0142, "step": 129330 }, { - "epoch": 1.4, - "learning_rate": 9.02639942920153e-05, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.00020211945855679047, + "loss": 0.0157, "step": 129340 }, { - "epoch": 1.4, - "learning_rate": 9.024777842641239e-05, - "loss": 0.0054, + "epoch": 0.65, + "learning_rate": 0.00020211189086377646, + "loss": 0.0149, "step": 129350 }, { - "epoch": 1.4, - "learning_rate": 9.023156256080948e-05, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020210432317076244, + "loss": 0.0159, "step": 129360 }, { - "epoch": 1.4, - "learning_rate": 9.021534669520658e-05, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.00020209675547774845, + "loss": 0.013, "step": 129370 }, { - "epoch": 1.4, - "learning_rate": 9.019913082960368e-05, - "loss": 0.0097, + "epoch": 0.65, + "learning_rate": 0.00020208918778473443, + "loss": 0.0159, "step": 129380 }, { - "epoch": 1.4, - "learning_rate": 9.018291496400076e-05, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.0002020816200917204, + "loss": 0.0134, "step": 129390 }, { - "epoch": 1.4, - "learning_rate": 9.016669909839787e-05, - "loss": 0.0061, + "epoch": 0.65, + "learning_rate": 0.00020207405239870642, + "loss": 0.0152, "step": 129400 }, { - "epoch": 1.4, - "learning_rate": 9.015048323279495e-05, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.0002020664847056924, + "loss": 0.0137, "step": 129410 }, { - "epoch": 1.4, - "learning_rate": 9.013426736719205e-05, - "loss": 0.0069, + "epoch": 0.65, + "learning_rate": 0.00020205891701267838, + "loss": 0.0123, "step": 129420 }, { - "epoch": 1.4, - "learning_rate": 9.011805150158913e-05, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.0002020513493196644, + "loss": 0.0144, "step": 129430 }, { - "epoch": 1.4, - "learning_rate": 9.010183563598624e-05, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.00020204378162665037, + "loss": 0.0143, "step": 129440 }, { - "epoch": 1.4, - "learning_rate": 9.008561977038333e-05, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020203621393363635, + "loss": 0.0182, "step": 129450 }, { - "epoch": 1.4, - "learning_rate": 9.006940390478042e-05, - "loss": 0.0061, + "epoch": 0.65, + "learning_rate": 0.00020202864624062236, + "loss": 0.0125, "step": 129460 }, { - "epoch": 1.4, - "learning_rate": 9.005318803917752e-05, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020202107854760834, + "loss": 0.0149, "step": 129470 }, { - "epoch": 1.4, - "learning_rate": 9.003697217357462e-05, - "loss": 0.0067, + "epoch": 0.65, + "learning_rate": 0.00020201351085459432, + "loss": 0.014, "step": 129480 }, { - "epoch": 1.4, - "learning_rate": 9.002075630797172e-05, - "loss": 0.0077, + "epoch": 0.65, + "learning_rate": 0.00020200594316158033, + "loss": 0.0154, "step": 129490 }, { - "epoch": 1.4, - "learning_rate": 9.000454044236881e-05, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.0002019983754685663, + "loss": 0.0112, "step": 129500 }, { - "epoch": 1.4, - "learning_rate": 8.99883245767659e-05, - "loss": 0.0094, + "epoch": 0.65, + "learning_rate": 0.0002019908077755523, + "loss": 0.0152, "step": 129510 }, { - "epoch": 1.4, - "learning_rate": 8.9972108711163e-05, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020198324008253828, + "loss": 0.0138, "step": 129520 }, { - "epoch": 1.4, - "learning_rate": 8.99558928455601e-05, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020197567238952428, + "loss": 0.0143, "step": 129530 }, { - "epoch": 1.4, - "learning_rate": 8.993967697995718e-05, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020196810469651027, + "loss": 0.0149, "step": 129540 }, { - "epoch": 1.4, - "learning_rate": 8.992346111435429e-05, - "loss": 0.0064, + "epoch": 0.65, + "learning_rate": 0.00020196053700349625, + "loss": 0.0143, "step": 129550 }, { - "epoch": 1.4, - "learning_rate": 8.990724524875137e-05, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.00020195296931048226, + "loss": 0.0143, "step": 129560 }, { - "epoch": 1.4, - "learning_rate": 8.989102938314847e-05, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020194540161746824, + "loss": 0.0117, "step": 129570 }, { - "epoch": 1.4, - "learning_rate": 8.987481351754555e-05, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020193783392445422, + "loss": 0.0162, "step": 129580 }, { - "epoch": 1.4, - "learning_rate": 8.985859765194266e-05, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.00020193026623144023, + "loss": 0.0157, "step": 129590 }, { - "epoch": 1.4, - "learning_rate": 8.984238178633975e-05, - "loss": 0.0101, + "epoch": 0.65, + "learning_rate": 0.0002019226985384262, + "loss": 0.0126, "step": 129600 }, { - "epoch": 1.4, - "learning_rate": 8.982616592073684e-05, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.0002019151308454122, + "loss": 0.0129, "step": 129610 }, { - "epoch": 1.4, - "learning_rate": 8.980995005513394e-05, - "loss": 0.0096, + "epoch": 0.65, + "learning_rate": 0.0002019075631523982, + "loss": 0.0119, "step": 129620 }, { - "epoch": 1.4, - "learning_rate": 8.979373418953104e-05, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020189999545938418, + "loss": 0.0114, "step": 129630 }, { - "epoch": 1.4, - "learning_rate": 8.977751832392812e-05, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020189242776637016, + "loss": 0.013, "step": 129640 }, { - "epoch": 1.4, - "learning_rate": 8.976130245832523e-05, - "loss": 0.0107, + "epoch": 0.65, + "learning_rate": 0.00020188486007335617, + "loss": 0.013, "step": 129650 }, { - "epoch": 1.4, - "learning_rate": 8.974508659272231e-05, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020187729238034215, + "loss": 0.0171, "step": 129660 }, { - "epoch": 1.4, - "learning_rate": 8.972887072711941e-05, - "loss": 0.0065, + "epoch": 0.65, + "learning_rate": 0.00020186972468732813, + "loss": 0.0131, "step": 129670 }, { - "epoch": 1.4, - "learning_rate": 8.971265486151649e-05, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020186215699431414, + "loss": 0.0148, "step": 129680 }, { - "epoch": 1.4, - "learning_rate": 8.96964389959136e-05, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020185458930130012, + "loss": 0.0105, "step": 129690 }, { - "epoch": 1.4, - "learning_rate": 8.968022313031069e-05, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.0002018470216082861, + "loss": 0.0118, "step": 129700 }, { - "epoch": 1.4, - "learning_rate": 8.966400726470778e-05, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020183945391527209, + "loss": 0.0148, "step": 129710 }, { - "epoch": 1.4, - "learning_rate": 8.964779139910488e-05, - "loss": 0.0107, + "epoch": 0.65, + "learning_rate": 0.0002018318862222581, + "loss": 0.0144, "step": 129720 }, { - "epoch": 1.4, - "learning_rate": 8.963157553350197e-05, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.00020182431852924408, + "loss": 0.0129, "step": 129730 }, { - "epoch": 1.4, - "learning_rate": 8.961535966789906e-05, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020181675083623006, + "loss": 0.0102, "step": 129740 }, { - "epoch": 1.4, - "learning_rate": 8.959914380229617e-05, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020180918314321607, + "loss": 0.0126, "step": 129750 }, { - "epoch": 1.4, - "learning_rate": 8.958292793669325e-05, - "loss": 0.0077, + "epoch": 0.65, + "learning_rate": 0.00020180161545020205, + "loss": 0.0114, "step": 129760 }, { - "epoch": 1.4, - "learning_rate": 8.956671207109035e-05, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020179404775718803, + "loss": 0.0135, "step": 129770 }, { - "epoch": 1.4, - "learning_rate": 8.955049620548743e-05, - "loss": 0.0104, + "epoch": 0.65, + "learning_rate": 0.00020178648006417404, + "loss": 0.0139, "step": 129780 }, { - "epoch": 1.4, - "learning_rate": 8.953428033988454e-05, - "loss": 0.0125, + "epoch": 0.65, + "learning_rate": 0.00020177891237116002, + "loss": 0.0132, "step": 129790 }, { - "epoch": 1.4, - "learning_rate": 8.951806447428162e-05, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.000201771344678146, + "loss": 0.0142, "step": 129800 }, { - "epoch": 1.4, - "learning_rate": 8.950184860867873e-05, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.000201763776985132, + "loss": 0.0156, "step": 129810 }, { - "epoch": 1.4, - "learning_rate": 8.948563274307582e-05, - "loss": 0.0077, + "epoch": 0.65, + "learning_rate": 0.000201756209292118, + "loss": 0.0145, "step": 129820 }, { - "epoch": 1.4, - "learning_rate": 8.946941687747291e-05, - "loss": 0.0093, + "epoch": 0.66, + "learning_rate": 0.00020174864159910397, + "loss": 0.0146, "step": 129830 }, { - "epoch": 1.4, - "learning_rate": 8.945320101187e-05, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020174107390608998, + "loss": 0.0128, "step": 129840 }, { - "epoch": 1.4, - "learning_rate": 8.943698514626711e-05, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020173350621307596, + "loss": 0.0139, "step": 129850 }, { - "epoch": 1.4, - "learning_rate": 8.942076928066419e-05, - "loss": 0.0107, + "epoch": 0.66, + "learning_rate": 0.00020172593852006194, + "loss": 0.0145, "step": 129860 }, { - "epoch": 1.4, - "learning_rate": 8.94045534150613e-05, - "loss": 0.009, + "epoch": 0.66, + "learning_rate": 0.00020171837082704792, + "loss": 0.0142, "step": 129870 }, { - "epoch": 1.4, - "learning_rate": 8.938833754945837e-05, - "loss": 0.0063, + "epoch": 0.66, + "learning_rate": 0.00020171080313403393, + "loss": 0.0132, "step": 129880 }, { - "epoch": 1.4, - "learning_rate": 8.937212168385548e-05, - "loss": 0.0093, + "epoch": 0.66, + "learning_rate": 0.00020170323544101991, + "loss": 0.0127, "step": 129890 }, { - "epoch": 1.4, - "learning_rate": 8.935590581825256e-05, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.0002016956677480059, + "loss": 0.0136, "step": 129900 }, { - "epoch": 1.4, - "learning_rate": 8.933968995264967e-05, - "loss": 0.0072, + "epoch": 0.66, + "learning_rate": 0.0002016881000549919, + "loss": 0.0135, "step": 129910 }, { - "epoch": 1.4, - "learning_rate": 8.932347408704676e-05, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.00020168053236197789, + "loss": 0.0127, "step": 129920 }, { - "epoch": 1.4, - "learning_rate": 8.930725822144385e-05, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020167296466896387, + "loss": 0.0122, "step": 129930 }, { - "epoch": 1.4, - "learning_rate": 8.929104235584094e-05, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.00020166539697594988, + "loss": 0.0163, "step": 129940 }, { - "epoch": 1.4, - "learning_rate": 8.927482649023805e-05, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020165782928293586, + "loss": 0.0134, "step": 129950 }, { - "epoch": 1.4, - "learning_rate": 8.925861062463513e-05, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.00020165026158992184, + "loss": 0.0132, "step": 129960 }, { - "epoch": 1.41, - "learning_rate": 8.924239475903224e-05, - "loss": 0.0065, + "epoch": 0.66, + "learning_rate": 0.00020164269389690785, + "loss": 0.0164, "step": 129970 }, { - "epoch": 1.41, - "learning_rate": 8.922617889342932e-05, - "loss": 0.0075, + "epoch": 0.66, + "learning_rate": 0.00020163512620389383, + "loss": 0.0125, "step": 129980 }, { - "epoch": 1.41, - "learning_rate": 8.920996302782642e-05, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.0002016275585108798, + "loss": 0.0152, "step": 129990 }, { - "epoch": 1.41, - "learning_rate": 8.91937471622235e-05, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020161999081786582, + "loss": 0.0161, "step": 130000 }, { - "epoch": 1.41, - "eval_cer": 0.9215477809800273, - "eval_loss": 0.00709355715662241, - "eval_runtime": 121.4935, - "eval_samples_per_second": 16.462, - "eval_steps_per_second": 4.115, + "epoch": 0.66, + "eval_cer": 0.9144828710527925, + "eval_loss": 0.009702015668153763, + "eval_runtime": 116.6027, + "eval_samples_per_second": 17.152, + "eval_steps_per_second": 4.288, "step": 130000 }, { - "epoch": 1.41, - "learning_rate": 8.917753129662061e-05, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.0002016124231248518, + "loss": 0.0188, "step": 130010 }, { - "epoch": 1.41, - "learning_rate": 8.91613154310177e-05, - "loss": 0.0071, + "epoch": 0.66, + "learning_rate": 0.00020160485543183778, + "loss": 0.0146, "step": 130020 }, { - "epoch": 1.41, - "learning_rate": 8.914509956541479e-05, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.00020159728773882376, + "loss": 0.0123, "step": 130030 }, { - "epoch": 1.41, - "learning_rate": 8.912888369981189e-05, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020158972004580977, + "loss": 0.013, "step": 130040 }, { - "epoch": 1.41, - "learning_rate": 8.911266783420898e-05, - "loss": 0.01, + "epoch": 0.66, + "learning_rate": 0.00020158215235279575, + "loss": 0.0145, "step": 130050 }, { - "epoch": 1.41, - "learning_rate": 8.909645196860607e-05, - "loss": 0.0062, + "epoch": 0.66, + "learning_rate": 0.00020157458465978173, + "loss": 0.0136, "step": 130060 }, { - "epoch": 1.41, - "learning_rate": 8.908023610300318e-05, - "loss": 0.0074, + "epoch": 0.66, + "learning_rate": 0.00020156701696676774, + "loss": 0.0117, "step": 130070 }, { - "epoch": 1.41, - "learning_rate": 8.906402023740026e-05, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020155944927375372, + "loss": 0.0131, "step": 130080 }, { - "epoch": 1.41, - "learning_rate": 8.904780437179736e-05, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020155188158073968, + "loss": 0.0142, "step": 130090 }, { - "epoch": 1.41, - "learning_rate": 8.903158850619444e-05, - "loss": 0.0069, + "epoch": 0.66, + "learning_rate": 0.00020154431388772566, + "loss": 0.0159, "step": 130100 }, { - "epoch": 1.41, - "learning_rate": 8.901537264059155e-05, - "loss": 0.0106, + "epoch": 0.66, + "learning_rate": 0.00020153674619471167, + "loss": 0.0168, "step": 130110 }, { - "epoch": 1.41, - "learning_rate": 8.899915677498863e-05, - "loss": 0.0089, + "epoch": 0.66, + "learning_rate": 0.00020152917850169765, + "loss": 0.0158, "step": 130120 }, { - "epoch": 1.41, - "learning_rate": 8.898294090938573e-05, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020152161080868363, + "loss": 0.0163, "step": 130130 }, { - "epoch": 1.41, - "learning_rate": 8.896672504378283e-05, - "loss": 0.0072, + "epoch": 0.66, + "learning_rate": 0.00020151404311566964, + "loss": 0.0116, "step": 130140 }, { - "epoch": 1.41, - "learning_rate": 8.895050917817992e-05, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.00020150647542265562, + "loss": 0.0121, "step": 130150 }, { - "epoch": 1.41, - "learning_rate": 8.893429331257701e-05, - "loss": 0.0102, + "epoch": 0.66, + "learning_rate": 0.0002014989077296416, + "loss": 0.012, "step": 130160 }, { - "epoch": 1.41, - "learning_rate": 8.891807744697412e-05, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.0002014913400366276, + "loss": 0.0146, "step": 130170 }, { - "epoch": 1.41, - "learning_rate": 8.89018615813712e-05, - "loss": 0.0064, + "epoch": 0.66, + "learning_rate": 0.0002014837723436136, + "loss": 0.012, "step": 130180 }, { - "epoch": 1.41, - "learning_rate": 8.88856457157683e-05, - "loss": 0.0098, + "epoch": 0.66, + "learning_rate": 0.00020147620465059957, + "loss": 0.0134, "step": 130190 }, { - "epoch": 1.41, - "learning_rate": 8.88694298501654e-05, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020146863695758558, + "loss": 0.0143, "step": 130200 }, { - "epoch": 1.41, - "learning_rate": 8.885321398456249e-05, - "loss": 0.0123, + "epoch": 0.66, + "learning_rate": 0.00020146106926457156, + "loss": 0.0201, "step": 130210 }, { - "epoch": 1.41, - "learning_rate": 8.88369981189596e-05, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020145350157155755, + "loss": 0.0137, "step": 130220 }, { - "epoch": 1.41, - "learning_rate": 8.882078225335667e-05, - "loss": 0.0114, + "epoch": 0.66, + "learning_rate": 0.00020144593387854355, + "loss": 0.0121, "step": 130230 }, { - "epoch": 1.41, - "learning_rate": 8.880456638775378e-05, - "loss": 0.0089, + "epoch": 0.66, + "learning_rate": 0.00020143836618552954, + "loss": 0.0109, "step": 130240 }, { - "epoch": 1.41, - "learning_rate": 8.878835052215086e-05, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020143079849251552, + "loss": 0.0135, "step": 130250 }, { - "epoch": 1.41, - "learning_rate": 8.877213465654797e-05, - "loss": 0.0099, + "epoch": 0.66, + "learning_rate": 0.0002014232307995015, + "loss": 0.0118, "step": 130260 }, { - "epoch": 1.41, - "learning_rate": 8.875591879094505e-05, - "loss": 0.0069, + "epoch": 0.66, + "learning_rate": 0.0002014156631064875, + "loss": 0.0164, "step": 130270 }, { - "epoch": 1.41, - "learning_rate": 8.873970292534215e-05, - "loss": 0.0062, + "epoch": 0.66, + "learning_rate": 0.0002014080954134735, + "loss": 0.0132, "step": 130280 }, { - "epoch": 1.41, - "learning_rate": 8.872348705973924e-05, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020140052772045947, + "loss": 0.014, "step": 130290 }, { - "epoch": 1.41, - "learning_rate": 8.870727119413634e-05, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020139296002744548, + "loss": 0.0133, "step": 130300 }, { - "epoch": 1.41, - "learning_rate": 8.869105532853343e-05, - "loss": 0.0124, + "epoch": 0.66, + "learning_rate": 0.00020138539233443146, + "loss": 0.0155, "step": 130310 }, { - "epoch": 1.41, - "learning_rate": 8.867483946293054e-05, - "loss": 0.0075, + "epoch": 0.66, + "learning_rate": 0.00020137782464141744, + "loss": 0.017, "step": 130320 }, { - "epoch": 1.41, - "learning_rate": 8.865862359732762e-05, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020137025694840345, + "loss": 0.0145, "step": 130330 }, { - "epoch": 1.41, - "learning_rate": 8.864240773172472e-05, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020136268925538943, + "loss": 0.0138, "step": 130340 }, { - "epoch": 1.41, - "learning_rate": 8.86261918661218e-05, - "loss": 0.0089, + "epoch": 0.66, + "learning_rate": 0.0002013551215623754, + "loss": 0.0117, "step": 130350 }, { - "epoch": 1.41, - "learning_rate": 8.860997600051891e-05, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.00020134755386936142, + "loss": 0.0131, "step": 130360 }, { - "epoch": 1.41, - "learning_rate": 8.859376013491599e-05, - "loss": 0.012, + "epoch": 0.66, + "learning_rate": 0.0002013399861763474, + "loss": 0.0135, "step": 130370 }, { - "epoch": 1.41, - "learning_rate": 8.857754426931309e-05, - "loss": 0.0072, + "epoch": 0.66, + "learning_rate": 0.00020133241848333338, + "loss": 0.0123, "step": 130380 }, { - "epoch": 1.41, - "learning_rate": 8.856132840371019e-05, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.0002013248507903194, + "loss": 0.0159, "step": 130390 }, { - "epoch": 1.41, - "learning_rate": 8.854511253810728e-05, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020131728309730537, + "loss": 0.018, "step": 130400 }, { - "epoch": 1.41, - "learning_rate": 8.852889667250437e-05, - "loss": 0.0102, + "epoch": 0.66, + "learning_rate": 0.00020130971540429136, + "loss": 0.0128, "step": 130410 }, { - "epoch": 1.41, - "learning_rate": 8.851268080690146e-05, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020130214771127734, + "loss": 0.0131, "step": 130420 }, { - "epoch": 1.41, - "learning_rate": 8.849646494129856e-05, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020129458001826335, + "loss": 0.0135, "step": 130430 }, { - "epoch": 1.41, - "learning_rate": 8.848024907569566e-05, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.00020128701232524933, + "loss": 0.0147, "step": 130440 }, { - "epoch": 1.41, - "learning_rate": 8.846403321009274e-05, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.0002012794446322353, + "loss": 0.0171, "step": 130450 }, { - "epoch": 1.41, - "learning_rate": 8.844781734448985e-05, - "loss": 0.0107, + "epoch": 0.66, + "learning_rate": 0.00020127187693922132, + "loss": 0.0132, "step": 130460 }, { - "epoch": 1.41, - "learning_rate": 8.843160147888693e-05, - "loss": 0.0101, + "epoch": 0.66, + "learning_rate": 0.0002012643092462073, + "loss": 0.0136, "step": 130470 }, { - "epoch": 1.41, - "learning_rate": 8.841538561328403e-05, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.00020125674155319328, + "loss": 0.0139, "step": 130480 }, { - "epoch": 1.41, - "learning_rate": 8.839916974768113e-05, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.0002012491738601793, + "loss": 0.0135, "step": 130490 }, { - "epoch": 1.41, - "learning_rate": 8.838295388207822e-05, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020124160616716527, + "loss": 0.0121, "step": 130500 }, { - "epoch": 1.41, - "learning_rate": 8.836673801647531e-05, - "loss": 0.0069, + "epoch": 0.66, + "learning_rate": 0.00020123403847415125, + "loss": 0.0146, "step": 130510 }, { - "epoch": 1.41, - "learning_rate": 8.83505221508724e-05, - "loss": 0.0068, + "epoch": 0.66, + "learning_rate": 0.00020122647078113726, + "loss": 0.0149, "step": 130520 }, { - "epoch": 1.41, - "learning_rate": 8.83343062852695e-05, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.00020121890308812324, + "loss": 0.0157, "step": 130530 }, { - "epoch": 1.41, - "learning_rate": 8.83180904196666e-05, - "loss": 0.0102, + "epoch": 0.66, + "learning_rate": 0.00020121133539510922, + "loss": 0.0126, "step": 130540 }, { - "epoch": 1.41, - "learning_rate": 8.830187455406368e-05, - "loss": 0.0108, + "epoch": 0.66, + "learning_rate": 0.00020120376770209523, + "loss": 0.0113, "step": 130550 }, { - "epoch": 1.41, - "learning_rate": 8.828565868846079e-05, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.0002011962000090812, + "loss": 0.0197, "step": 130560 }, { - "epoch": 1.41, - "learning_rate": 8.826944282285787e-05, - "loss": 0.0093, + "epoch": 0.66, + "learning_rate": 0.0002011886323160672, + "loss": 0.0133, "step": 130570 }, { - "epoch": 1.41, - "learning_rate": 8.825322695725497e-05, - "loss": 0.0089, + "epoch": 0.66, + "learning_rate": 0.0002011810646230532, + "loss": 0.0151, "step": 130580 }, { - "epoch": 1.41, - "learning_rate": 8.823701109165205e-05, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020117349693003918, + "loss": 0.0155, "step": 130590 }, { - "epoch": 1.41, - "learning_rate": 8.822079522604916e-05, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020116592923702517, + "loss": 0.0148, "step": 130600 }, { - "epoch": 1.41, - "learning_rate": 8.820457936044625e-05, - "loss": 0.0113, + "epoch": 0.66, + "learning_rate": 0.00020115836154401115, + "loss": 0.0139, "step": 130610 }, { - "epoch": 1.41, - "learning_rate": 8.818836349484335e-05, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020115079385099716, + "loss": 0.0117, "step": 130620 }, { - "epoch": 1.41, - "learning_rate": 8.817214762924044e-05, - "loss": 0.0088, + "epoch": 0.66, + "learning_rate": 0.00020114322615798314, + "loss": 0.0157, "step": 130630 }, { - "epoch": 1.41, - "learning_rate": 8.815593176363754e-05, - "loss": 0.0088, + "epoch": 0.66, + "learning_rate": 0.00020113565846496912, + "loss": 0.0122, "step": 130640 }, { - "epoch": 1.41, - "learning_rate": 8.813971589803462e-05, - "loss": 0.0109, + "epoch": 0.66, + "learning_rate": 0.00020112809077195513, + "loss": 0.0144, "step": 130650 }, { - "epoch": 1.41, - "learning_rate": 8.812350003243173e-05, - "loss": 0.0092, + "epoch": 0.66, + "learning_rate": 0.0002011205230789411, + "loss": 0.0109, "step": 130660 }, { - "epoch": 1.41, - "learning_rate": 8.810728416682881e-05, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.0002011129553859271, + "loss": 0.016, "step": 130670 }, { - "epoch": 1.41, - "learning_rate": 8.809106830122592e-05, - "loss": 0.0088, + "epoch": 0.66, + "learning_rate": 0.0002011053876929131, + "loss": 0.0129, "step": 130680 }, { - "epoch": 1.41, - "learning_rate": 8.8074852435623e-05, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020109781999989908, + "loss": 0.0159, "step": 130690 }, { - "epoch": 1.41, - "learning_rate": 8.80586365700201e-05, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.00020109025230688506, + "loss": 0.0155, "step": 130700 }, { - "epoch": 1.41, - "learning_rate": 8.80424207044172e-05, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020108268461387107, + "loss": 0.0149, "step": 130710 }, { - "epoch": 1.41, - "learning_rate": 8.802620483881429e-05, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.00020107511692085705, + "loss": 0.0126, "step": 130720 }, { - "epoch": 1.41, - "learning_rate": 8.800998897321138e-05, - "loss": 0.0069, + "epoch": 0.66, + "learning_rate": 0.00020106754922784303, + "loss": 0.012, "step": 130730 }, { - "epoch": 1.41, - "learning_rate": 8.799377310760847e-05, - "loss": 0.0063, + "epoch": 0.66, + "learning_rate": 0.00020105998153482904, + "loss": 0.0123, "step": 130740 }, { - "epoch": 1.41, - "learning_rate": 8.797755724200556e-05, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020105241384181502, + "loss": 0.0133, "step": 130750 }, { - "epoch": 1.41, - "learning_rate": 8.796134137640267e-05, - "loss": 0.0089, + "epoch": 0.66, + "learning_rate": 0.000201044846148801, + "loss": 0.0175, "step": 130760 }, { - "epoch": 1.41, - "learning_rate": 8.794512551079975e-05, - "loss": 0.0097, + "epoch": 0.66, + "learning_rate": 0.00020103727845578699, + "loss": 0.0149, "step": 130770 }, { - "epoch": 1.41, - "learning_rate": 8.792890964519686e-05, - "loss": 0.006, + "epoch": 0.66, + "learning_rate": 0.000201029710762773, + "loss": 0.015, "step": 130780 }, { - "epoch": 1.41, - "learning_rate": 8.791269377959394e-05, - "loss": 0.0092, + "epoch": 0.66, + "learning_rate": 0.00020102214306975898, + "loss": 0.0116, "step": 130790 }, { - "epoch": 1.41, - "learning_rate": 8.789647791399104e-05, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.00020101457537674496, + "loss": 0.0112, "step": 130800 }, { - "epoch": 1.41, - "learning_rate": 8.788026204838812e-05, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.00020100700768373097, + "loss": 0.0121, "step": 130810 }, { - "epoch": 1.41, - "learning_rate": 8.786404618278523e-05, - "loss": 0.0106, + "epoch": 0.66, + "learning_rate": 0.00020099943999071695, + "loss": 0.0189, "step": 130820 }, { - "epoch": 1.41, - "learning_rate": 8.784783031718232e-05, - "loss": 0.009, + "epoch": 0.66, + "learning_rate": 0.00020099187229770293, + "loss": 0.0152, "step": 130830 }, { - "epoch": 1.41, - "learning_rate": 8.783161445157941e-05, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020098430460468894, + "loss": 0.0132, "step": 130840 }, { - "epoch": 1.41, - "learning_rate": 8.78153985859765e-05, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.00020097673691167492, + "loss": 0.0127, "step": 130850 }, { - "epoch": 1.41, - "learning_rate": 8.779918272037361e-05, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.0002009691692186609, + "loss": 0.0109, "step": 130860 }, { - "epoch": 1.41, - "learning_rate": 8.778296685477069e-05, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.0002009616015256469, + "loss": 0.0161, "step": 130870 }, { - "epoch": 1.41, - "learning_rate": 8.77667509891678e-05, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.0002009540338326329, + "loss": 0.015, "step": 130880 }, { - "epoch": 1.41, - "learning_rate": 8.775053512356488e-05, - "loss": 0.0069, + "epoch": 0.66, + "learning_rate": 0.00020094646613961887, + "loss": 0.0112, "step": 130890 }, { - "epoch": 1.42, - "learning_rate": 8.773431925796198e-05, - "loss": 0.0074, + "epoch": 0.66, + "learning_rate": 0.00020093889844660488, + "loss": 0.0136, "step": 130900 }, { - "epoch": 1.42, - "learning_rate": 8.771810339235906e-05, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020093133075359086, + "loss": 0.0122, "step": 130910 }, { - "epoch": 1.42, - "learning_rate": 8.770188752675617e-05, - "loss": 0.0097, + "epoch": 0.66, + "learning_rate": 0.00020092376306057684, + "loss": 0.0134, "step": 130920 }, { - "epoch": 1.42, - "learning_rate": 8.768567166115328e-05, - "loss": 0.0093, + "epoch": 0.66, + "learning_rate": 0.00020091619536756282, + "loss": 0.0165, "step": 130930 }, { - "epoch": 1.42, - "learning_rate": 8.766945579555035e-05, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020090862767454883, + "loss": 0.0144, "step": 130940 }, { - "epoch": 1.42, - "learning_rate": 8.765323992994746e-05, - "loss": 0.0093, + "epoch": 0.66, + "learning_rate": 0.00020090105998153481, + "loss": 0.0148, "step": 130950 }, { - "epoch": 1.42, - "learning_rate": 8.763702406434455e-05, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.0002008934922885208, + "loss": 0.0157, "step": 130960 }, { - "epoch": 1.42, - "learning_rate": 8.762080819874165e-05, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.0002008859245955068, + "loss": 0.0184, "step": 130970 }, { - "epoch": 1.42, - "learning_rate": 8.760459233313874e-05, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020087835690249279, + "loss": 0.0131, "step": 130980 }, { - "epoch": 1.42, - "learning_rate": 8.758837646753583e-05, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020087078920947877, + "loss": 0.0125, "step": 130990 }, { - "epoch": 1.42, - "learning_rate": 8.757216060193292e-05, - "loss": 0.0107, + "epoch": 0.66, + "learning_rate": 0.00020086322151646478, + "loss": 0.0129, "step": 131000 }, { - "epoch": 1.42, - "eval_cer": 0.9215486495829838, - "eval_loss": 0.006674186792224646, - "eval_runtime": 121.2703, - "eval_samples_per_second": 16.492, - "eval_steps_per_second": 4.123, + "epoch": 0.66, + "eval_cer": 0.9145090717481783, + "eval_loss": 0.009523593820631504, + "eval_runtime": 116.9784, + "eval_samples_per_second": 17.097, + "eval_steps_per_second": 4.274, "step": 131000 }, { - "epoch": 1.42, - "learning_rate": 8.755594473633003e-05, - "loss": 0.013, + "epoch": 0.66, + "learning_rate": 0.00020085565382345076, + "loss": 0.0139, "step": 131010 }, { - "epoch": 1.42, - "learning_rate": 8.753972887072711e-05, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020084808613043674, + "loss": 0.0161, "step": 131020 }, { - "epoch": 1.42, - "learning_rate": 8.752351300512422e-05, - "loss": 0.0114, + "epoch": 0.66, + "learning_rate": 0.00020084051843742275, + "loss": 0.0112, "step": 131030 }, { - "epoch": 1.42, - "learning_rate": 8.75072971395213e-05, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020083295074440873, + "loss": 0.0114, "step": 131040 }, { - "epoch": 1.42, - "learning_rate": 8.74910812739184e-05, + "epoch": 0.66, + "learning_rate": 0.0002008253830513947, "loss": 0.0119, "step": 131050 }, { - "epoch": 1.42, - "learning_rate": 8.747486540831548e-05, - "loss": 0.0089, + "epoch": 0.66, + "learning_rate": 0.00020081781535838072, + "loss": 0.0165, "step": 131060 }, { - "epoch": 1.42, - "learning_rate": 8.745864954271259e-05, - "loss": 0.0105, + "epoch": 0.66, + "learning_rate": 0.0002008102476653667, + "loss": 0.0111, "step": 131070 }, { - "epoch": 1.42, - "learning_rate": 8.744243367710968e-05, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020080267997235268, + "loss": 0.0125, "step": 131080 }, { - "epoch": 1.42, - "learning_rate": 8.742621781150677e-05, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.0002007951122793387, + "loss": 0.0126, "step": 131090 }, { - "epoch": 1.42, - "learning_rate": 8.741000194590387e-05, - "loss": 0.0112, + "epoch": 0.66, + "learning_rate": 0.00020078754458632467, + "loss": 0.0132, "step": 131100 }, { - "epoch": 1.42, - "learning_rate": 8.739378608030097e-05, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020077997689331065, + "loss": 0.0137, "step": 131110 }, { - "epoch": 1.42, - "learning_rate": 8.737757021469805e-05, - "loss": 0.0093, + "epoch": 0.66, + "learning_rate": 0.00020077240920029663, + "loss": 0.0126, "step": 131120 }, { - "epoch": 1.42, - "learning_rate": 8.736135434909516e-05, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020076484150728264, + "loss": 0.0139, "step": 131130 }, { - "epoch": 1.42, - "learning_rate": 8.734513848349224e-05, - "loss": 0.0069, + "epoch": 0.66, + "learning_rate": 0.00020075727381426862, + "loss": 0.0147, "step": 131140 }, { - "epoch": 1.42, - "learning_rate": 8.732892261788934e-05, - "loss": 0.0067, + "epoch": 0.66, + "learning_rate": 0.0002007497061212546, + "loss": 0.0149, "step": 131150 }, { - "epoch": 1.42, - "learning_rate": 8.731270675228642e-05, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020074213842824061, + "loss": 0.0187, "step": 131160 }, { - "epoch": 1.42, - "learning_rate": 8.729649088668353e-05, - "loss": 0.0074, + "epoch": 0.66, + "learning_rate": 0.0002007345707352266, + "loss": 0.0143, "step": 131170 }, { - "epoch": 1.42, - "learning_rate": 8.728027502108062e-05, - "loss": 0.0105, + "epoch": 0.66, + "learning_rate": 0.00020072700304221258, + "loss": 0.0157, "step": 131180 }, { - "epoch": 1.42, - "learning_rate": 8.726405915547771e-05, - "loss": 0.0089, + "epoch": 0.66, + "learning_rate": 0.00020071943534919859, + "loss": 0.0176, "step": 131190 }, { - "epoch": 1.42, - "learning_rate": 8.72478432898748e-05, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020071186765618457, + "loss": 0.0137, "step": 131200 }, { - "epoch": 1.42, - "learning_rate": 8.72316274242719e-05, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020070429996317055, + "loss": 0.0128, "step": 131210 }, { - "epoch": 1.42, - "learning_rate": 8.721541155866899e-05, - "loss": 0.0063, + "epoch": 0.66, + "learning_rate": 0.00020069673227015656, + "loss": 0.0139, "step": 131220 }, { - "epoch": 1.42, - "learning_rate": 8.71991956930661e-05, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020068916457714254, + "loss": 0.014, "step": 131230 }, { - "epoch": 1.42, - "learning_rate": 8.718297982746318e-05, - "loss": 0.0104, + "epoch": 0.66, + "learning_rate": 0.00020068159688412852, + "loss": 0.0117, "step": 131240 }, { - "epoch": 1.42, - "learning_rate": 8.716676396186028e-05, - "loss": 0.0107, + "epoch": 0.66, + "learning_rate": 0.00020067402919111453, + "loss": 0.0152, "step": 131250 }, { - "epoch": 1.42, - "learning_rate": 8.715054809625736e-05, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.0002006664614981005, + "loss": 0.0124, "step": 131260 }, { - "epoch": 1.42, - "learning_rate": 8.713433223065447e-05, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.0002006588938050865, + "loss": 0.0135, "step": 131270 }, { - "epoch": 1.42, - "learning_rate": 8.711811636505155e-05, - "loss": 0.0068, + "epoch": 0.66, + "learning_rate": 0.00020065132611207247, + "loss": 0.0143, "step": 131280 }, { - "epoch": 1.42, - "learning_rate": 8.710190049944865e-05, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.00020064375841905848, + "loss": 0.0141, "step": 131290 }, { - "epoch": 1.42, - "learning_rate": 8.708568463384575e-05, - "loss": 0.0067, + "epoch": 0.66, + "learning_rate": 0.00020063619072604446, + "loss": 0.0137, "step": 131300 }, { - "epoch": 1.42, - "learning_rate": 8.706946876824284e-05, - "loss": 0.011, + "epoch": 0.66, + "learning_rate": 0.00020062862303303044, + "loss": 0.0125, "step": 131310 }, { - "epoch": 1.42, - "learning_rate": 8.705325290263993e-05, - "loss": 0.0088, + "epoch": 0.66, + "learning_rate": 0.00020062105534001645, + "loss": 0.0113, "step": 131320 }, { - "epoch": 1.42, - "learning_rate": 8.703703703703704e-05, - "loss": 0.0063, + "epoch": 0.66, + "learning_rate": 0.00020061348764700243, + "loss": 0.0145, "step": 131330 }, { - "epoch": 1.42, - "learning_rate": 8.702082117143412e-05, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020060591995398842, + "loss": 0.0164, "step": 131340 }, { - "epoch": 1.42, - "learning_rate": 8.700460530583122e-05, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.00020059835226097437, + "loss": 0.015, "step": 131350 }, { - "epoch": 1.42, - "learning_rate": 8.69883894402283e-05, - "loss": 0.0108, + "epoch": 0.66, + "learning_rate": 0.00020059078456796038, + "loss": 0.014, "step": 131360 }, { - "epoch": 1.42, - "learning_rate": 8.697217357462541e-05, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020058321687494636, + "loss": 0.0136, "step": 131370 }, { - "epoch": 1.42, - "learning_rate": 8.695595770902249e-05, - "loss": 0.0071, + "epoch": 0.66, + "learning_rate": 0.00020057564918193234, + "loss": 0.0184, "step": 131380 }, { - "epoch": 1.42, - "learning_rate": 8.69397418434196e-05, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020056808148891835, + "loss": 0.0122, "step": 131390 }, { - "epoch": 1.42, - "learning_rate": 8.692352597781669e-05, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.00020056051379590433, + "loss": 0.0152, "step": 131400 }, { - "epoch": 1.42, - "learning_rate": 8.690731011221378e-05, - "loss": 0.0116, + "epoch": 0.66, + "learning_rate": 0.0002005529461028903, + "loss": 0.0142, "step": 131410 }, { - "epoch": 1.42, - "learning_rate": 8.689109424661087e-05, - "loss": 0.0111, + "epoch": 0.66, + "learning_rate": 0.00020054537840987632, + "loss": 0.0145, "step": 131420 }, { - "epoch": 1.42, - "learning_rate": 8.687487838100797e-05, - "loss": 0.0128, + "epoch": 0.66, + "learning_rate": 0.0002005378107168623, + "loss": 0.0137, "step": 131430 }, { - "epoch": 1.42, - "learning_rate": 8.685866251540506e-05, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020053024302384828, + "loss": 0.0124, "step": 131440 }, { - "epoch": 1.42, - "learning_rate": 8.684244664980217e-05, - "loss": 0.0074, + "epoch": 0.66, + "learning_rate": 0.0002005226753308343, + "loss": 0.0152, "step": 131450 }, { - "epoch": 1.42, - "learning_rate": 8.682623078419924e-05, - "loss": 0.0088, + "epoch": 0.66, + "learning_rate": 0.00020051510763782027, + "loss": 0.0126, "step": 131460 }, { - "epoch": 1.42, - "learning_rate": 8.681001491859635e-05, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020050753994480626, + "loss": 0.0145, "step": 131470 }, { - "epoch": 1.42, - "learning_rate": 8.679379905299343e-05, - "loss": 0.0074, + "epoch": 0.66, + "learning_rate": 0.00020049997225179226, + "loss": 0.0155, "step": 131480 }, { - "epoch": 1.42, - "learning_rate": 8.677758318739054e-05, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020049240455877825, + "loss": 0.0133, "step": 131490 }, { - "epoch": 1.42, - "learning_rate": 8.676136732178763e-05, - "loss": 0.0096, + "epoch": 0.66, + "learning_rate": 0.00020048483686576423, + "loss": 0.0112, "step": 131500 }, { - "epoch": 1.42, - "learning_rate": 8.674515145618472e-05, - "loss": 0.0075, + "epoch": 0.66, + "learning_rate": 0.0002004772691727502, + "loss": 0.0174, "step": 131510 }, { - "epoch": 1.42, - "learning_rate": 8.672893559058181e-05, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.00020046970147973622, + "loss": 0.0156, "step": 131520 }, { - "epoch": 1.42, - "learning_rate": 8.671271972497891e-05, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.0002004621337867222, + "loss": 0.0137, "step": 131530 }, { - "epoch": 1.42, - "learning_rate": 8.6696503859376e-05, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020045456609370818, + "loss": 0.0124, "step": 131540 }, { - "epoch": 1.42, - "learning_rate": 8.66802879937731e-05, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.0002004469984006942, + "loss": 0.0122, "step": 131550 }, { - "epoch": 1.42, - "learning_rate": 8.666407212817019e-05, - "loss": 0.0101, + "epoch": 0.66, + "learning_rate": 0.00020043943070768017, + "loss": 0.0114, "step": 131560 }, { - "epoch": 1.42, - "learning_rate": 8.664785626256729e-05, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020043186301466615, + "loss": 0.01, "step": 131570 }, { - "epoch": 1.42, - "learning_rate": 8.663164039696437e-05, - "loss": 0.0062, + "epoch": 0.66, + "learning_rate": 0.00020042429532165216, + "loss": 0.0125, "step": 131580 }, { - "epoch": 1.42, - "learning_rate": 8.661542453136148e-05, - "loss": 0.0088, + "epoch": 0.66, + "learning_rate": 0.00020041672762863814, + "loss": 0.0138, "step": 131590 }, { - "epoch": 1.42, - "learning_rate": 8.659920866575856e-05, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.00020040915993562412, + "loss": 0.0148, "step": 131600 }, { - "epoch": 1.42, - "learning_rate": 8.658299280015566e-05, - "loss": 0.0067, + "epoch": 0.66, + "learning_rate": 0.00020040159224261013, + "loss": 0.0111, "step": 131610 }, { - "epoch": 1.42, - "learning_rate": 8.656677693455276e-05, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.0002003940245495961, + "loss": 0.0117, "step": 131620 }, { - "epoch": 1.42, - "learning_rate": 8.655056106894985e-05, - "loss": 0.0075, + "epoch": 0.66, + "learning_rate": 0.0002003864568565821, + "loss": 0.0124, "step": 131630 }, { - "epoch": 1.42, - "learning_rate": 8.653434520334695e-05, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.0002003788891635681, + "loss": 0.0105, "step": 131640 }, { - "epoch": 1.42, - "learning_rate": 8.651812933774405e-05, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020037132147055408, + "loss": 0.0123, "step": 131650 }, { - "epoch": 1.42, - "learning_rate": 8.650191347214114e-05, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020036375377754007, + "loss": 0.0117, "step": 131660 }, { - "epoch": 1.42, - "learning_rate": 8.648569760653823e-05, - "loss": 0.0067, + "epoch": 0.66, + "learning_rate": 0.00020035618608452605, + "loss": 0.0142, "step": 131670 }, { - "epoch": 1.42, - "learning_rate": 8.646948174093533e-05, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020034861839151206, + "loss": 0.0134, "step": 131680 }, { - "epoch": 1.42, - "learning_rate": 8.645326587533242e-05, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.00020034105069849804, + "loss": 0.0137, "step": 131690 }, { - "epoch": 1.42, - "learning_rate": 8.643705000972952e-05, - "loss": 0.0096, + "epoch": 0.66, + "learning_rate": 0.00020033348300548402, + "loss": 0.0121, "step": 131700 }, { - "epoch": 1.42, - "learning_rate": 8.64208341441266e-05, - "loss": 0.01, + "epoch": 0.66, + "learning_rate": 0.00020032591531247003, + "loss": 0.0112, "step": 131710 }, { - "epoch": 1.42, - "learning_rate": 8.640461827852371e-05, - "loss": 0.0068, + "epoch": 0.66, + "learning_rate": 0.000200318347619456, + "loss": 0.0125, "step": 131720 }, { - "epoch": 1.42, - "learning_rate": 8.638840241292079e-05, - "loss": 0.0114, + "epoch": 0.66, + "learning_rate": 0.000200310779926442, + "loss": 0.0124, "step": 131730 }, { - "epoch": 1.42, - "learning_rate": 8.63721865473179e-05, - "loss": 0.0067, + "epoch": 0.66, + "learning_rate": 0.000200303212233428, + "loss": 0.0193, "step": 131740 }, { - "epoch": 1.42, - "learning_rate": 8.635597068171497e-05, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020029564454041398, + "loss": 0.0135, "step": 131750 }, { - "epoch": 1.42, - "learning_rate": 8.633975481611208e-05, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020028807684739996, + "loss": 0.0144, "step": 131760 }, { - "epoch": 1.42, - "learning_rate": 8.632353895050917e-05, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020028050915438597, + "loss": 0.014, "step": 131770 }, { - "epoch": 1.42, - "learning_rate": 8.630732308490627e-05, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020027294146137195, + "loss": 0.0099, "step": 131780 }, { - "epoch": 1.42, - "learning_rate": 8.629110721930336e-05, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.00020026537376835793, + "loss": 0.0153, "step": 131790 }, { - "epoch": 1.42, - "learning_rate": 8.627489135370047e-05, - "loss": 0.0104, + "epoch": 0.66, + "learning_rate": 0.00020025780607534394, + "loss": 0.0137, "step": 131800 }, { - "epoch": 1.42, - "learning_rate": 8.625867548809754e-05, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020025023838232992, + "loss": 0.0179, "step": 131810 }, { - "epoch": 1.43, - "learning_rate": 8.624245962249465e-05, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.0002002426706893159, + "loss": 0.0137, "step": 131820 }, { - "epoch": 1.43, - "learning_rate": 8.622624375689173e-05, - "loss": 0.0107, + "epoch": 0.67, + "learning_rate": 0.00020023510299630189, + "loss": 0.0191, "step": 131830 }, { - "epoch": 1.43, - "learning_rate": 8.621002789128884e-05, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.0002002275353032879, + "loss": 0.0138, "step": 131840 }, { - "epoch": 1.43, - "learning_rate": 8.619381202568592e-05, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00020021996761027388, + "loss": 0.0135, "step": 131850 }, { - "epoch": 1.43, - "learning_rate": 8.617759616008302e-05, - "loss": 0.0098, + "epoch": 0.67, + "learning_rate": 0.00020021239991725986, + "loss": 0.0122, "step": 131860 }, { - "epoch": 1.43, - "learning_rate": 8.616138029448011e-05, - "loss": 0.0059, + "epoch": 0.67, + "learning_rate": 0.00020020483222424587, + "loss": 0.0146, "step": 131870 }, { - "epoch": 1.43, - "learning_rate": 8.614516442887721e-05, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00020019726453123185, + "loss": 0.0136, "step": 131880 }, { - "epoch": 1.43, - "learning_rate": 8.61289485632743e-05, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.00020018969683821783, + "loss": 0.013, "step": 131890 }, { - "epoch": 1.43, - "learning_rate": 8.611273269767139e-05, - "loss": 0.0068, + "epoch": 0.67, + "learning_rate": 0.00020018212914520384, + "loss": 0.0137, "step": 131900 }, { - "epoch": 1.43, - "learning_rate": 8.609651683206849e-05, - "loss": 0.01, + "epoch": 0.67, + "learning_rate": 0.00020017456145218982, + "loss": 0.0128, "step": 131910 }, { - "epoch": 1.43, - "learning_rate": 8.608030096646559e-05, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.0002001669937591758, + "loss": 0.013, "step": 131920 }, { - "epoch": 1.43, - "learning_rate": 8.606408510086267e-05, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.0002001594260661618, + "loss": 0.0138, "step": 131930 }, { - "epoch": 1.43, - "learning_rate": 8.604786923525978e-05, - "loss": 0.0095, + "epoch": 0.67, + "learning_rate": 0.0002001518583731478, + "loss": 0.0117, "step": 131940 }, { - "epoch": 1.43, - "learning_rate": 8.603165336965686e-05, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00020014429068013377, + "loss": 0.015, "step": 131950 }, { - "epoch": 1.43, - "learning_rate": 8.601543750405396e-05, - "loss": 0.0075, + "epoch": 0.67, + "learning_rate": 0.00020013672298711978, + "loss": 0.0124, "step": 131960 }, { - "epoch": 1.43, - "learning_rate": 8.599922163845106e-05, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00020012915529410576, + "loss": 0.0153, "step": 131970 }, { - "epoch": 1.43, - "learning_rate": 8.598300577284815e-05, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00020012158760109174, + "loss": 0.0134, "step": 131980 }, { - "epoch": 1.43, - "learning_rate": 8.596678990724524e-05, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00020011401990807775, + "loss": 0.0133, "step": 131990 }, { - "epoch": 1.43, - "learning_rate": 8.595057404164233e-05, - "loss": 0.0064, + "epoch": 0.67, + "learning_rate": 0.00020010645221506373, + "loss": 0.0141, "step": 132000 }, { - "epoch": 1.43, - "eval_cer": 0.9215443065682019, - "eval_loss": 0.0068144891411066055, - "eval_runtime": 121.5561, - "eval_samples_per_second": 16.453, - "eval_steps_per_second": 4.113, + "epoch": 0.67, + "eval_cer": 0.9144430848116509, + "eval_loss": 0.009661003015935421, + "eval_runtime": 116.7282, + "eval_samples_per_second": 17.134, + "eval_steps_per_second": 4.283, "step": 132000 }, { - "epoch": 1.43, - "learning_rate": 8.593435817603943e-05, - "loss": 0.0065, + "epoch": 0.67, + "learning_rate": 0.00020009888452204971, + "loss": 0.0143, "step": 132010 }, { - "epoch": 1.43, - "learning_rate": 8.591814231043653e-05, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.0002000913168290357, + "loss": 0.0144, "step": 132020 }, { - "epoch": 1.43, - "learning_rate": 8.590192644483361e-05, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.0002000837491360217, + "loss": 0.0149, "step": 132030 }, { - "epoch": 1.43, - "learning_rate": 8.588571057923072e-05, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00020007618144300769, + "loss": 0.0115, "step": 132040 }, { - "epoch": 1.43, - "learning_rate": 8.58694947136278e-05, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00020006861374999367, + "loss": 0.0116, "step": 132050 }, { - "epoch": 1.43, - "learning_rate": 8.58532788480249e-05, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00020006104605697968, + "loss": 0.0161, "step": 132060 }, { - "epoch": 1.43, - "learning_rate": 8.583706298242198e-05, - "loss": 0.0108, + "epoch": 0.67, + "learning_rate": 0.00020005347836396566, + "loss": 0.0162, "step": 132070 }, { - "epoch": 1.43, - "learning_rate": 8.582084711681909e-05, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00020004591067095164, + "loss": 0.0132, "step": 132080 }, { - "epoch": 1.43, - "learning_rate": 8.580463125121618e-05, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.00020003834297793765, + "loss": 0.0195, "step": 132090 }, { - "epoch": 1.43, - "learning_rate": 8.578841538561328e-05, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.00020003077528492363, + "loss": 0.0137, "step": 132100 }, { - "epoch": 1.43, - "learning_rate": 8.577219952001037e-05, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.0002000232075919096, + "loss": 0.0134, "step": 132110 }, { - "epoch": 1.43, - "learning_rate": 8.575598365440747e-05, - "loss": 0.0069, + "epoch": 0.67, + "learning_rate": 0.00020001563989889562, + "loss": 0.0159, "step": 132120 }, { - "epoch": 1.43, - "learning_rate": 8.573976778880455e-05, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.0002000080722058816, + "loss": 0.0092, "step": 132130 }, { - "epoch": 1.43, - "learning_rate": 8.572355192320166e-05, - "loss": 0.0064, + "epoch": 0.67, + "learning_rate": 0.00020000050451286758, + "loss": 0.0113, "step": 132140 }, { - "epoch": 1.43, - "learning_rate": 8.570733605759874e-05, - "loss": 0.01, + "epoch": 0.67, + "learning_rate": 0.0001999929368198536, + "loss": 0.0126, "step": 132150 }, { - "epoch": 1.43, - "learning_rate": 8.569112019199585e-05, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019998536912683957, + "loss": 0.014, "step": 132160 }, { - "epoch": 1.43, - "learning_rate": 8.567490432639292e-05, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.00019997780143382555, + "loss": 0.0112, "step": 132170 }, { - "epoch": 1.43, - "learning_rate": 8.565868846079003e-05, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.00019997023374081153, + "loss": 0.0116, "step": 132180 }, { - "epoch": 1.43, - "learning_rate": 8.564247259518712e-05, - "loss": 0.01, + "epoch": 0.67, + "learning_rate": 0.00019996266604779754, + "loss": 0.0139, "step": 132190 }, { - "epoch": 1.43, - "learning_rate": 8.562625672958422e-05, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019995509835478352, + "loss": 0.0143, "step": 132200 }, { - "epoch": 1.43, - "learning_rate": 8.561004086398131e-05, - "loss": 0.0109, + "epoch": 0.67, + "learning_rate": 0.0001999475306617695, + "loss": 0.0152, "step": 132210 }, { - "epoch": 1.43, - "learning_rate": 8.55938249983784e-05, - "loss": 0.0095, + "epoch": 0.67, + "learning_rate": 0.00019993996296875551, + "loss": 0.0129, "step": 132220 }, { - "epoch": 1.43, - "learning_rate": 8.55776091327755e-05, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.0001999323952757415, + "loss": 0.0126, "step": 132230 }, { - "epoch": 1.43, - "learning_rate": 8.55613932671726e-05, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019992482758272748, + "loss": 0.0154, "step": 132240 }, { - "epoch": 1.43, - "learning_rate": 8.554517740156968e-05, - "loss": 0.0075, + "epoch": 0.67, + "learning_rate": 0.00019991725988971349, + "loss": 0.0118, "step": 132250 }, { - "epoch": 1.43, - "learning_rate": 8.552896153596679e-05, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019990969219669947, + "loss": 0.0154, "step": 132260 }, { - "epoch": 1.43, - "learning_rate": 8.551274567036387e-05, - "loss": 0.0111, + "epoch": 0.67, + "learning_rate": 0.00019990212450368545, + "loss": 0.0166, "step": 132270 }, { - "epoch": 1.43, - "learning_rate": 8.549652980476097e-05, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.00019989455681067146, + "loss": 0.0145, "step": 132280 }, { - "epoch": 1.43, - "learning_rate": 8.548031393915805e-05, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.00019988698911765744, + "loss": 0.011, "step": 132290 }, { - "epoch": 1.43, - "learning_rate": 8.546409807355516e-05, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.00019987942142464342, + "loss": 0.0157, "step": 132300 }, { - "epoch": 1.43, - "learning_rate": 8.544788220795225e-05, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00019987185373162943, + "loss": 0.015, "step": 132310 }, { - "epoch": 1.43, - "learning_rate": 8.543166634234934e-05, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.0001998642860386154, + "loss": 0.0122, "step": 132320 }, { - "epoch": 1.43, - "learning_rate": 8.541545047674644e-05, - "loss": 0.0112, + "epoch": 0.67, + "learning_rate": 0.0001998567183456014, + "loss": 0.0153, "step": 132330 }, { - "epoch": 1.43, - "learning_rate": 8.539923461114354e-05, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.00019984915065258737, + "loss": 0.0142, "step": 132340 }, { - "epoch": 1.43, - "learning_rate": 8.538301874554062e-05, - "loss": 0.0066, + "epoch": 0.67, + "learning_rate": 0.00019984158295957338, + "loss": 0.0143, "step": 132350 }, { - "epoch": 1.43, - "learning_rate": 8.536680287993773e-05, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.00019983401526655936, + "loss": 0.0134, "step": 132360 }, { - "epoch": 1.43, - "learning_rate": 8.535058701433482e-05, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.00019982644757354534, + "loss": 0.0192, "step": 132370 }, { - "epoch": 1.43, - "learning_rate": 8.533437114873191e-05, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.00019981887988053135, + "loss": 0.0155, "step": 132380 }, { - "epoch": 1.43, - "learning_rate": 8.531815528312902e-05, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00019981131218751733, + "loss": 0.0139, "step": 132390 }, { - "epoch": 1.43, - "learning_rate": 8.53019394175261e-05, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019980374449450332, + "loss": 0.0122, "step": 132400 }, { - "epoch": 1.43, - "learning_rate": 8.52857235519232e-05, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019979617680148932, + "loss": 0.0141, "step": 132410 }, { - "epoch": 1.43, - "learning_rate": 8.526950768632028e-05, - "loss": 0.0066, + "epoch": 0.67, + "learning_rate": 0.0001997886091084753, + "loss": 0.0137, "step": 132420 }, { - "epoch": 1.43, - "learning_rate": 8.525329182071739e-05, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.0001997810414154613, + "loss": 0.0144, "step": 132430 }, { - "epoch": 1.43, - "learning_rate": 8.523707595511447e-05, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.0001997734737224473, + "loss": 0.0115, "step": 132440 }, { - "epoch": 1.43, - "learning_rate": 8.522086008951158e-05, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00019976590602943328, + "loss": 0.0166, "step": 132450 }, { - "epoch": 1.43, - "learning_rate": 8.520464422390867e-05, - "loss": 0.0094, + "epoch": 0.67, + "learning_rate": 0.00019975833833641926, + "loss": 0.0139, "step": 132460 }, { - "epoch": 1.43, - "learning_rate": 8.518842835830576e-05, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019975077064340527, + "loss": 0.0301, "step": 132470 }, { - "epoch": 1.43, - "learning_rate": 8.517221249270285e-05, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.00019974320295039125, + "loss": 0.0163, "step": 132480 }, { - "epoch": 1.43, - "learning_rate": 8.515599662709996e-05, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.00019973563525737723, + "loss": 0.0141, "step": 132490 }, { - "epoch": 1.43, - "learning_rate": 8.513978076149704e-05, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019972806756436324, + "loss": 0.0141, "step": 132500 }, { - "epoch": 1.43, - "learning_rate": 8.512356489589415e-05, - "loss": 0.0093, + "epoch": 0.67, + "learning_rate": 0.00019972049987134922, + "loss": 0.0141, "step": 132510 }, { - "epoch": 1.43, - "learning_rate": 8.510734903029122e-05, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.0001997129321783352, + "loss": 0.0153, "step": 132520 }, { - "epoch": 1.43, - "learning_rate": 8.509113316468833e-05, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019970536448532118, + "loss": 0.012, "step": 132530 }, { - "epoch": 1.43, - "learning_rate": 8.507491729908541e-05, - "loss": 0.0111, + "epoch": 0.67, + "learning_rate": 0.0001996977967923072, + "loss": 0.0157, "step": 132540 }, { - "epoch": 1.43, - "learning_rate": 8.505870143348252e-05, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.00019969022909929317, + "loss": 0.0149, "step": 132550 }, { - "epoch": 1.43, - "learning_rate": 8.504248556787961e-05, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00019968266140627915, + "loss": 0.0137, "step": 132560 }, { - "epoch": 1.43, - "learning_rate": 8.50262697022767e-05, - "loss": 0.0093, + "epoch": 0.67, + "learning_rate": 0.00019967509371326516, + "loss": 0.0116, "step": 132570 }, { - "epoch": 1.43, - "learning_rate": 8.50100538366738e-05, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019966752602025114, + "loss": 0.0141, "step": 132580 }, { - "epoch": 1.43, - "learning_rate": 8.499383797107089e-05, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019965995832723713, + "loss": 0.0176, "step": 132590 }, { - "epoch": 1.43, - "learning_rate": 8.497762210546798e-05, - "loss": 0.0105, + "epoch": 0.67, + "learning_rate": 0.00019965239063422313, + "loss": 0.0151, "step": 132600 }, { - "epoch": 1.43, - "learning_rate": 8.496140623986509e-05, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.0001996448229412091, + "loss": 0.014, "step": 132610 }, { - "epoch": 1.43, - "learning_rate": 8.494519037426217e-05, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019963725524819507, + "loss": 0.025, "step": 132620 }, { - "epoch": 1.43, - "learning_rate": 8.492897450865927e-05, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019962968755518105, + "loss": 0.0155, "step": 132630 }, { - "epoch": 1.43, - "learning_rate": 8.491275864305635e-05, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00019962211986216706, + "loss": 0.0168, "step": 132640 }, { - "epoch": 1.43, - "learning_rate": 8.489654277745346e-05, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019961455216915304, + "loss": 0.0151, "step": 132650 }, { - "epoch": 1.43, - "learning_rate": 8.488032691185055e-05, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019960698447613902, + "loss": 0.0133, "step": 132660 }, { - "epoch": 1.43, - "learning_rate": 8.486411104624764e-05, - "loss": 0.0099, + "epoch": 0.67, + "learning_rate": 0.00019959941678312503, + "loss": 0.0117, "step": 132670 }, { - "epoch": 1.43, - "learning_rate": 8.484789518064474e-05, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.000199591849090111, + "loss": 0.0165, "step": 132680 }, { - "epoch": 1.43, - "learning_rate": 8.483167931504183e-05, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.000199584281397097, + "loss": 0.0162, "step": 132690 }, { - "epoch": 1.43, - "learning_rate": 8.481546344943892e-05, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.000199576713704083, + "loss": 0.011, "step": 132700 }, { - "epoch": 1.43, - "learning_rate": 8.479924758383603e-05, - "loss": 0.0093, + "epoch": 0.67, + "learning_rate": 0.00019956914601106898, + "loss": 0.0129, "step": 132710 }, { - "epoch": 1.43, - "learning_rate": 8.47830317182331e-05, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019956157831805497, + "loss": 0.0153, "step": 132720 }, { - "epoch": 1.43, - "learning_rate": 8.476681585263021e-05, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.00019955401062504095, + "loss": 0.0128, "step": 132730 }, { - "epoch": 1.43, - "learning_rate": 8.475059998702729e-05, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019954644293202696, + "loss": 0.012, "step": 132740 }, { - "epoch": 1.44, - "learning_rate": 8.47343841214244e-05, - "loss": 0.0104, + "epoch": 0.67, + "learning_rate": 0.00019953887523901294, + "loss": 0.0143, "step": 132750 }, { - "epoch": 1.44, - "learning_rate": 8.471816825582148e-05, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.00019953130754599892, + "loss": 0.0132, "step": 132760 }, { - "epoch": 1.44, - "learning_rate": 8.470195239021858e-05, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00019952373985298493, + "loss": 0.0135, "step": 132770 }, { - "epoch": 1.44, - "learning_rate": 8.468573652461568e-05, - "loss": 0.0094, + "epoch": 0.67, + "learning_rate": 0.0001995161721599709, + "loss": 0.0138, "step": 132780 }, { - "epoch": 1.44, - "learning_rate": 8.466952065901277e-05, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.0001995086044669569, + "loss": 0.0139, "step": 132790 }, { - "epoch": 1.44, - "learning_rate": 8.465330479340986e-05, - "loss": 0.0108, + "epoch": 0.67, + "learning_rate": 0.0001995010367739429, + "loss": 0.0161, "step": 132800 }, { - "epoch": 1.44, - "learning_rate": 8.463708892780697e-05, - "loss": 0.0093, + "epoch": 0.67, + "learning_rate": 0.00019949346908092888, + "loss": 0.0145, "step": 132810 }, { - "epoch": 1.44, - "learning_rate": 8.462087306220405e-05, - "loss": 0.0093, + "epoch": 0.67, + "learning_rate": 0.00019948590138791486, + "loss": 0.0119, "step": 132820 }, { - "epoch": 1.44, - "learning_rate": 8.460465719660115e-05, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.00019947833369490087, + "loss": 0.017, "step": 132830 }, { - "epoch": 1.44, - "learning_rate": 8.458844133099823e-05, - "loss": 0.0071, + "epoch": 0.67, + "learning_rate": 0.00019947076600188685, + "loss": 0.0116, "step": 132840 }, { - "epoch": 1.44, - "learning_rate": 8.457222546539534e-05, - "loss": 0.0105, + "epoch": 0.67, + "learning_rate": 0.00019946319830887283, + "loss": 0.0134, "step": 132850 }, { - "epoch": 1.44, - "learning_rate": 8.455600959979242e-05, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019945563061585884, + "loss": 0.0169, "step": 132860 }, { - "epoch": 1.44, - "learning_rate": 8.453979373418952e-05, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019944806292284482, + "loss": 0.0109, "step": 132870 }, { - "epoch": 1.44, - "learning_rate": 8.452357786858662e-05, - "loss": 0.0071, + "epoch": 0.67, + "learning_rate": 0.0001994404952298308, + "loss": 0.0142, "step": 132880 }, { - "epoch": 1.44, - "learning_rate": 8.450736200298371e-05, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.0001994329275368168, + "loss": 0.0132, "step": 132890 }, { - "epoch": 1.44, - "learning_rate": 8.44911461373808e-05, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.0001994253598438028, + "loss": 0.0153, "step": 132900 }, { - "epoch": 1.44, - "learning_rate": 8.44749302717779e-05, - "loss": 0.0102, + "epoch": 0.67, + "learning_rate": 0.00019941779215078878, + "loss": 0.0141, "step": 132910 }, { - "epoch": 1.44, - "learning_rate": 8.445871440617499e-05, - "loss": 0.0094, + "epoch": 0.67, + "learning_rate": 0.00019941022445777476, + "loss": 0.0148, "step": 132920 }, { - "epoch": 1.44, - "learning_rate": 8.44424985405721e-05, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.00019940265676476077, + "loss": 0.014, "step": 132930 }, { - "epoch": 1.44, - "learning_rate": 8.442628267496917e-05, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019939508907174675, + "loss": 0.0136, "step": 132940 }, { - "epoch": 1.44, - "learning_rate": 8.441006680936628e-05, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019938752137873273, + "loss": 0.0159, "step": 132950 }, { - "epoch": 1.44, - "learning_rate": 8.439385094376336e-05, - "loss": 0.01, + "epoch": 0.67, + "learning_rate": 0.00019937995368571874, + "loss": 0.0128, "step": 132960 }, { - "epoch": 1.44, - "learning_rate": 8.437763507816047e-05, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019937238599270472, + "loss": 0.0162, "step": 132970 }, { - "epoch": 1.44, - "learning_rate": 8.436141921255754e-05, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.0001993648182996907, + "loss": 0.0122, "step": 132980 }, { - "epoch": 1.44, - "learning_rate": 8.434520334695465e-05, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.0001993572506066767, + "loss": 0.0117, "step": 132990 }, { - "epoch": 1.44, - "learning_rate": 8.432898748135174e-05, - "loss": 0.0064, + "epoch": 0.67, + "learning_rate": 0.0001993496829136627, + "loss": 0.0126, "step": 133000 }, { - "epoch": 1.44, - "eval_cer": 0.9215364891415945, - "eval_loss": 0.006863737478852272, - "eval_runtime": 121.164, - "eval_samples_per_second": 16.507, - "eval_steps_per_second": 4.127, + "epoch": 0.67, + "eval_cer": 0.9144964565985481, + "eval_loss": 0.009822376072406769, + "eval_runtime": 116.6404, + "eval_samples_per_second": 17.147, + "eval_steps_per_second": 4.287, "step": 133000 }, { - "epoch": 1.44, - "learning_rate": 8.431277161574884e-05, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.00019934211522064867, + "loss": 0.0111, "step": 133010 }, { - "epoch": 1.44, - "learning_rate": 8.429655575014593e-05, - "loss": 0.0063, + "epoch": 0.67, + "learning_rate": 0.00019933454752763468, + "loss": 0.0119, "step": 133020 }, { - "epoch": 1.44, - "learning_rate": 8.428033988454304e-05, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019932697983462066, + "loss": 0.0162, "step": 133030 }, { - "epoch": 1.44, - "learning_rate": 8.426412401894011e-05, - "loss": 0.0064, + "epoch": 0.67, + "learning_rate": 0.00019931941214160664, + "loss": 0.0136, "step": 133040 }, { - "epoch": 1.44, - "learning_rate": 8.424790815333722e-05, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.00019931184444859265, + "loss": 0.0115, "step": 133050 }, { - "epoch": 1.44, - "learning_rate": 8.42316922877343e-05, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019930427675557863, + "loss": 0.0158, "step": 133060 }, { - "epoch": 1.44, - "learning_rate": 8.42154764221314e-05, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019929670906256462, + "loss": 0.014, "step": 133070 }, { - "epoch": 1.44, - "learning_rate": 8.419926055652851e-05, - "loss": 0.01, + "epoch": 0.67, + "learning_rate": 0.0001992891413695506, + "loss": 0.0145, "step": 133080 }, { - "epoch": 1.44, - "learning_rate": 8.418304469092559e-05, - "loss": 0.0095, + "epoch": 0.67, + "learning_rate": 0.0001992815736765366, + "loss": 0.0151, "step": 133090 }, { - "epoch": 1.44, - "learning_rate": 8.41668288253227e-05, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00019927400598352259, + "loss": 0.0139, "step": 133100 }, { - "epoch": 1.44, - "learning_rate": 8.415061295971978e-05, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.00019926643829050857, + "loss": 0.0117, "step": 133110 }, { - "epoch": 1.44, - "learning_rate": 8.413439709411688e-05, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.00019925887059749458, + "loss": 0.0152, "step": 133120 }, { - "epoch": 1.44, - "learning_rate": 8.411818122851398e-05, - "loss": 0.0102, + "epoch": 0.67, + "learning_rate": 0.00019925130290448056, + "loss": 0.0139, "step": 133130 }, { - "epoch": 1.44, - "learning_rate": 8.410196536291107e-05, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019924373521146654, + "loss": 0.0135, "step": 133140 }, { - "epoch": 1.44, - "learning_rate": 8.408574949730816e-05, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00019923616751845255, + "loss": 0.0137, "step": 133150 }, { - "epoch": 1.44, - "learning_rate": 8.406953363170525e-05, - "loss": 0.0063, + "epoch": 0.67, + "learning_rate": 0.00019922859982543853, + "loss": 0.0132, "step": 133160 }, { - "epoch": 1.44, - "learning_rate": 8.405331776610235e-05, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.0001992210321324245, + "loss": 0.0126, "step": 133170 }, { - "epoch": 1.44, - "learning_rate": 8.403710190049945e-05, - "loss": 0.0107, + "epoch": 0.67, + "learning_rate": 0.00019921346443941052, + "loss": 0.0132, "step": 133180 }, { - "epoch": 1.44, - "learning_rate": 8.402088603489653e-05, - "loss": 0.0109, + "epoch": 0.67, + "learning_rate": 0.0001992058967463965, + "loss": 0.0142, "step": 133190 }, { - "epoch": 1.44, - "learning_rate": 8.400467016929364e-05, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.00019919832905338248, + "loss": 0.0135, "step": 133200 }, { - "epoch": 1.44, - "learning_rate": 8.398845430369072e-05, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.0001991907613603685, + "loss": 0.012, "step": 133210 }, { - "epoch": 1.44, - "learning_rate": 8.397223843808782e-05, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019918319366735447, + "loss": 0.0154, "step": 133220 }, { - "epoch": 1.44, - "learning_rate": 8.39560225724849e-05, - "loss": 0.0098, + "epoch": 0.67, + "learning_rate": 0.00019917562597434045, + "loss": 0.0119, "step": 133230 }, { - "epoch": 1.44, - "learning_rate": 8.393980670688201e-05, - "loss": 0.0066, + "epoch": 0.67, + "learning_rate": 0.00019916805828132644, + "loss": 0.0132, "step": 133240 }, { - "epoch": 1.44, - "learning_rate": 8.39235908412791e-05, - "loss": 0.0063, + "epoch": 0.67, + "learning_rate": 0.00019916049058831244, + "loss": 0.0139, "step": 133250 }, { - "epoch": 1.44, - "learning_rate": 8.39073749756762e-05, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00019915292289529843, + "loss": 0.016, "step": 133260 }, { - "epoch": 1.44, - "learning_rate": 8.389115911007329e-05, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.0001991453552022844, + "loss": 0.0159, "step": 133270 }, { - "epoch": 1.44, - "learning_rate": 8.38749432444704e-05, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00019913778750927042, + "loss": 0.017, "step": 133280 }, { - "epoch": 1.44, - "learning_rate": 8.385872737886747e-05, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.0001991302198162564, + "loss": 0.0142, "step": 133290 }, { - "epoch": 1.44, - "learning_rate": 8.384251151326458e-05, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.00019912265212324238, + "loss": 0.0113, "step": 133300 }, { - "epoch": 1.44, - "learning_rate": 8.382629564766166e-05, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.0001991150844302284, + "loss": 0.0138, "step": 133310 }, { - "epoch": 1.44, - "learning_rate": 8.381007978205877e-05, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.00019910751673721437, + "loss": 0.0151, "step": 133320 }, { - "epoch": 1.44, - "learning_rate": 8.379386391645585e-05, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.00019909994904420035, + "loss": 0.0111, "step": 133330 }, { - "epoch": 1.44, - "learning_rate": 8.377764805085295e-05, - "loss": 0.0079, + "epoch": 0.67, + "learning_rate": 0.00019909238135118636, + "loss": 0.0135, "step": 133340 }, { - "epoch": 1.44, - "learning_rate": 8.376143218525004e-05, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00019908481365817234, + "loss": 0.0143, "step": 133350 }, { - "epoch": 1.44, - "learning_rate": 8.374521631964714e-05, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.00019907724596515832, + "loss": 0.0141, "step": 133360 }, { - "epoch": 1.44, - "learning_rate": 8.372900045404423e-05, - "loss": 0.0065, + "epoch": 0.67, + "learning_rate": 0.00019906967827214433, + "loss": 0.0137, "step": 133370 }, { - "epoch": 1.44, - "learning_rate": 8.371278458844132e-05, - "loss": 0.0094, + "epoch": 0.67, + "learning_rate": 0.0001990621105791303, + "loss": 0.0222, "step": 133380 }, { - "epoch": 1.44, - "learning_rate": 8.369656872283842e-05, - "loss": 0.0103, + "epoch": 0.67, + "learning_rate": 0.0001990545428861163, + "loss": 0.0161, "step": 133390 }, { - "epoch": 1.44, - "learning_rate": 8.368035285723552e-05, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.00019904697519310227, + "loss": 0.0142, "step": 133400 }, { - "epoch": 1.44, - "learning_rate": 8.36641369916326e-05, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019903940750008828, + "loss": 0.0174, "step": 133410 }, { - "epoch": 1.44, - "learning_rate": 8.364792112602971e-05, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00019903183980707426, + "loss": 0.0133, "step": 133420 }, { - "epoch": 1.44, - "learning_rate": 8.363170526042679e-05, - "loss": 0.0095, + "epoch": 0.67, + "learning_rate": 0.00019902427211406025, + "loss": 0.0131, "step": 133430 }, { - "epoch": 1.44, - "learning_rate": 8.361548939482389e-05, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019901670442104625, + "loss": 0.0162, "step": 133440 }, { - "epoch": 1.44, - "learning_rate": 8.359927352922097e-05, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.00019900913672803224, + "loss": 0.0132, "step": 133450 }, { - "epoch": 1.44, - "learning_rate": 8.358305766361808e-05, - "loss": 0.0107, + "epoch": 0.67, + "learning_rate": 0.00019900156903501822, + "loss": 0.014, "step": 133460 }, { - "epoch": 1.44, - "learning_rate": 8.356684179801517e-05, - "loss": 0.0108, + "epoch": 0.67, + "learning_rate": 0.00019899400134200423, + "loss": 0.0126, "step": 133470 }, { - "epoch": 1.44, - "learning_rate": 8.355062593241226e-05, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.0001989864336489902, + "loss": 0.0117, "step": 133480 }, { - "epoch": 1.44, - "learning_rate": 8.353441006680936e-05, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.0001989788659559762, + "loss": 0.0151, "step": 133490 }, { - "epoch": 1.44, - "learning_rate": 8.351819420120646e-05, - "loss": 0.0068, + "epoch": 0.67, + "learning_rate": 0.0001989712982629622, + "loss": 0.0167, "step": 133500 }, { - "epoch": 1.44, - "learning_rate": 8.350197833560354e-05, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019896373056994818, + "loss": 0.0134, "step": 133510 }, { - "epoch": 1.44, - "learning_rate": 8.348576247000065e-05, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00019895616287693416, + "loss": 0.0131, "step": 133520 }, { - "epoch": 1.44, - "learning_rate": 8.346954660439773e-05, - "loss": 0.0099, + "epoch": 0.67, + "learning_rate": 0.00019894859518392017, + "loss": 0.0181, "step": 133530 }, { - "epoch": 1.44, - "learning_rate": 8.345333073879483e-05, - "loss": 0.0102, + "epoch": 0.67, + "learning_rate": 0.00019894102749090615, + "loss": 0.0124, "step": 133540 }, { - "epoch": 1.44, - "learning_rate": 8.343711487319191e-05, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.00019893345979789213, + "loss": 0.0133, "step": 133550 }, { - "epoch": 1.44, - "learning_rate": 8.342089900758902e-05, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00019892589210487814, + "loss": 0.0145, "step": 133560 }, { - "epoch": 1.44, - "learning_rate": 8.340468314198611e-05, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019891832441186412, + "loss": 0.0111, "step": 133570 }, { - "epoch": 1.44, - "learning_rate": 8.33884672763832e-05, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.0001989107567188501, + "loss": 0.0136, "step": 133580 }, { - "epoch": 1.44, - "learning_rate": 8.33722514107803e-05, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019890318902583608, + "loss": 0.0133, "step": 133590 }, { - "epoch": 1.44, - "learning_rate": 8.335603554517739e-05, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.0001988956213328221, + "loss": 0.0127, "step": 133600 }, { - "epoch": 1.44, - "learning_rate": 8.333981967957448e-05, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00019888805363980807, + "loss": 0.0153, "step": 133610 }, { - "epoch": 1.44, - "learning_rate": 8.332360381397159e-05, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019888048594679406, + "loss": 0.0156, "step": 133620 }, { - "epoch": 1.44, - "learning_rate": 8.330738794836867e-05, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00019887291825378006, + "loss": 0.0149, "step": 133630 }, { - "epoch": 1.44, - "learning_rate": 8.329117208276577e-05, - "loss": 0.0105, + "epoch": 0.67, + "learning_rate": 0.00019886535056076605, + "loss": 0.0124, "step": 133640 }, { - "epoch": 1.44, - "learning_rate": 8.327495621716285e-05, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00019885778286775203, + "loss": 0.0134, "step": 133650 }, { - "epoch": 1.44, - "learning_rate": 8.325874035155996e-05, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.00019885021517473804, + "loss": 0.0127, "step": 133660 }, { - "epoch": 1.45, - "learning_rate": 8.324252448595705e-05, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.00019884264748172402, + "loss": 0.0143, "step": 133670 }, { - "epoch": 1.45, - "learning_rate": 8.322630862035415e-05, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019883507978871, + "loss": 0.0136, "step": 133680 }, { - "epoch": 1.45, - "learning_rate": 8.321009275475124e-05, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.000198827512095696, + "loss": 0.017, "step": 133690 }, { - "epoch": 1.45, - "learning_rate": 8.319387688914833e-05, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.000198819944402682, + "loss": 0.0152, "step": 133700 }, { - "epoch": 1.45, - "learning_rate": 8.317766102354542e-05, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.00019881237670966797, + "loss": 0.0143, "step": 133710 }, { - "epoch": 1.45, - "learning_rate": 8.316144515794253e-05, - "loss": 0.0094, + "epoch": 0.67, + "learning_rate": 0.00019880480901665398, + "loss": 0.0131, "step": 133720 }, { - "epoch": 1.45, - "learning_rate": 8.314522929233961e-05, - "loss": 0.0064, + "epoch": 0.67, + "learning_rate": 0.00019879724132363996, + "loss": 0.0134, "step": 133730 }, { - "epoch": 1.45, - "learning_rate": 8.312901342673672e-05, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.00019878967363062594, + "loss": 0.0125, "step": 133740 }, { - "epoch": 1.45, - "learning_rate": 8.31127975611338e-05, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019878210593761192, + "loss": 0.0173, "step": 133750 }, { - "epoch": 1.45, - "learning_rate": 8.30965816955309e-05, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00019877453824459793, + "loss": 0.0147, "step": 133760 }, { - "epoch": 1.45, - "learning_rate": 8.308036582992798e-05, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.0001987669705515839, + "loss": 0.0143, "step": 133770 }, { - "epoch": 1.45, - "learning_rate": 8.306414996432509e-05, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.0001987594028585699, + "loss": 0.0199, "step": 133780 }, { - "epoch": 1.45, - "learning_rate": 8.304793409872219e-05, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.0001987518351655559, + "loss": 0.0149, "step": 133790 }, { - "epoch": 1.45, - "learning_rate": 8.303171823311927e-05, - "loss": 0.0071, + "epoch": 0.68, + "learning_rate": 0.00019874426747254188, + "loss": 0.0138, "step": 133800 }, { - "epoch": 1.45, - "learning_rate": 8.301550236751638e-05, - "loss": 0.007, + "epoch": 0.68, + "learning_rate": 0.00019873669977952787, + "loss": 0.0168, "step": 133810 }, { - "epoch": 1.45, - "learning_rate": 8.299928650191347e-05, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019872913208651387, + "loss": 0.0164, "step": 133820 }, { - "epoch": 1.45, - "learning_rate": 8.298307063631056e-05, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.00019872156439349986, + "loss": 0.0147, "step": 133830 }, { - "epoch": 1.45, - "learning_rate": 8.296685477070766e-05, - "loss": 0.0111, + "epoch": 0.68, + "learning_rate": 0.00019871399670048584, + "loss": 0.0139, "step": 133840 }, { - "epoch": 1.45, - "learning_rate": 8.295063890510475e-05, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.00019870642900747185, + "loss": 0.0138, "step": 133850 }, { - "epoch": 1.45, - "learning_rate": 8.293442303950184e-05, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.0001986988613144578, + "loss": 0.0147, "step": 133860 }, { - "epoch": 1.45, - "learning_rate": 8.291820717389895e-05, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.00019869129362144378, + "loss": 0.0134, "step": 133870 }, { - "epoch": 1.45, - "learning_rate": 8.290199130829603e-05, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.00019868372592842976, + "loss": 0.0165, "step": 133880 }, { - "epoch": 1.45, - "learning_rate": 8.288577544269313e-05, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.00019867615823541577, + "loss": 0.0134, "step": 133890 }, { - "epoch": 1.45, - "learning_rate": 8.286955957709021e-05, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019866859054240175, + "loss": 0.0158, "step": 133900 }, { - "epoch": 1.45, - "learning_rate": 8.285334371148732e-05, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.00019866102284938773, + "loss": 0.0148, "step": 133910 }, { - "epoch": 1.45, - "learning_rate": 8.28371278458844e-05, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019865345515637374, + "loss": 0.0147, "step": 133920 }, { - "epoch": 1.45, - "learning_rate": 8.28209119802815e-05, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019864588746335972, + "loss": 0.0124, "step": 133930 }, { - "epoch": 1.45, - "learning_rate": 8.28046961146786e-05, - "loss": 0.0095, + "epoch": 0.68, + "learning_rate": 0.0001986383197703457, + "loss": 0.014, "step": 133940 }, { - "epoch": 1.45, - "learning_rate": 8.278848024907569e-05, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.00019863075207733171, + "loss": 0.0327, "step": 133950 }, { - "epoch": 1.45, - "learning_rate": 8.277226438347278e-05, - "loss": 0.0071, + "epoch": 0.68, + "learning_rate": 0.0001986231843843177, + "loss": 0.0124, "step": 133960 }, { - "epoch": 1.45, - "learning_rate": 8.275604851786989e-05, - "loss": 0.006, + "epoch": 0.68, + "learning_rate": 0.00019861561669130368, + "loss": 0.0166, "step": 133970 }, { - "epoch": 1.45, - "learning_rate": 8.273983265226697e-05, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.00019860804899828966, + "loss": 0.0152, "step": 133980 }, { - "epoch": 1.45, - "learning_rate": 8.272361678666407e-05, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.00019860048130527567, + "loss": 0.0125, "step": 133990 }, { - "epoch": 1.45, - "learning_rate": 8.270740092106115e-05, - "loss": 0.0139, + "epoch": 0.68, + "learning_rate": 0.00019859291361226165, + "loss": 0.0116, "step": 134000 }, { - "epoch": 1.45, - "eval_cer": 0.9215547298036784, - "eval_loss": 0.00670721335336566, - "eval_runtime": 121.1717, - "eval_samples_per_second": 16.506, - "eval_steps_per_second": 4.126, + "epoch": 0.68, + "eval_cer": 0.9144634631302844, + "eval_loss": 0.009661918506026268, + "eval_runtime": 116.6673, + "eval_samples_per_second": 17.143, + "eval_steps_per_second": 4.286, "step": 134000 }, { - "epoch": 1.45, - "learning_rate": 8.269118505545826e-05, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.00019858534591924763, + "loss": 0.0112, "step": 134010 }, { - "epoch": 1.45, - "learning_rate": 8.267496918985534e-05, - "loss": 0.0101, + "epoch": 0.68, + "learning_rate": 0.00019857777822623364, + "loss": 0.0165, "step": 134020 }, { - "epoch": 1.45, - "learning_rate": 8.265875332425245e-05, - "loss": 0.0113, + "epoch": 0.68, + "learning_rate": 0.00019857021053321962, + "loss": 0.0158, "step": 134030 }, { - "epoch": 1.45, - "learning_rate": 8.264253745864954e-05, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.0001985626428402056, + "loss": 0.014, "step": 134040 }, { - "epoch": 1.45, - "learning_rate": 8.262632159304663e-05, - "loss": 0.0094, + "epoch": 0.68, + "learning_rate": 0.0001985550751471916, + "loss": 0.0279, "step": 134050 }, { - "epoch": 1.45, - "learning_rate": 8.261010572744372e-05, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.0001985475074541776, + "loss": 0.0158, "step": 134060 }, { - "epoch": 1.45, - "learning_rate": 8.259388986184082e-05, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.00019853993976116357, + "loss": 0.0154, "step": 134070 }, { - "epoch": 1.45, - "learning_rate": 8.257767399623791e-05, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019853237206814958, + "loss": 0.0199, "step": 134080 }, { - "epoch": 1.45, - "learning_rate": 8.256145813063502e-05, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019852480437513556, + "loss": 0.014, "step": 134090 }, { - "epoch": 1.45, - "learning_rate": 8.25452422650321e-05, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019851723668212154, + "loss": 0.0144, "step": 134100 }, { - "epoch": 1.45, - "learning_rate": 8.25290263994292e-05, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019850966898910755, + "loss": 0.0148, "step": 134110 }, { - "epoch": 1.45, - "learning_rate": 8.251281053382628e-05, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019850210129609353, + "loss": 0.0191, "step": 134120 }, { - "epoch": 1.45, - "learning_rate": 8.249659466822339e-05, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.00019849453360307952, + "loss": 0.0129, "step": 134130 }, { - "epoch": 1.45, - "learning_rate": 8.248037880262048e-05, - "loss": 0.0065, + "epoch": 0.68, + "learning_rate": 0.0001984869659100655, + "loss": 0.0112, "step": 134140 }, { - "epoch": 1.45, - "learning_rate": 8.246416293701757e-05, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.0001984793982170515, + "loss": 0.0142, "step": 134150 }, { - "epoch": 1.45, - "learning_rate": 8.244794707141466e-05, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.0001984718305240375, + "loss": 0.0197, "step": 134160 }, { - "epoch": 1.45, - "learning_rate": 8.243173120581176e-05, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.00019846426283102347, + "loss": 0.0161, "step": 134170 }, { - "epoch": 1.45, - "learning_rate": 8.241551534020885e-05, - "loss": 0.0101, + "epoch": 0.68, + "learning_rate": 0.00019845669513800948, + "loss": 0.0147, "step": 134180 }, { - "epoch": 1.45, - "learning_rate": 8.239929947460596e-05, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019844912744499546, + "loss": 0.0188, "step": 134190 }, { - "epoch": 1.45, - "learning_rate": 8.238308360900304e-05, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.00019844155975198144, + "loss": 0.014, "step": 134200 }, { - "epoch": 1.45, - "learning_rate": 8.236686774340014e-05, - "loss": 0.0096, + "epoch": 0.68, + "learning_rate": 0.00019843399205896745, + "loss": 0.0116, "step": 134210 }, { - "epoch": 1.45, - "learning_rate": 8.235065187779722e-05, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.00019842642436595343, + "loss": 0.0155, "step": 134220 }, { - "epoch": 1.45, - "learning_rate": 8.233443601219433e-05, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.0001984188566729394, + "loss": 0.0154, "step": 134230 }, { - "epoch": 1.45, - "learning_rate": 8.23182201465914e-05, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.00019841128897992542, + "loss": 0.0153, "step": 134240 }, { - "epoch": 1.45, - "learning_rate": 8.230200428098851e-05, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.0001984037212869114, + "loss": 0.0159, "step": 134250 }, { - "epoch": 1.45, - "learning_rate": 8.22857884153856e-05, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.00019839615359389738, + "loss": 0.0147, "step": 134260 }, { - "epoch": 1.45, - "learning_rate": 8.22695725497827e-05, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.0001983885859008834, + "loss": 0.0141, "step": 134270 }, { - "epoch": 1.45, - "learning_rate": 8.225335668417979e-05, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019838101820786937, + "loss": 0.0137, "step": 134280 }, { - "epoch": 1.45, - "learning_rate": 8.22371408185769e-05, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019837345051485535, + "loss": 0.014, "step": 134290 }, { - "epoch": 1.45, - "learning_rate": 8.222092495297398e-05, - "loss": 0.0106, + "epoch": 0.68, + "learning_rate": 0.00019836588282184134, + "loss": 0.0135, "step": 134300 }, { - "epoch": 1.45, - "learning_rate": 8.220470908737108e-05, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.00019835831512882734, + "loss": 0.0129, "step": 134310 }, { - "epoch": 1.45, - "learning_rate": 8.218849322176816e-05, - "loss": 0.0106, + "epoch": 0.68, + "learning_rate": 0.00019835074743581333, + "loss": 0.016, "step": 134320 }, { - "epoch": 1.45, - "learning_rate": 8.217227735616527e-05, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.0001983431797427993, + "loss": 0.0169, "step": 134330 }, { - "epoch": 1.45, - "learning_rate": 8.215606149056235e-05, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.00019833561204978532, + "loss": 0.0161, "step": 134340 }, { - "epoch": 1.45, - "learning_rate": 8.213984562495945e-05, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.0001983280443567713, + "loss": 0.0122, "step": 134350 }, { - "epoch": 1.45, - "learning_rate": 8.212362975935655e-05, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019832047666375728, + "loss": 0.0151, "step": 134360 }, { - "epoch": 1.45, - "learning_rate": 8.210741389375364e-05, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.0001983129089707433, + "loss": 0.0157, "step": 134370 }, { - "epoch": 1.45, - "learning_rate": 8.209119802815073e-05, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.00019830534127772927, + "loss": 0.0123, "step": 134380 }, { - "epoch": 1.45, - "learning_rate": 8.207498216254783e-05, - "loss": 0.0106, + "epoch": 0.68, + "learning_rate": 0.00019829777358471525, + "loss": 0.0123, "step": 134390 }, { - "epoch": 1.45, - "learning_rate": 8.205876629694492e-05, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.00019829020589170126, + "loss": 0.0128, "step": 134400 }, { - "epoch": 1.45, - "learning_rate": 8.204255043134202e-05, - "loss": 0.0095, + "epoch": 0.68, + "learning_rate": 0.00019828263819868724, + "loss": 0.015, "step": 134410 }, { - "epoch": 1.45, - "learning_rate": 8.20263345657391e-05, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019827507050567322, + "loss": 0.0152, "step": 134420 }, { - "epoch": 1.45, - "learning_rate": 8.201011870013621e-05, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019826750281265923, + "loss": 0.0142, "step": 134430 }, { - "epoch": 1.45, - "learning_rate": 8.199390283453329e-05, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.0001982599351196452, + "loss": 0.0155, "step": 134440 }, { - "epoch": 1.45, - "learning_rate": 8.19776869689304e-05, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.0001982523674266312, + "loss": 0.0137, "step": 134450 }, { - "epoch": 1.45, - "learning_rate": 8.196147110332747e-05, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.0001982447997336172, + "loss": 0.0117, "step": 134460 }, { - "epoch": 1.45, - "learning_rate": 8.194525523772458e-05, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019823723204060318, + "loss": 0.0139, "step": 134470 }, { - "epoch": 1.45, - "learning_rate": 8.192903937212167e-05, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019822966434758916, + "loss": 0.0139, "step": 134480 }, { - "epoch": 1.45, - "learning_rate": 8.191282350651877e-05, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.00019822209665457515, + "loss": 0.0126, "step": 134490 }, { - "epoch": 1.45, - "learning_rate": 8.189660764091586e-05, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.00019821452896156115, + "loss": 0.0156, "step": 134500 }, { - "epoch": 1.45, - "learning_rate": 8.188039177531297e-05, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019820696126854714, + "loss": 0.0141, "step": 134510 }, { - "epoch": 1.45, - "learning_rate": 8.186417590971006e-05, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019819939357553312, + "loss": 0.0152, "step": 134520 }, { - "epoch": 1.45, - "learning_rate": 8.184796004410715e-05, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019819182588251913, + "loss": 0.0165, "step": 134530 }, { - "epoch": 1.45, - "learning_rate": 8.183174417850424e-05, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.0001981842581895051, + "loss": 0.0133, "step": 134540 }, { - "epoch": 1.45, - "learning_rate": 8.181552831290134e-05, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.0001981766904964911, + "loss": 0.0151, "step": 134550 }, { - "epoch": 1.45, - "learning_rate": 8.179931244729844e-05, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.0001981691228034771, + "loss": 0.0169, "step": 134560 }, { - "epoch": 1.45, - "learning_rate": 8.178309658169552e-05, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019816155511046308, + "loss": 0.014, "step": 134570 }, { - "epoch": 1.45, - "learning_rate": 8.176688071609263e-05, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019815398741744906, + "loss": 0.0189, "step": 134580 }, { - "epoch": 1.45, - "learning_rate": 8.175066485048971e-05, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.00019814641972443507, + "loss": 0.0148, "step": 134590 }, { - "epoch": 1.46, - "learning_rate": 8.173444898488681e-05, - "loss": 0.0104, + "epoch": 0.68, + "learning_rate": 0.00019813885203142105, + "loss": 0.0132, "step": 134600 }, { - "epoch": 1.46, - "learning_rate": 8.171823311928389e-05, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019813128433840703, + "loss": 0.0138, "step": 134610 }, { - "epoch": 1.46, - "learning_rate": 8.1702017253681e-05, - "loss": 0.0096, + "epoch": 0.68, + "learning_rate": 0.00019812371664539304, + "loss": 0.0141, "step": 134620 }, { - "epoch": 1.46, - "learning_rate": 8.168580138807809e-05, - "loss": 0.0065, + "epoch": 0.68, + "learning_rate": 0.00019811614895237902, + "loss": 0.0151, "step": 134630 }, { - "epoch": 1.46, - "learning_rate": 8.166958552247518e-05, - "loss": 0.0104, + "epoch": 0.68, + "learning_rate": 0.000198108581259365, + "loss": 0.0166, "step": 134640 }, { - "epoch": 1.46, - "learning_rate": 8.165336965687228e-05, - "loss": 0.0202, + "epoch": 0.68, + "learning_rate": 0.00019810101356635098, + "loss": 0.0142, "step": 134650 }, { - "epoch": 1.46, - "learning_rate": 8.163715379126938e-05, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.000198093445873337, + "loss": 0.0141, "step": 134660 }, { - "epoch": 1.46, - "learning_rate": 8.162093792566646e-05, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019808587818032297, + "loss": 0.0137, "step": 134670 }, { - "epoch": 1.46, - "learning_rate": 8.160472206006357e-05, - "loss": 0.0097, + "epoch": 0.68, + "learning_rate": 0.00019807831048730896, + "loss": 0.0123, "step": 134680 }, { - "epoch": 1.46, - "learning_rate": 8.158850619446065e-05, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.00019807074279429496, + "loss": 0.0149, "step": 134690 }, { - "epoch": 1.46, - "learning_rate": 8.157229032885775e-05, - "loss": 0.0099, + "epoch": 0.68, + "learning_rate": 0.00019806317510128095, + "loss": 0.0125, "step": 134700 }, { - "epoch": 1.46, - "learning_rate": 8.155607446325483e-05, - "loss": 0.0063, + "epoch": 0.68, + "learning_rate": 0.00019805560740826693, + "loss": 0.0145, "step": 134710 }, { - "epoch": 1.46, - "learning_rate": 8.153985859765194e-05, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019804803971525294, + "loss": 0.0112, "step": 134720 }, { - "epoch": 1.46, - "learning_rate": 8.152364273204903e-05, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.00019804047202223892, + "loss": 0.014, "step": 134730 }, { - "epoch": 1.46, - "learning_rate": 8.150742686644613e-05, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.0001980329043292249, + "loss": 0.0117, "step": 134740 }, { - "epoch": 1.46, - "learning_rate": 8.149121100084322e-05, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.0001980253366362109, + "loss": 0.0125, "step": 134750 }, { - "epoch": 1.46, - "learning_rate": 8.147499513524031e-05, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.0001980177689431969, + "loss": 0.0136, "step": 134760 }, { - "epoch": 1.46, - "learning_rate": 8.14587792696374e-05, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019801020125018287, + "loss": 0.0134, "step": 134770 }, { - "epoch": 1.46, - "learning_rate": 8.144256340403451e-05, - "loss": 0.0088, + "epoch": 0.68, + "learning_rate": 0.00019800263355716888, + "loss": 0.013, "step": 134780 }, { - "epoch": 1.46, - "learning_rate": 8.142634753843159e-05, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019799506586415486, + "loss": 0.0126, "step": 134790 }, { - "epoch": 1.46, - "learning_rate": 8.14101316728287e-05, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019798749817114084, + "loss": 0.0148, "step": 134800 }, { - "epoch": 1.46, - "learning_rate": 8.139391580722577e-05, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019797993047812682, + "loss": 0.014, "step": 134810 }, { - "epoch": 1.46, - "learning_rate": 8.137769994162288e-05, - "loss": 0.0095, + "epoch": 0.68, + "learning_rate": 0.00019797236278511283, + "loss": 0.0144, "step": 134820 }, { - "epoch": 1.46, - "learning_rate": 8.136148407601997e-05, - "loss": 0.0071, + "epoch": 0.68, + "learning_rate": 0.0001979647950920988, + "loss": 0.0155, "step": 134830 }, { - "epoch": 1.46, - "learning_rate": 8.134526821041707e-05, - "loss": 0.0058, + "epoch": 0.68, + "learning_rate": 0.0001979572273990848, + "loss": 0.0149, "step": 134840 }, { - "epoch": 1.46, - "learning_rate": 8.132905234481416e-05, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.0001979496597060708, + "loss": 0.0176, "step": 134850 }, { - "epoch": 1.46, - "learning_rate": 8.131283647921125e-05, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.00019794209201305678, + "loss": 0.0131, "step": 134860 }, { - "epoch": 1.46, - "learning_rate": 8.129662061360834e-05, - "loss": 0.0066, + "epoch": 0.68, + "learning_rate": 0.00019793452432004277, + "loss": 0.0146, "step": 134870 }, { - "epoch": 1.46, - "learning_rate": 8.128040474800545e-05, - "loss": 0.0091, + "epoch": 0.68, + "learning_rate": 0.00019792695662702877, + "loss": 0.0134, "step": 134880 }, { - "epoch": 1.46, - "learning_rate": 8.126418888240253e-05, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019791938893401476, + "loss": 0.0142, "step": 134890 }, { - "epoch": 1.46, - "learning_rate": 8.124797301679964e-05, - "loss": 0.011, + "epoch": 0.68, + "learning_rate": 0.00019791182124100074, + "loss": 0.0109, "step": 134900 }, { - "epoch": 1.46, - "learning_rate": 8.123175715119672e-05, - "loss": 0.0105, + "epoch": 0.68, + "learning_rate": 0.00019790425354798675, + "loss": 0.013, "step": 134910 }, { - "epoch": 1.46, - "learning_rate": 8.121554128559382e-05, - "loss": 0.0058, + "epoch": 0.68, + "learning_rate": 0.00019789668585497273, + "loss": 0.0203, "step": 134920 }, { - "epoch": 1.46, - "learning_rate": 8.11993254199909e-05, - "loss": 0.0095, + "epoch": 0.68, + "learning_rate": 0.0001978891181619587, + "loss": 0.0123, "step": 134930 }, { - "epoch": 1.46, - "learning_rate": 8.118310955438801e-05, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019788155046894472, + "loss": 0.0158, "step": 134940 }, { - "epoch": 1.46, - "learning_rate": 8.11668936887851e-05, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.0001978739827759307, + "loss": 0.0146, "step": 134950 }, { - "epoch": 1.46, - "learning_rate": 8.115067782318219e-05, - "loss": 0.0128, + "epoch": 0.68, + "learning_rate": 0.00019786641508291668, + "loss": 0.0126, "step": 134960 }, { - "epoch": 1.46, - "learning_rate": 8.113446195757929e-05, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.0001978588473899027, + "loss": 0.0152, "step": 134970 }, { - "epoch": 1.46, - "learning_rate": 8.111824609197639e-05, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019785127969688867, + "loss": 0.0125, "step": 134980 }, { - "epoch": 1.46, - "learning_rate": 8.110203022637347e-05, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.00019784371200387465, + "loss": 0.0143, "step": 134990 }, { - "epoch": 1.46, - "learning_rate": 8.108581436077058e-05, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.00019783614431086063, + "loss": 0.0117, "step": 135000 }, { - "epoch": 1.46, - "eval_cer": 0.921567758848024, - "eval_loss": 0.006778133567422628, - "eval_runtime": 121.2762, - "eval_samples_per_second": 16.491, - "eval_steps_per_second": 4.123, + "epoch": 0.68, + "eval_cer": 0.9144663743186606, + "eval_loss": 0.00933473464101553, + "eval_runtime": 116.6822, + "eval_samples_per_second": 17.141, + "eval_steps_per_second": 4.285, "step": 135000 }, { - "epoch": 1.46, - "learning_rate": 8.106959849516766e-05, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.00019782857661784664, + "loss": 0.0122, "step": 135010 }, { - "epoch": 1.46, - "learning_rate": 8.105338262956476e-05, - "loss": 0.0065, + "epoch": 0.68, + "learning_rate": 0.00019782100892483262, + "loss": 0.0107, "step": 135020 }, { - "epoch": 1.46, - "learning_rate": 8.103716676396184e-05, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.0001978134412318186, + "loss": 0.015, "step": 135030 }, { - "epoch": 1.46, - "learning_rate": 8.102095089835895e-05, - "loss": 0.0098, + "epoch": 0.68, + "learning_rate": 0.0001978058735388046, + "loss": 0.014, "step": 135040 }, { - "epoch": 1.46, - "learning_rate": 8.100473503275604e-05, - "loss": 0.0099, + "epoch": 0.68, + "learning_rate": 0.0001977983058457906, + "loss": 0.019, "step": 135050 }, { - "epoch": 1.46, - "learning_rate": 8.098851916715313e-05, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.00019779073815277658, + "loss": 0.0179, "step": 135060 }, { - "epoch": 1.46, - "learning_rate": 8.097230330155023e-05, - "loss": 0.0125, + "epoch": 0.68, + "learning_rate": 0.00019778317045976258, + "loss": 0.0143, "step": 135070 }, { - "epoch": 1.46, - "learning_rate": 8.095608743594732e-05, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019777560276674857, + "loss": 0.0168, "step": 135080 }, { - "epoch": 1.46, - "learning_rate": 8.093987157034441e-05, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019776803507373455, + "loss": 0.0132, "step": 135090 }, { - "epoch": 1.46, - "learning_rate": 8.092365570474152e-05, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019776046738072056, + "loss": 0.0127, "step": 135100 }, { - "epoch": 1.46, - "learning_rate": 8.09074398391386e-05, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.00019775289968770654, + "loss": 0.0127, "step": 135110 }, { - "epoch": 1.46, - "learning_rate": 8.08912239735357e-05, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.0001977453319946925, + "loss": 0.0143, "step": 135120 }, { - "epoch": 1.46, - "learning_rate": 8.087500810793278e-05, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019773776430167847, + "loss": 0.0116, "step": 135130 }, { - "epoch": 1.46, - "learning_rate": 8.085879224232989e-05, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019773019660866448, + "loss": 0.0169, "step": 135140 }, { - "epoch": 1.46, - "learning_rate": 8.084257637672698e-05, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019772262891565046, + "loss": 0.0111, "step": 135150 }, { - "epoch": 1.46, - "learning_rate": 8.082636051112407e-05, - "loss": 0.0066, + "epoch": 0.68, + "learning_rate": 0.00019771506122263644, + "loss": 0.0118, "step": 135160 }, { - "epoch": 1.46, - "learning_rate": 8.081014464552117e-05, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019770749352962245, + "loss": 0.0142, "step": 135170 }, { - "epoch": 1.46, - "learning_rate": 8.079392877991826e-05, - "loss": 0.0071, + "epoch": 0.68, + "learning_rate": 0.00019769992583660843, + "loss": 0.0148, "step": 135180 }, { - "epoch": 1.46, - "learning_rate": 8.077771291431535e-05, - "loss": 0.0088, + "epoch": 0.68, + "learning_rate": 0.00019769235814359442, + "loss": 0.0119, "step": 135190 }, { - "epoch": 1.46, - "learning_rate": 8.076149704871246e-05, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.0001976847904505804, + "loss": 0.0158, "step": 135200 }, { - "epoch": 1.46, - "learning_rate": 8.074528118310954e-05, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.0001976772227575664, + "loss": 0.0143, "step": 135210 }, { - "epoch": 1.46, - "learning_rate": 8.072906531750664e-05, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.0001976696550645524, + "loss": 0.0149, "step": 135220 }, { - "epoch": 1.46, - "learning_rate": 8.071284945190374e-05, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019766208737153837, + "loss": 0.0147, "step": 135230 }, { - "epoch": 1.46, - "learning_rate": 8.069663358630083e-05, - "loss": 0.0091, + "epoch": 0.68, + "learning_rate": 0.00019765451967852438, + "loss": 0.0117, "step": 135240 }, { - "epoch": 1.46, - "learning_rate": 8.068041772069794e-05, - "loss": 0.0071, + "epoch": 0.68, + "learning_rate": 0.00019764695198551036, + "loss": 0.0128, "step": 135250 }, { - "epoch": 1.46, - "learning_rate": 8.066420185509502e-05, - "loss": 0.0066, + "epoch": 0.68, + "learning_rate": 0.00019763938429249634, + "loss": 0.0205, "step": 135260 }, { - "epoch": 1.46, - "learning_rate": 8.064798598949212e-05, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.00019763181659948235, + "loss": 0.011, "step": 135270 }, { - "epoch": 1.46, - "learning_rate": 8.06317701238892e-05, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019762424890646833, + "loss": 0.0122, "step": 135280 }, { - "epoch": 1.46, - "learning_rate": 8.061555425828631e-05, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.0001976166812134543, + "loss": 0.0129, "step": 135290 }, { - "epoch": 1.46, - "learning_rate": 8.05993383926834e-05, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019760911352044032, + "loss": 0.0136, "step": 135300 }, { - "epoch": 1.46, - "learning_rate": 8.058312252708049e-05, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.0001976015458274263, + "loss": 0.0141, "step": 135310 }, { - "epoch": 1.46, - "learning_rate": 8.056690666147759e-05, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019759397813441228, + "loss": 0.0129, "step": 135320 }, { - "epoch": 1.46, - "learning_rate": 8.055069079587468e-05, - "loss": 0.0063, + "epoch": 0.68, + "learning_rate": 0.0001975864104413983, + "loss": 0.0111, "step": 135330 }, { - "epoch": 1.46, - "learning_rate": 8.053447493027177e-05, - "loss": 0.0058, + "epoch": 0.68, + "learning_rate": 0.00019757884274838427, + "loss": 0.0113, "step": 135340 }, { - "epoch": 1.46, - "learning_rate": 8.051825906466888e-05, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019757127505537025, + "loss": 0.0137, "step": 135350 }, { - "epoch": 1.46, - "learning_rate": 8.050204319906596e-05, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019756370736235626, + "loss": 0.0151, "step": 135360 }, { - "epoch": 1.46, - "learning_rate": 8.048582733346306e-05, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019755613966934224, + "loss": 0.0134, "step": 135370 }, { - "epoch": 1.46, - "learning_rate": 8.046961146786014e-05, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019754857197632823, + "loss": 0.0149, "step": 135380 }, { - "epoch": 1.46, - "learning_rate": 8.045339560225725e-05, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.0001975410042833142, + "loss": 0.0132, "step": 135390 }, { - "epoch": 1.46, - "learning_rate": 8.043717973665433e-05, - "loss": 0.01, + "epoch": 0.68, + "learning_rate": 0.00019753343659030022, + "loss": 0.014, "step": 135400 }, { - "epoch": 1.46, - "learning_rate": 8.042096387105143e-05, - "loss": 0.0066, + "epoch": 0.68, + "learning_rate": 0.0001975258688972862, + "loss": 0.0124, "step": 135410 }, { - "epoch": 1.46, - "learning_rate": 8.040474800544853e-05, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.00019751830120427218, + "loss": 0.0117, "step": 135420 }, { - "epoch": 1.46, - "learning_rate": 8.038853213984562e-05, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.0001975107335112582, + "loss": 0.0134, "step": 135430 }, { - "epoch": 1.46, - "learning_rate": 8.037231627424271e-05, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019750316581824417, + "loss": 0.0148, "step": 135440 }, { - "epoch": 1.46, - "learning_rate": 8.035610040863982e-05, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019749559812523015, + "loss": 0.0132, "step": 135450 }, { - "epoch": 1.46, - "learning_rate": 8.03398845430369e-05, - "loss": 0.0101, + "epoch": 0.68, + "learning_rate": 0.00019748803043221616, + "loss": 0.013, "step": 135460 }, { - "epoch": 1.46, - "learning_rate": 8.0323668677434e-05, - "loss": 0.0058, + "epoch": 0.68, + "learning_rate": 0.00019748046273920214, + "loss": 0.0108, "step": 135470 }, { - "epoch": 1.46, - "learning_rate": 8.030745281183108e-05, - "loss": 0.0064, + "epoch": 0.68, + "learning_rate": 0.00019747289504618812, + "loss": 0.0133, "step": 135480 }, { - "epoch": 1.46, - "learning_rate": 8.029123694622819e-05, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.00019746532735317413, + "loss": 0.0164, "step": 135490 }, { - "epoch": 1.46, - "learning_rate": 8.027502108062527e-05, - "loss": 0.0066, + "epoch": 0.68, + "learning_rate": 0.0001974577596601601, + "loss": 0.0146, "step": 135500 }, { - "epoch": 1.46, - "learning_rate": 8.025880521502237e-05, - "loss": 0.0094, + "epoch": 0.68, + "learning_rate": 0.0001974501919671461, + "loss": 0.0148, "step": 135510 }, { - "epoch": 1.47, - "learning_rate": 8.024258934941947e-05, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.0001974426242741321, + "loss": 0.0177, "step": 135520 }, { - "epoch": 1.47, - "learning_rate": 8.022637348381656e-05, - "loss": 0.0059, + "epoch": 0.68, + "learning_rate": 0.00019743505658111808, + "loss": 0.0128, "step": 135530 }, { - "epoch": 1.47, - "learning_rate": 8.021015761821365e-05, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019742748888810406, + "loss": 0.0183, "step": 135540 }, { - "epoch": 1.47, - "learning_rate": 8.019394175261075e-05, - "loss": 0.0063, + "epoch": 0.68, + "learning_rate": 0.00019741992119509005, + "loss": 0.0151, "step": 135550 }, { - "epoch": 1.47, - "learning_rate": 8.017772588700784e-05, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.00019741235350207605, + "loss": 0.0183, "step": 135560 }, { - "epoch": 1.47, - "learning_rate": 8.016151002140494e-05, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019740478580906204, + "loss": 0.0148, "step": 135570 }, { - "epoch": 1.47, - "learning_rate": 8.014529415580202e-05, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019739721811604802, + "loss": 0.0146, "step": 135580 }, { - "epoch": 1.47, - "learning_rate": 8.012907829019913e-05, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.00019738965042303403, + "loss": 0.0162, "step": 135590 }, { - "epoch": 1.47, - "learning_rate": 8.011286242459621e-05, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.00019738208273002, + "loss": 0.0134, "step": 135600 }, { - "epoch": 1.47, - "learning_rate": 8.009664655899332e-05, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.000197374515037006, + "loss": 0.0136, "step": 135610 }, { - "epoch": 1.47, - "learning_rate": 8.00804306933904e-05, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.000197366947343992, + "loss": 0.0145, "step": 135620 }, { - "epoch": 1.47, - "learning_rate": 8.00642148277875e-05, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.00019735937965097798, + "loss": 0.0105, "step": 135630 }, { - "epoch": 1.47, - "learning_rate": 8.00479989621846e-05, - "loss": 0.0091, + "epoch": 0.68, + "learning_rate": 0.00019735181195796396, + "loss": 0.0102, "step": 135640 }, { - "epoch": 1.47, - "learning_rate": 8.003178309658169e-05, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019734424426494997, + "loss": 0.013, "step": 135650 }, { - "epoch": 1.47, - "learning_rate": 8.001556723097878e-05, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019733667657193595, + "loss": 0.0098, "step": 135660 }, { - "epoch": 1.47, - "learning_rate": 7.999935136537589e-05, - "loss": 0.0098, + "epoch": 0.68, + "learning_rate": 0.00019732910887892193, + "loss": 0.0126, "step": 135670 }, { - "epoch": 1.47, - "learning_rate": 7.998313549977297e-05, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019732154118590794, + "loss": 0.0154, "step": 135680 }, { - "epoch": 1.47, - "learning_rate": 7.996691963417007e-05, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.00019731397349289392, + "loss": 0.0128, "step": 135690 }, { - "epoch": 1.47, - "learning_rate": 7.995070376856715e-05, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.0001973064057998799, + "loss": 0.0131, "step": 135700 }, { - "epoch": 1.47, - "learning_rate": 7.993448790296426e-05, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019729883810686588, + "loss": 0.0124, "step": 135710 }, { - "epoch": 1.47, - "learning_rate": 7.991827203736134e-05, - "loss": 0.0097, + "epoch": 0.68, + "learning_rate": 0.0001972912704138519, + "loss": 0.0122, "step": 135720 }, { - "epoch": 1.47, - "learning_rate": 7.990205617175844e-05, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.00019728370272083787, + "loss": 0.0134, "step": 135730 }, { - "epoch": 1.47, - "learning_rate": 7.988584030615554e-05, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.00019727613502782386, + "loss": 0.0138, "step": 135740 }, { - "epoch": 1.47, - "learning_rate": 7.986962444055263e-05, - "loss": 0.0109, + "epoch": 0.68, + "learning_rate": 0.00019726856733480986, + "loss": 0.0124, "step": 135750 }, { - "epoch": 1.47, - "learning_rate": 7.985340857494972e-05, - "loss": 0.0107, + "epoch": 0.68, + "learning_rate": 0.00019726099964179585, + "loss": 0.0137, "step": 135760 }, { - "epoch": 1.47, - "learning_rate": 7.983719270934681e-05, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.00019725343194878183, + "loss": 0.0131, "step": 135770 }, { - "epoch": 1.47, - "learning_rate": 7.98209768437439e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019724586425576784, + "loss": 0.0148, "step": 135780 }, { - "epoch": 1.47, - "learning_rate": 7.980476097814101e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.00019723829656275382, + "loss": 0.0161, "step": 135790 }, { - "epoch": 1.47, - "learning_rate": 7.978854511253809e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.0001972307288697398, + "loss": 0.0136, "step": 135800 }, { - "epoch": 1.47, - "learning_rate": 7.97723292469352e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001972231611767258, + "loss": 0.0111, "step": 135810 }, { - "epoch": 1.47, - "learning_rate": 7.975611338133228e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.0001972155934837118, + "loss": 0.0104, "step": 135820 }, { - "epoch": 1.47, - "learning_rate": 7.973989751572938e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.00019720802579069777, + "loss": 0.0129, "step": 135830 }, { - "epoch": 1.47, - "learning_rate": 7.972368165012648e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019720045809768378, + "loss": 0.0123, "step": 135840 }, { - "epoch": 1.47, - "learning_rate": 7.970746578452357e-05, - "loss": 0.0097, + "epoch": 0.69, + "learning_rate": 0.00019719289040466976, + "loss": 0.0154, "step": 135850 }, { - "epoch": 1.47, - "learning_rate": 7.969124991892066e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019718532271165574, + "loss": 0.0106, "step": 135860 }, { - "epoch": 1.47, - "learning_rate": 7.967503405331775e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019717775501864175, + "loss": 0.0124, "step": 135870 }, { - "epoch": 1.47, - "learning_rate": 7.965881818771485e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019717018732562773, + "loss": 0.0121, "step": 135880 }, { - "epoch": 1.47, - "learning_rate": 7.964260232211195e-05, - "loss": 0.0109, + "epoch": 0.69, + "learning_rate": 0.0001971626196326137, + "loss": 0.0112, "step": 135890 }, { - "epoch": 1.47, - "learning_rate": 7.962638645650903e-05, - "loss": 0.0123, + "epoch": 0.69, + "learning_rate": 0.0001971550519395997, + "loss": 0.0111, "step": 135900 }, { - "epoch": 1.47, - "learning_rate": 7.961017059090614e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.0001971474842465857, + "loss": 0.0161, "step": 135910 }, { - "epoch": 1.47, - "learning_rate": 7.959395472530322e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019713991655357168, + "loss": 0.0132, "step": 135920 }, { - "epoch": 1.47, - "learning_rate": 7.957773885970032e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019713234886055767, + "loss": 0.0151, "step": 135930 }, { - "epoch": 1.47, - "learning_rate": 7.95615229940974e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.00019712478116754367, + "loss": 0.0137, "step": 135940 }, { - "epoch": 1.47, - "learning_rate": 7.954530712849451e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019711721347452966, + "loss": 0.0143, "step": 135950 }, { - "epoch": 1.47, - "learning_rate": 7.952909126289162e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019710964578151564, + "loss": 0.0124, "step": 135960 }, { - "epoch": 1.47, - "learning_rate": 7.95128753972887e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.00019710207808850165, + "loss": 0.0159, "step": 135970 }, { - "epoch": 1.47, - "learning_rate": 7.94966595316858e-05, - "loss": 0.01, + "epoch": 0.69, + "learning_rate": 0.00019709451039548763, + "loss": 0.0162, "step": 135980 }, { - "epoch": 1.47, - "learning_rate": 7.94804436660829e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.0001970869427024736, + "loss": 0.0157, "step": 135990 }, { - "epoch": 1.47, - "learning_rate": 7.946422780047999e-05, - "loss": 0.009, + "epoch": 0.69, + "learning_rate": 0.00019707937500945962, + "loss": 0.0106, "step": 136000 }, { - "epoch": 1.47, - "eval_cer": 0.9215312775238562, - "eval_loss": 0.006653364282101393, - "eval_runtime": 121.3191, - "eval_samples_per_second": 16.485, - "eval_steps_per_second": 4.121, + "epoch": 0.69, + "eval_cer": 0.9144586111496574, + "eval_loss": 0.009702920913696289, + "eval_runtime": 116.6777, + "eval_samples_per_second": 17.141, + "eval_steps_per_second": 4.285, "step": 136000 }, { - "epoch": 1.47, - "learning_rate": 7.944801193487708e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.0001970718073164456, + "loss": 0.0132, "step": 136010 }, { - "epoch": 1.47, - "learning_rate": 7.943179606927417e-05, - "loss": 0.0108, + "epoch": 0.69, + "learning_rate": 0.00019706423962343158, + "loss": 0.011, "step": 136020 }, { - "epoch": 1.47, - "learning_rate": 7.941558020367127e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001970566719304176, + "loss": 0.0127, "step": 136030 }, { - "epoch": 1.47, - "learning_rate": 7.939936433806837e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.00019704910423740357, + "loss": 0.017, "step": 136040 }, { - "epoch": 1.47, - "learning_rate": 7.938314847246545e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.00019704153654438955, + "loss": 0.0134, "step": 136050 }, { - "epoch": 1.47, - "learning_rate": 7.936693260686256e-05, - "loss": 0.0054, + "epoch": 0.69, + "learning_rate": 0.00019703396885137553, + "loss": 0.0156, "step": 136060 }, { - "epoch": 1.47, - "learning_rate": 7.935071674125964e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019702640115836154, + "loss": 0.0128, "step": 136070 }, { - "epoch": 1.47, - "learning_rate": 7.933450087565674e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.00019701883346534752, + "loss": 0.0122, "step": 136080 }, { - "epoch": 1.47, - "learning_rate": 7.931828501005382e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.0001970112657723335, + "loss": 0.0161, "step": 136090 }, { - "epoch": 1.47, - "learning_rate": 7.930206914445093e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.0001970036980793195, + "loss": 0.0111, "step": 136100 }, { - "epoch": 1.47, - "learning_rate": 7.928585327884802e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.0001969961303863055, + "loss": 0.0135, "step": 136110 }, { - "epoch": 1.47, - "learning_rate": 7.926963741324511e-05, - "loss": 0.0105, + "epoch": 0.69, + "learning_rate": 0.00019698856269329148, + "loss": 0.0146, "step": 136120 }, { - "epoch": 1.47, - "learning_rate": 7.92534215476422e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019698099500027748, + "loss": 0.0135, "step": 136130 }, { - "epoch": 1.47, - "learning_rate": 7.923720568203931e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019697342730726347, + "loss": 0.0135, "step": 136140 }, { - "epoch": 1.47, - "learning_rate": 7.922098981643639e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.00019696585961424945, + "loss": 0.0127, "step": 136150 }, { - "epoch": 1.47, - "learning_rate": 7.92047739508335e-05, - "loss": 0.0124, + "epoch": 0.69, + "learning_rate": 0.00019695829192123546, + "loss": 0.0135, "step": 136160 }, { - "epoch": 1.47, - "learning_rate": 7.918855808523058e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019695072422822144, + "loss": 0.0124, "step": 136170 }, { - "epoch": 1.47, - "learning_rate": 7.917234221962768e-05, - "loss": 0.0108, + "epoch": 0.69, + "learning_rate": 0.00019694315653520742, + "loss": 0.0131, "step": 136180 }, { - "epoch": 1.47, - "learning_rate": 7.915612635402476e-05, - "loss": 0.0105, + "epoch": 0.69, + "learning_rate": 0.00019693558884219343, + "loss": 0.0183, "step": 136190 }, { - "epoch": 1.47, - "learning_rate": 7.913991048842187e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.0001969280211491794, + "loss": 0.0163, "step": 136200 }, { - "epoch": 1.47, - "learning_rate": 7.912369462281896e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.0001969204534561654, + "loss": 0.0133, "step": 136210 }, { - "epoch": 1.47, - "learning_rate": 7.910747875721605e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019691288576315137, + "loss": 0.0157, "step": 136220 }, { - "epoch": 1.47, - "learning_rate": 7.909126289161315e-05, - "loss": 0.0102, + "epoch": 0.69, + "learning_rate": 0.00019690531807013738, + "loss": 0.0134, "step": 136230 }, { - "epoch": 1.47, - "learning_rate": 7.907504702601024e-05, - "loss": 0.0095, + "epoch": 0.69, + "learning_rate": 0.00019689775037712336, + "loss": 0.014, "step": 136240 }, { - "epoch": 1.47, - "learning_rate": 7.905883116040733e-05, - "loss": 0.0097, + "epoch": 0.69, + "learning_rate": 0.00019689018268410934, + "loss": 0.0109, "step": 136250 }, { - "epoch": 1.47, - "learning_rate": 7.904261529480444e-05, - "loss": 0.0104, + "epoch": 0.69, + "learning_rate": 0.00019688261499109535, + "loss": 0.0135, "step": 136260 }, { - "epoch": 1.47, - "learning_rate": 7.902639942920152e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019687504729808133, + "loss": 0.0123, "step": 136270 }, { - "epoch": 1.47, - "learning_rate": 7.901018356359862e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.00019686747960506731, + "loss": 0.0179, "step": 136280 }, { - "epoch": 1.47, - "learning_rate": 7.89939676979957e-05, - "loss": 0.0088, + "epoch": 0.69, + "learning_rate": 0.00019685991191205332, + "loss": 0.0127, "step": 136290 }, { - "epoch": 1.47, - "learning_rate": 7.897775183239281e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.0001968523442190393, + "loss": 0.0116, "step": 136300 }, { - "epoch": 1.47, - "learning_rate": 7.89615359667899e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019684477652602529, + "loss": 0.0128, "step": 136310 }, { - "epoch": 1.47, - "learning_rate": 7.8945320101187e-05, - "loss": 0.0063, + "epoch": 0.69, + "learning_rate": 0.0001968372088330113, + "loss": 0.0176, "step": 136320 }, { - "epoch": 1.47, - "learning_rate": 7.892910423558409e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019682964113999728, + "loss": 0.0134, "step": 136330 }, { - "epoch": 1.47, - "learning_rate": 7.891288836998118e-05, - "loss": 0.0101, + "epoch": 0.69, + "learning_rate": 0.00019682207344698326, + "loss": 0.0114, "step": 136340 }, { - "epoch": 1.47, - "learning_rate": 7.889667250437827e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.00019681450575396927, + "loss": 0.014, "step": 136350 }, { - "epoch": 1.47, - "learning_rate": 7.888045663877538e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.00019680693806095525, + "loss": 0.0137, "step": 136360 }, { - "epoch": 1.47, - "learning_rate": 7.886424077317246e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019679937036794123, + "loss": 0.0153, "step": 136370 }, { - "epoch": 1.47, - "learning_rate": 7.884802490756957e-05, - "loss": 0.0064, + "epoch": 0.69, + "learning_rate": 0.00019679180267492718, + "loss": 0.0135, "step": 136380 }, { - "epoch": 1.47, - "learning_rate": 7.883180904196664e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.0001967842349819132, + "loss": 0.011, "step": 136390 }, { - "epoch": 1.47, - "learning_rate": 7.881559317636375e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019677666728889917, + "loss": 0.0117, "step": 136400 }, { - "epoch": 1.47, - "learning_rate": 7.879937731076083e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.00019676909959588515, + "loss": 0.0144, "step": 136410 }, { - "epoch": 1.47, - "learning_rate": 7.878316144515794e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.00019676153190287116, + "loss": 0.0189, "step": 136420 }, { - "epoch": 1.47, - "learning_rate": 7.876694557955503e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.00019675396420985714, + "loss": 0.0138, "step": 136430 }, { - "epoch": 1.47, - "learning_rate": 7.875072971395212e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019674639651684313, + "loss": 0.0149, "step": 136440 }, { - "epoch": 1.48, - "learning_rate": 7.873451384834921e-05, - "loss": 0.0097, + "epoch": 0.69, + "learning_rate": 0.0001967388288238291, + "loss": 0.0118, "step": 136450 }, { - "epoch": 1.48, - "learning_rate": 7.871829798274632e-05, - "loss": 0.0088, + "epoch": 0.69, + "learning_rate": 0.00019673126113081512, + "loss": 0.0119, "step": 136460 }, { - "epoch": 1.48, - "learning_rate": 7.87020821171434e-05, - "loss": 0.0068, + "epoch": 0.69, + "learning_rate": 0.0001967236934378011, + "loss": 0.0147, "step": 136470 }, { - "epoch": 1.48, - "learning_rate": 7.86858662515405e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019671612574478708, + "loss": 0.0142, "step": 136480 }, { - "epoch": 1.48, - "learning_rate": 7.866965038593759e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.0001967085580517731, + "loss": 0.012, "step": 136490 }, { - "epoch": 1.48, - "learning_rate": 7.865343452033469e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.00019670099035875907, + "loss": 0.0116, "step": 136500 }, { - "epoch": 1.48, - "learning_rate": 7.863721865473177e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019669342266574505, + "loss": 0.0124, "step": 136510 }, { - "epoch": 1.48, - "learning_rate": 7.862100278912888e-05, - "loss": 0.0101, + "epoch": 0.69, + "learning_rate": 0.00019668585497273106, + "loss": 0.0137, "step": 136520 }, { - "epoch": 1.48, - "learning_rate": 7.860478692352597e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019667828727971704, + "loss": 0.0134, "step": 136530 }, { - "epoch": 1.48, - "learning_rate": 7.858857105792306e-05, - "loss": 0.0099, + "epoch": 0.69, + "learning_rate": 0.00019667071958670302, + "loss": 0.0137, "step": 136540 }, { - "epoch": 1.48, - "learning_rate": 7.857235519232016e-05, - "loss": 0.0063, + "epoch": 0.69, + "learning_rate": 0.00019666315189368903, + "loss": 0.013, "step": 136550 }, { - "epoch": 1.48, - "learning_rate": 7.855613932671725e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.000196655584200675, + "loss": 0.0112, "step": 136560 }, { - "epoch": 1.48, - "learning_rate": 7.853992346111434e-05, - "loss": 0.0105, + "epoch": 0.69, + "learning_rate": 0.000196648016507661, + "loss": 0.0183, "step": 136570 }, { - "epoch": 1.48, - "learning_rate": 7.852370759551145e-05, - "loss": 0.0068, + "epoch": 0.69, + "learning_rate": 0.000196640448814647, + "loss": 0.0112, "step": 136580 }, { - "epoch": 1.48, - "learning_rate": 7.850749172990853e-05, - "loss": 0.0065, + "epoch": 0.69, + "learning_rate": 0.00019663288112163298, + "loss": 0.0123, "step": 136590 }, { - "epoch": 1.48, - "learning_rate": 7.849127586430563e-05, - "loss": 0.0088, + "epoch": 0.69, + "learning_rate": 0.00019662531342861896, + "loss": 0.013, "step": 136600 }, { - "epoch": 1.48, - "learning_rate": 7.847505999870271e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019661774573560495, + "loss": 0.0127, "step": 136610 }, { - "epoch": 1.48, - "learning_rate": 7.845884413309982e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019661017804259095, + "loss": 0.01, "step": 136620 }, { - "epoch": 1.48, - "learning_rate": 7.84426282674969e-05, - "loss": 0.006, + "epoch": 0.69, + "learning_rate": 0.00019660261034957694, + "loss": 0.0118, "step": 136630 }, { - "epoch": 1.48, - "learning_rate": 7.8426412401894e-05, - "loss": 0.0111, + "epoch": 0.69, + "learning_rate": 0.00019659504265656292, + "loss": 0.0179, "step": 136640 }, { - "epoch": 1.48, - "learning_rate": 7.84101965362911e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019658747496354893, + "loss": 0.0138, "step": 136650 }, { - "epoch": 1.48, - "learning_rate": 7.839398067068819e-05, - "loss": 0.01, + "epoch": 0.69, + "learning_rate": 0.0001965799072705349, + "loss": 0.0122, "step": 136660 }, { - "epoch": 1.48, - "learning_rate": 7.83777648050853e-05, - "loss": 0.0066, + "epoch": 0.69, + "learning_rate": 0.0001965723395775209, + "loss": 0.0123, "step": 136670 }, { - "epoch": 1.48, - "learning_rate": 7.836154893948239e-05, - "loss": 0.0095, + "epoch": 0.69, + "learning_rate": 0.0001965647718845069, + "loss": 0.0153, "step": 136680 }, { - "epoch": 1.48, - "learning_rate": 7.834533307387948e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.00019655720419149288, + "loss": 0.0126, "step": 136690 }, { - "epoch": 1.48, - "learning_rate": 7.832911720827657e-05, - "loss": 0.0061, + "epoch": 0.69, + "learning_rate": 0.00019654963649847886, + "loss": 0.0124, "step": 136700 }, { - "epoch": 1.48, - "learning_rate": 7.831290134267367e-05, - "loss": 0.009, + "epoch": 0.69, + "learning_rate": 0.00019654206880546487, + "loss": 0.015, "step": 136710 }, { - "epoch": 1.48, - "learning_rate": 7.829668547707076e-05, - "loss": 0.0098, + "epoch": 0.69, + "learning_rate": 0.00019653450111245085, + "loss": 0.0141, "step": 136720 }, { - "epoch": 1.48, - "learning_rate": 7.828046961146787e-05, - "loss": 0.006, + "epoch": 0.69, + "learning_rate": 0.00019652693341943683, + "loss": 0.0182, "step": 136730 }, { - "epoch": 1.48, - "learning_rate": 7.826425374586494e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.00019651936572642284, + "loss": 0.0153, "step": 136740 }, { - "epoch": 1.48, - "learning_rate": 7.824803788026205e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019651179803340882, + "loss": 0.0119, "step": 136750 }, { - "epoch": 1.48, - "learning_rate": 7.823182201465913e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.0001965042303403948, + "loss": 0.0148, "step": 136760 }, { - "epoch": 1.48, - "learning_rate": 7.821560614905624e-05, - "loss": 0.009, + "epoch": 0.69, + "learning_rate": 0.0001964966626473808, + "loss": 0.0092, "step": 136770 }, { - "epoch": 1.48, - "learning_rate": 7.819939028345332e-05, - "loss": 0.0061, + "epoch": 0.69, + "learning_rate": 0.0001964890949543668, + "loss": 0.0151, "step": 136780 }, { - "epoch": 1.48, - "learning_rate": 7.818317441785042e-05, - "loss": 0.0098, + "epoch": 0.69, + "learning_rate": 0.00019648152726135277, + "loss": 0.013, "step": 136790 }, { - "epoch": 1.48, - "learning_rate": 7.816695855224752e-05, - "loss": 0.0068, + "epoch": 0.69, + "learning_rate": 0.00019647395956833876, + "loss": 0.0186, "step": 136800 }, { - "epoch": 1.48, - "learning_rate": 7.815074268664461e-05, - "loss": 0.0061, + "epoch": 0.69, + "learning_rate": 0.00019646639187532476, + "loss": 0.015, "step": 136810 }, { - "epoch": 1.48, - "learning_rate": 7.81345268210417e-05, - "loss": 0.0104, + "epoch": 0.69, + "learning_rate": 0.00019645882418231075, + "loss": 0.0149, "step": 136820 }, { - "epoch": 1.48, - "learning_rate": 7.811831095543881e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019645125648929673, + "loss": 0.013, "step": 136830 }, { - "epoch": 1.48, - "learning_rate": 7.810209508983589e-05, - "loss": 0.0102, + "epoch": 0.69, + "learning_rate": 0.00019644368879628274, + "loss": 0.0142, "step": 136840 }, { - "epoch": 1.48, - "learning_rate": 7.808587922423299e-05, - "loss": 0.0066, + "epoch": 0.69, + "learning_rate": 0.00019643612110326872, + "loss": 0.0135, "step": 136850 }, { - "epoch": 1.48, - "learning_rate": 7.806966335863007e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.0001964285534102547, + "loss": 0.0171, "step": 136860 }, { - "epoch": 1.48, - "learning_rate": 7.805344749302718e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.0001964209857172407, + "loss": 0.0136, "step": 136870 }, { - "epoch": 1.48, - "learning_rate": 7.803723162742426e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.0001964134180242267, + "loss": 0.0126, "step": 136880 }, { - "epoch": 1.48, - "learning_rate": 7.802101576182136e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019640585033121267, + "loss": 0.0149, "step": 136890 }, { - "epoch": 1.48, - "learning_rate": 7.800479989621846e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019639828263819868, + "loss": 0.0149, "step": 136900 }, { - "epoch": 1.48, - "learning_rate": 7.798858403061555e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019639071494518466, + "loss": 0.0183, "step": 136910 }, { - "epoch": 1.48, - "learning_rate": 7.797236816501264e-05, - "loss": 0.0064, + "epoch": 0.69, + "learning_rate": 0.00019638314725217064, + "loss": 0.0138, "step": 136920 }, { - "epoch": 1.48, - "learning_rate": 7.795615229940973e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.00019637557955915665, + "loss": 0.0111, "step": 136930 }, { - "epoch": 1.48, - "learning_rate": 7.793993643380683e-05, - "loss": 0.006, + "epoch": 0.69, + "learning_rate": 0.00019636801186614263, + "loss": 0.0111, "step": 136940 }, { - "epoch": 1.48, - "learning_rate": 7.792372056820393e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.0001963604441731286, + "loss": 0.0159, "step": 136950 }, { - "epoch": 1.48, - "learning_rate": 7.790750470260101e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.0001963528764801146, + "loss": 0.0109, "step": 136960 }, { - "epoch": 1.48, - "learning_rate": 7.789128883699812e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.0001963453087871006, + "loss": 0.0137, "step": 136970 }, { - "epoch": 1.48, - "learning_rate": 7.78750729713952e-05, - "loss": 0.0067, + "epoch": 0.69, + "learning_rate": 0.00019633774109408658, + "loss": 0.0116, "step": 136980 }, { - "epoch": 1.48, - "learning_rate": 7.78588571057923e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019633017340107257, + "loss": 0.011, "step": 136990 }, { - "epoch": 1.48, - "learning_rate": 7.78426412401894e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.00019632260570805857, + "loss": 0.0151, "step": 137000 }, { - "epoch": 1.48, - "eval_cer": 0.9215529925977656, - "eval_loss": 0.006497697904706001, - "eval_runtime": 121.1874, - "eval_samples_per_second": 16.503, - "eval_steps_per_second": 4.126, + "epoch": 0.69, + "eval_cer": 0.914462492734159, + "eval_loss": 0.009697197005152702, + "eval_runtime": 116.8588, + "eval_samples_per_second": 17.115, + "eval_steps_per_second": 4.279, "step": 137000 }, { - "epoch": 1.48, - "learning_rate": 7.782642537458649e-05, - "loss": 0.0112, + "epoch": 0.69, + "learning_rate": 0.00019631503801504456, + "loss": 0.0125, "step": 137010 }, { - "epoch": 1.48, - "learning_rate": 7.781020950898358e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.00019630747032203054, + "loss": 0.0121, "step": 137020 }, { - "epoch": 1.48, - "learning_rate": 7.779399364338068e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.00019629990262901655, + "loss": 0.0134, "step": 137030 }, { - "epoch": 1.48, - "learning_rate": 7.777777777777777e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019629233493600253, + "loss": 0.0124, "step": 137040 }, { - "epoch": 1.48, - "learning_rate": 7.776156191217487e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.0001962847672429885, + "loss": 0.0112, "step": 137050 }, { - "epoch": 1.48, - "learning_rate": 7.774534604657195e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019627719954997452, + "loss": 0.0138, "step": 137060 }, { - "epoch": 1.48, - "learning_rate": 7.772913018096906e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001962696318569605, + "loss": 0.0137, "step": 137070 }, { - "epoch": 1.48, - "learning_rate": 7.771291431536614e-05, - "loss": 0.0063, + "epoch": 0.69, + "learning_rate": 0.00019626206416394648, + "loss": 0.0146, "step": 137080 }, { - "epoch": 1.48, - "learning_rate": 7.769669844976325e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.0001962544964709325, + "loss": 0.0131, "step": 137090 }, { - "epoch": 1.48, - "learning_rate": 7.768048258416032e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019624692877791847, + "loss": 0.014, "step": 137100 }, { - "epoch": 1.48, - "learning_rate": 7.766426671855743e-05, - "loss": 0.0067, + "epoch": 0.69, + "learning_rate": 0.00019623936108490445, + "loss": 0.0163, "step": 137110 }, { - "epoch": 1.48, - "learning_rate": 7.764805085295452e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.00019623179339189043, + "loss": 0.0127, "step": 137120 }, { - "epoch": 1.48, - "learning_rate": 7.763183498735162e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019622422569887644, + "loss": 0.0135, "step": 137130 }, { - "epoch": 1.48, - "learning_rate": 7.761561912174871e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.00019621665800586242, + "loss": 0.0147, "step": 137140 }, { - "epoch": 1.48, - "learning_rate": 7.759940325614582e-05, - "loss": 0.0108, + "epoch": 0.69, + "learning_rate": 0.0001962090903128484, + "loss": 0.0138, "step": 137150 }, { - "epoch": 1.48, - "learning_rate": 7.75831873905429e-05, - "loss": 0.0097, + "epoch": 0.69, + "learning_rate": 0.0001962015226198344, + "loss": 0.0134, "step": 137160 }, { - "epoch": 1.48, - "learning_rate": 7.756697152494e-05, - "loss": 0.0098, + "epoch": 0.69, + "learning_rate": 0.0001961939549268204, + "loss": 0.0146, "step": 137170 }, { - "epoch": 1.48, - "learning_rate": 7.755075565933708e-05, - "loss": 0.0058, + "epoch": 0.69, + "learning_rate": 0.00019618638723380638, + "loss": 0.0127, "step": 137180 }, { - "epoch": 1.48, - "learning_rate": 7.753453979373419e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019617881954079238, + "loss": 0.015, "step": 137190 }, { - "epoch": 1.48, - "learning_rate": 7.751832392813127e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.00019617125184777837, + "loss": 0.0133, "step": 137200 }, { - "epoch": 1.48, - "learning_rate": 7.750210806252837e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019616368415476435, + "loss": 0.0132, "step": 137210 }, { - "epoch": 1.48, - "learning_rate": 7.748589219692546e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.00019615611646175036, + "loss": 0.0115, "step": 137220 }, { - "epoch": 1.48, - "learning_rate": 7.746967633132256e-05, - "loss": 0.0105, + "epoch": 0.69, + "learning_rate": 0.00019614854876873634, + "loss": 0.0117, "step": 137230 }, { - "epoch": 1.48, - "learning_rate": 7.745346046571965e-05, - "loss": 0.0098, + "epoch": 0.69, + "learning_rate": 0.00019614098107572232, + "loss": 0.0124, "step": 137240 }, { - "epoch": 1.48, - "learning_rate": 7.743724460011674e-05, - "loss": 0.0068, + "epoch": 0.69, + "learning_rate": 0.00019613341338270833, + "loss": 0.0129, "step": 137250 }, { - "epoch": 1.48, - "learning_rate": 7.742102873451384e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.0001961258456896943, + "loss": 0.0119, "step": 137260 }, { - "epoch": 1.48, - "learning_rate": 7.740481286891094e-05, - "loss": 0.0059, + "epoch": 0.69, + "learning_rate": 0.0001961182779966803, + "loss": 0.0138, "step": 137270 }, { - "epoch": 1.48, - "learning_rate": 7.738859700330802e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.00019611071030366627, + "loss": 0.0175, "step": 137280 }, { - "epoch": 1.48, - "learning_rate": 7.737238113770513e-05, - "loss": 0.0099, + "epoch": 0.69, + "learning_rate": 0.00019610314261065228, + "loss": 0.016, "step": 137290 }, { - "epoch": 1.48, - "learning_rate": 7.73561652721022e-05, - "loss": 0.0106, + "epoch": 0.69, + "learning_rate": 0.00019609557491763826, + "loss": 0.0146, "step": 137300 }, { - "epoch": 1.48, - "learning_rate": 7.733994940649931e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019608800722462424, + "loss": 0.0115, "step": 137310 }, { - "epoch": 1.48, - "learning_rate": 7.73237335408964e-05, - "loss": 0.0107, + "epoch": 0.69, + "learning_rate": 0.00019608043953161025, + "loss": 0.0112, "step": 137320 }, { - "epoch": 1.48, - "learning_rate": 7.73075176752935e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019607287183859623, + "loss": 0.0111, "step": 137330 }, { - "epoch": 1.48, - "learning_rate": 7.729130180969059e-05, - "loss": 0.0118, + "epoch": 0.69, + "learning_rate": 0.00019606530414558221, + "loss": 0.0155, "step": 137340 }, { - "epoch": 1.48, - "learning_rate": 7.727508594408768e-05, - "loss": 0.0097, + "epoch": 0.69, + "learning_rate": 0.00019605773645256822, + "loss": 0.0134, "step": 137350 }, { - "epoch": 1.48, - "learning_rate": 7.725887007848478e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.0001960501687595542, + "loss": 0.0138, "step": 137360 }, { - "epoch": 1.49, - "learning_rate": 7.724265421288188e-05, - "loss": 0.0104, + "epoch": 0.69, + "learning_rate": 0.00019604260106654019, + "loss": 0.011, "step": 137370 }, { - "epoch": 1.49, - "learning_rate": 7.722643834727896e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.0001960350333735262, + "loss": 0.0125, "step": 137380 }, { - "epoch": 1.49, - "learning_rate": 7.721022248167607e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019602746568051218, + "loss": 0.0132, "step": 137390 }, { - "epoch": 1.49, - "learning_rate": 7.719400661607316e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019601989798749816, + "loss": 0.012, "step": 137400 }, { - "epoch": 1.49, - "learning_rate": 7.717779075047025e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.00019601233029448417, + "loss": 0.0142, "step": 137410 }, { - "epoch": 1.49, - "learning_rate": 7.716157488486736e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.00019600476260147015, + "loss": 0.0114, "step": 137420 }, { - "epoch": 1.49, - "learning_rate": 7.714535901926444e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019599719490845613, + "loss": 0.0148, "step": 137430 }, { - "epoch": 1.49, - "learning_rate": 7.712914315366155e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.00019598962721544214, + "loss": 0.0163, "step": 137440 }, { - "epoch": 1.49, - "learning_rate": 7.711292728805862e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019598205952242812, + "loss": 0.0148, "step": 137450 }, { - "epoch": 1.49, - "learning_rate": 7.709671142245573e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.0001959744918294141, + "loss": 0.0126, "step": 137460 }, { - "epoch": 1.49, - "learning_rate": 7.708049555685282e-05, - "loss": 0.0068, + "epoch": 0.69, + "learning_rate": 0.00019596692413640008, + "loss": 0.0134, "step": 137470 }, { - "epoch": 1.49, - "learning_rate": 7.706427969124992e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.0001959593564433861, + "loss": 0.0143, "step": 137480 }, { - "epoch": 1.49, - "learning_rate": 7.704806382564701e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.00019595178875037207, + "loss": 0.0114, "step": 137490 }, { - "epoch": 1.49, - "learning_rate": 7.70318479600441e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.00019594422105735805, + "loss": 0.0161, "step": 137500 }, { - "epoch": 1.49, - "learning_rate": 7.70156320944412e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019593665336434406, + "loss": 0.0121, "step": 137510 }, { - "epoch": 1.49, - "learning_rate": 7.69994162288383e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019592908567133004, + "loss": 0.0138, "step": 137520 }, { - "epoch": 1.49, - "learning_rate": 7.698320036323538e-05, - "loss": 0.0093, + "epoch": 0.69, + "learning_rate": 0.00019592151797831602, + "loss": 0.0116, "step": 137530 }, { - "epoch": 1.49, - "learning_rate": 7.696698449763249e-05, - "loss": 0.0068, + "epoch": 0.69, + "learning_rate": 0.00019591395028530203, + "loss": 0.0099, "step": 137540 }, { - "epoch": 1.49, - "learning_rate": 7.695076863202957e-05, - "loss": 0.0088, + "epoch": 0.69, + "learning_rate": 0.00019590638259228801, + "loss": 0.0118, "step": 137550 }, { - "epoch": 1.49, - "learning_rate": 7.693455276642667e-05, - "loss": 0.0107, + "epoch": 0.69, + "learning_rate": 0.000195898814899274, + "loss": 0.0136, "step": 137560 }, { - "epoch": 1.49, - "learning_rate": 7.691833690082375e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.00019589124720626, + "loss": 0.0131, "step": 137570 }, { - "epoch": 1.49, - "learning_rate": 7.690212103522086e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019588367951324599, + "loss": 0.012, "step": 137580 }, { - "epoch": 1.49, - "learning_rate": 7.688590516961795e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.00019587611182023197, + "loss": 0.0135, "step": 137590 }, { - "epoch": 1.49, - "learning_rate": 7.686968930401504e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019586854412721798, + "loss": 0.0123, "step": 137600 }, { - "epoch": 1.49, - "learning_rate": 7.685347343841214e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019586097643420396, + "loss": 0.0142, "step": 137610 }, { - "epoch": 1.49, - "learning_rate": 7.683725757280924e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.00019585340874118994, + "loss": 0.0162, "step": 137620 }, { - "epoch": 1.49, - "learning_rate": 7.682104170720632e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.0001958458410481759, + "loss": 0.0137, "step": 137630 }, { - "epoch": 1.49, - "learning_rate": 7.680482584160343e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.0001958382733551619, + "loss": 0.0122, "step": 137640 }, { - "epoch": 1.49, - "learning_rate": 7.67886099760005e-05, - "loss": 0.0103, + "epoch": 0.69, + "learning_rate": 0.00019583070566214788, + "loss": 0.0111, "step": 137650 }, { - "epoch": 1.49, - "learning_rate": 7.677239411039761e-05, - "loss": 0.0065, + "epoch": 0.69, + "learning_rate": 0.00019582313796913386, + "loss": 0.0133, "step": 137660 }, { - "epoch": 1.49, - "learning_rate": 7.675617824479469e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019581557027611985, + "loss": 0.0147, "step": 137670 }, { - "epoch": 1.49, - "learning_rate": 7.67399623791918e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.00019580800258310585, + "loss": 0.0147, "step": 137680 }, { - "epoch": 1.49, - "learning_rate": 7.672374651358889e-05, - "loss": 0.0099, + "epoch": 0.69, + "learning_rate": 0.00019580043489009184, + "loss": 0.0167, "step": 137690 }, { - "epoch": 1.49, - "learning_rate": 7.670753064798598e-05, - "loss": 0.0107, + "epoch": 0.69, + "learning_rate": 0.00019579286719707782, + "loss": 0.0125, "step": 137700 }, { - "epoch": 1.49, - "learning_rate": 7.669131478238308e-05, - "loss": 0.0055, + "epoch": 0.69, + "learning_rate": 0.00019578529950406383, + "loss": 0.0128, "step": 137710 }, { - "epoch": 1.49, - "learning_rate": 7.667509891678017e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.0001957777318110498, + "loss": 0.0137, "step": 137720 }, { - "epoch": 1.49, - "learning_rate": 7.665888305117726e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001957701641180358, + "loss": 0.0108, "step": 137730 }, { - "epoch": 1.49, - "learning_rate": 7.664266718557437e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.0001957625964250218, + "loss": 0.0136, "step": 137740 }, { - "epoch": 1.49, - "learning_rate": 7.662645131997145e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019575502873200778, + "loss": 0.0122, "step": 137750 }, { - "epoch": 1.49, - "learning_rate": 7.661023545436855e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019574746103899376, + "loss": 0.013, "step": 137760 }, { - "epoch": 1.49, - "learning_rate": 7.659401958876563e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.00019573989334597977, + "loss": 0.0126, "step": 137770 }, { - "epoch": 1.49, - "learning_rate": 7.657780372316274e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.00019573232565296575, + "loss": 0.0156, "step": 137780 }, { - "epoch": 1.49, - "learning_rate": 7.656158785755982e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.00019572475795995173, + "loss": 0.0121, "step": 137790 }, { - "epoch": 1.49, - "learning_rate": 7.654537199195692e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.00019571719026693774, + "loss": 0.0118, "step": 137800 }, { - "epoch": 1.49, - "learning_rate": 7.652915612635402e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019570962257392372, + "loss": 0.0113, "step": 137810 }, { - "epoch": 1.49, - "learning_rate": 7.651294026075111e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.0001957020548809097, + "loss": 0.0131, "step": 137820 }, { - "epoch": 1.49, - "learning_rate": 7.64967243951482e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.0001956944871878957, + "loss": 0.0132, "step": 137830 }, { - "epoch": 1.49, - "learning_rate": 7.648050852954531e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.0001956869194948817, + "loss": 0.0109, "step": 137840 }, { - "epoch": 1.49, - "learning_rate": 7.646429266394239e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019567935180186767, + "loss": 0.0143, "step": 137850 }, { - "epoch": 1.49, - "learning_rate": 7.64480767983395e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.00019567178410885366, + "loss": 0.0111, "step": 137860 }, { - "epoch": 1.49, - "learning_rate": 7.643186093273657e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.00019566421641583966, + "loss": 0.0131, "step": 137870 }, { - "epoch": 1.49, - "learning_rate": 7.641564506713368e-05, - "loss": 0.0062, + "epoch": 0.7, + "learning_rate": 0.00019565664872282565, + "loss": 0.0167, "step": 137880 }, { - "epoch": 1.49, - "learning_rate": 7.639942920153076e-05, - "loss": 0.0085, + "epoch": 0.7, + "learning_rate": 0.00019564908102981163, + "loss": 0.015, "step": 137890 }, { - "epoch": 1.49, - "learning_rate": 7.638321333592787e-05, - "loss": 0.0099, + "epoch": 0.7, + "learning_rate": 0.00019564151333679764, + "loss": 0.0151, "step": 137900 }, { - "epoch": 1.49, - "learning_rate": 7.636699747032496e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019563394564378362, + "loss": 0.0129, "step": 137910 }, { - "epoch": 1.49, - "learning_rate": 7.635078160472205e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.0001956263779507696, + "loss": 0.0131, "step": 137920 }, { - "epoch": 1.49, - "learning_rate": 7.633456573911914e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.0001956188102577556, + "loss": 0.0124, "step": 137930 }, { - "epoch": 1.49, - "learning_rate": 7.631834987351624e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.0001956112425647416, + "loss": 0.0113, "step": 137940 }, { - "epoch": 1.49, - "learning_rate": 7.630213400791333e-05, - "loss": 0.01, + "epoch": 0.7, + "learning_rate": 0.00019560367487172757, + "loss": 0.0141, "step": 137950 }, { - "epoch": 1.49, - "learning_rate": 7.628591814231044e-05, - "loss": 0.0115, + "epoch": 0.7, + "learning_rate": 0.00019559610717871358, + "loss": 0.0157, "step": 137960 }, { - "epoch": 1.49, - "learning_rate": 7.626970227670752e-05, - "loss": 0.0085, + "epoch": 0.7, + "learning_rate": 0.00019558853948569956, + "loss": 0.0125, "step": 137970 }, { - "epoch": 1.49, - "learning_rate": 7.625348641110462e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.00019558097179268554, + "loss": 0.0117, "step": 137980 }, { - "epoch": 1.49, - "learning_rate": 7.62372705455017e-05, - "loss": 0.0097, + "epoch": 0.7, + "learning_rate": 0.00019557340409967155, + "loss": 0.0138, "step": 137990 }, { - "epoch": 1.49, - "learning_rate": 7.622105467989881e-05, - "loss": 0.0108, + "epoch": 0.7, + "learning_rate": 0.00019556583640665753, + "loss": 0.0116, "step": 138000 }, { - "epoch": 1.49, - "eval_cer": 0.9215364891415945, - "eval_loss": 0.006428159307688475, - "eval_runtime": 121.4519, - "eval_samples_per_second": 16.467, - "eval_steps_per_second": 4.117, + "epoch": 0.7, + "eval_cer": 0.9144770486760401, + "eval_loss": 0.009700953029096127, + "eval_runtime": 116.67, + "eval_samples_per_second": 17.142, + "eval_steps_per_second": 4.286, "step": 138000 }, { - "epoch": 1.49, - "learning_rate": 7.62048388142959e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.0001955582687136435, + "loss": 0.0138, "step": 138010 }, { - "epoch": 1.49, - "learning_rate": 7.618862294869299e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.0001955507010206295, + "loss": 0.0124, "step": 138020 }, { - "epoch": 1.49, - "learning_rate": 7.617240708309009e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.0001955431333276155, + "loss": 0.0145, "step": 138030 }, { - "epoch": 1.49, - "learning_rate": 7.615619121748718e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019553556563460148, + "loss": 0.0182, "step": 138040 }, { - "epoch": 1.49, - "learning_rate": 7.613997535188427e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019552799794158747, + "loss": 0.0142, "step": 138050 }, { - "epoch": 1.49, - "learning_rate": 7.612375948628138e-05, - "loss": 0.011, + "epoch": 0.7, + "learning_rate": 0.00019552043024857347, + "loss": 0.0124, "step": 138060 }, { - "epoch": 1.49, - "learning_rate": 7.610754362067846e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019551286255555946, + "loss": 0.0141, "step": 138070 }, { - "epoch": 1.49, - "learning_rate": 7.609132775507556e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.00019550529486254544, + "loss": 0.0134, "step": 138080 }, { - "epoch": 1.49, - "learning_rate": 7.607511188947264e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.00019549772716953145, + "loss": 0.0149, "step": 138090 }, { - "epoch": 1.49, - "learning_rate": 7.605889602386975e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019549015947651743, + "loss": 0.0114, "step": 138100 }, { - "epoch": 1.49, - "learning_rate": 7.604268015826685e-05, - "loss": 0.0087, + "epoch": 0.7, + "learning_rate": 0.0001954825917835034, + "loss": 0.0134, "step": 138110 }, { - "epoch": 1.49, - "learning_rate": 7.602646429266393e-05, - "loss": 0.0095, + "epoch": 0.7, + "learning_rate": 0.00019547502409048942, + "loss": 0.0108, "step": 138120 }, { - "epoch": 1.49, - "learning_rate": 7.601024842706104e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.0001954674563974754, + "loss": 0.0123, "step": 138130 }, { - "epoch": 1.49, - "learning_rate": 7.599403256145812e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.00019545988870446138, + "loss": 0.0118, "step": 138140 }, { - "epoch": 1.49, - "learning_rate": 7.597781669585523e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.0001954523210114474, + "loss": 0.0122, "step": 138150 }, { - "epoch": 1.49, - "learning_rate": 7.596160083025232e-05, - "loss": 0.0064, + "epoch": 0.7, + "learning_rate": 0.00019544475331843337, + "loss": 0.0127, "step": 138160 }, { - "epoch": 1.49, - "learning_rate": 7.594538496464941e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019543718562541935, + "loss": 0.0163, "step": 138170 }, { - "epoch": 1.49, - "learning_rate": 7.59291690990465e-05, - "loss": 0.0104, + "epoch": 0.7, + "learning_rate": 0.00019542961793240533, + "loss": 0.013, "step": 138180 }, { - "epoch": 1.49, - "learning_rate": 7.59129532334436e-05, - "loss": 0.0064, + "epoch": 0.7, + "learning_rate": 0.00019542205023939134, + "loss": 0.014, "step": 138190 }, { - "epoch": 1.49, - "learning_rate": 7.589673736784069e-05, - "loss": 0.0085, + "epoch": 0.7, + "learning_rate": 0.00019541448254637732, + "loss": 0.0125, "step": 138200 }, { - "epoch": 1.49, - "learning_rate": 7.58805215022378e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.0001954069148533633, + "loss": 0.013, "step": 138210 }, { - "epoch": 1.49, - "learning_rate": 7.586430563663487e-05, - "loss": 0.0106, + "epoch": 0.7, + "learning_rate": 0.0001953993471603493, + "loss": 0.0118, "step": 138220 }, { - "epoch": 1.49, - "learning_rate": 7.584808977103198e-05, - "loss": 0.0066, + "epoch": 0.7, + "learning_rate": 0.0001953917794673353, + "loss": 0.0124, "step": 138230 }, { - "epoch": 1.49, - "learning_rate": 7.583187390542906e-05, - "loss": 0.0087, + "epoch": 0.7, + "learning_rate": 0.00019538421177432128, + "loss": 0.012, "step": 138240 }, { - "epoch": 1.49, - "learning_rate": 7.581565803982617e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.00019537664408130728, + "loss": 0.0177, "step": 138250 }, { - "epoch": 1.49, - "learning_rate": 7.579944217422325e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019536907638829327, + "loss": 0.0122, "step": 138260 }, { - "epoch": 1.49, - "learning_rate": 7.578322630862035e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019536150869527925, + "loss": 0.0106, "step": 138270 }, { - "epoch": 1.49, - "learning_rate": 7.576701044301744e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.00019535394100226526, + "loss": 0.0116, "step": 138280 }, { - "epoch": 1.49, - "learning_rate": 7.575079457741454e-05, - "loss": 0.0102, + "epoch": 0.7, + "learning_rate": 0.00019534637330925124, + "loss": 0.0129, "step": 138290 }, { - "epoch": 1.5, - "learning_rate": 7.573457871181163e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019533880561623722, + "loss": 0.015, "step": 138300 }, { - "epoch": 1.5, - "learning_rate": 7.571836284620874e-05, - "loss": 0.0056, + "epoch": 0.7, + "learning_rate": 0.00019533123792322323, + "loss": 0.0163, "step": 138310 }, { - "epoch": 1.5, - "learning_rate": 7.570214698060582e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.0001953236702302092, + "loss": 0.0154, "step": 138320 }, { - "epoch": 1.5, - "learning_rate": 7.568593111500292e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.0001953161025371952, + "loss": 0.0121, "step": 138330 }, { - "epoch": 1.5, - "learning_rate": 7.56697152494e-05, - "loss": 0.0094, + "epoch": 0.7, + "learning_rate": 0.0001953085348441812, + "loss": 0.0129, "step": 138340 }, { - "epoch": 1.5, - "learning_rate": 7.565349938379711e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019530096715116718, + "loss": 0.0129, "step": 138350 }, { - "epoch": 1.5, - "learning_rate": 7.563728351819419e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.00019529339945815316, + "loss": 0.0116, "step": 138360 }, { - "epoch": 1.5, - "learning_rate": 7.562106765259129e-05, - "loss": 0.01, + "epoch": 0.7, + "learning_rate": 0.00019528583176513914, + "loss": 0.0105, "step": 138370 }, { - "epoch": 1.5, - "learning_rate": 7.560485178698839e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019527826407212515, + "loss": 0.0136, "step": 138380 }, { - "epoch": 1.5, - "learning_rate": 7.558863592138548e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.00019527069637911113, + "loss": 0.0123, "step": 138390 }, { - "epoch": 1.5, - "learning_rate": 7.557242005578257e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.00019526312868609711, + "loss": 0.0154, "step": 138400 }, { - "epoch": 1.5, - "learning_rate": 7.555620419017966e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019525556099308312, + "loss": 0.0113, "step": 138410 }, { - "epoch": 1.5, - "learning_rate": 7.553998832457676e-05, - "loss": 0.0092, + "epoch": 0.7, + "learning_rate": 0.0001952479933000691, + "loss": 0.0135, "step": 138420 }, { - "epoch": 1.5, - "learning_rate": 7.552377245897386e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019524042560705509, + "loss": 0.0124, "step": 138430 }, { - "epoch": 1.5, - "learning_rate": 7.550755659337094e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.0001952328579140411, + "loss": 0.0094, "step": 138440 }, { - "epoch": 1.5, - "learning_rate": 7.549134072776805e-05, - "loss": 0.01, + "epoch": 0.7, + "learning_rate": 0.00019522529022102708, + "loss": 0.0118, "step": 138450 }, { - "epoch": 1.5, - "learning_rate": 7.547512486216513e-05, - "loss": 0.01, + "epoch": 0.7, + "learning_rate": 0.00019521772252801306, + "loss": 0.0121, "step": 138460 }, { - "epoch": 1.5, - "learning_rate": 7.545890899656223e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019521015483499907, + "loss": 0.0124, "step": 138470 }, { - "epoch": 1.5, - "learning_rate": 7.544269313095933e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.00019520258714198505, + "loss": 0.0146, "step": 138480 }, { - "epoch": 1.5, - "learning_rate": 7.542647726535642e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.00019519501944897103, + "loss": 0.0141, "step": 138490 }, { - "epoch": 1.5, - "learning_rate": 7.541026139975351e-05, - "loss": 0.0099, + "epoch": 0.7, + "learning_rate": 0.00019518745175595704, + "loss": 0.0126, "step": 138500 }, { - "epoch": 1.5, - "learning_rate": 7.53940455341506e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.00019517988406294302, + "loss": 0.0128, "step": 138510 }, { - "epoch": 1.5, - "learning_rate": 7.53778296685477e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.000195172316369929, + "loss": 0.011, "step": 138520 }, { - "epoch": 1.5, - "learning_rate": 7.53616138029448e-05, - "loss": 0.0063, + "epoch": 0.7, + "learning_rate": 0.00019516474867691498, + "loss": 0.0153, "step": 138530 }, { - "epoch": 1.5, - "learning_rate": 7.534539793734188e-05, - "loss": 0.0097, + "epoch": 0.7, + "learning_rate": 0.000195157180983901, + "loss": 0.0141, "step": 138540 }, { - "epoch": 1.5, - "learning_rate": 7.532918207173899e-05, - "loss": 0.0105, + "epoch": 0.7, + "learning_rate": 0.00019514961329088697, + "loss": 0.0116, "step": 138550 }, { - "epoch": 1.5, - "learning_rate": 7.531296620613607e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019514204559787295, + "loss": 0.0118, "step": 138560 }, { - "epoch": 1.5, - "learning_rate": 7.529675034053317e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.00019513447790485896, + "loss": 0.0142, "step": 138570 }, { - "epoch": 1.5, - "learning_rate": 7.528053447493025e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019512691021184494, + "loss": 0.0147, "step": 138580 }, { - "epoch": 1.5, - "learning_rate": 7.526431860932736e-05, - "loss": 0.0094, + "epoch": 0.7, + "learning_rate": 0.00019511934251883092, + "loss": 0.0183, "step": 138590 }, { - "epoch": 1.5, - "learning_rate": 7.524810274372445e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.00019511177482581693, + "loss": 0.0133, "step": 138600 }, { - "epoch": 1.5, - "learning_rate": 7.523188687812155e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.00019510420713280291, + "loss": 0.013, "step": 138610 }, { - "epoch": 1.5, - "learning_rate": 7.521567101251864e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.0001950966394397889, + "loss": 0.012, "step": 138620 }, { - "epoch": 1.5, - "learning_rate": 7.519945514691574e-05, - "loss": 0.0103, + "epoch": 0.7, + "learning_rate": 0.0001950890717467749, + "loss": 0.0123, "step": 138630 }, { - "epoch": 1.5, - "learning_rate": 7.518323928131282e-05, - "loss": 0.0078, + "epoch": 0.7, + "learning_rate": 0.00019508150405376089, + "loss": 0.0172, "step": 138640 }, { - "epoch": 1.5, - "learning_rate": 7.516702341570993e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019507393636074687, + "loss": 0.018, "step": 138650 }, { - "epoch": 1.5, - "learning_rate": 7.515080755010701e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.00019506636866773288, + "loss": 0.0112, "step": 138660 }, { - "epoch": 1.5, - "learning_rate": 7.513459168450412e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019505880097471886, + "loss": 0.0169, "step": 138670 }, { - "epoch": 1.5, - "learning_rate": 7.51183758189012e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019505123328170484, + "loss": 0.0119, "step": 138680 }, { - "epoch": 1.5, - "learning_rate": 7.51021599532983e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.00019504366558869082, + "loss": 0.0108, "step": 138690 }, { - "epoch": 1.5, - "learning_rate": 7.50859440876954e-05, - "loss": 0.0085, + "epoch": 0.7, + "learning_rate": 0.00019503609789567683, + "loss": 0.0136, "step": 138700 }, { - "epoch": 1.5, - "learning_rate": 7.506972822209249e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.0001950285302026628, + "loss": 0.0145, "step": 138710 }, { - "epoch": 1.5, - "learning_rate": 7.505351235648958e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.0001950209625096488, + "loss": 0.0104, "step": 138720 }, { - "epoch": 1.5, - "learning_rate": 7.503729649088667e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.0001950133948166348, + "loss": 0.0128, "step": 138730 }, { - "epoch": 1.5, - "learning_rate": 7.502108062528376e-05, - "loss": 0.0054, + "epoch": 0.7, + "learning_rate": 0.00019500582712362078, + "loss": 0.0139, "step": 138740 }, { - "epoch": 1.5, - "learning_rate": 7.500486475968087e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.00019499825943060676, + "loss": 0.0109, "step": 138750 }, { - "epoch": 1.5, - "learning_rate": 7.498864889407796e-05, - "loss": 0.0118, + "epoch": 0.7, + "learning_rate": 0.00019499069173759277, + "loss": 0.0145, "step": 138760 }, { - "epoch": 1.5, - "learning_rate": 7.497243302847506e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019498312404457875, + "loss": 0.0118, "step": 138770 }, { - "epoch": 1.5, - "learning_rate": 7.495621716287215e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.00019497555635156473, + "loss": 0.013, "step": 138780 }, { - "epoch": 1.5, - "learning_rate": 7.494000129726924e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.00019496798865855074, + "loss": 0.0149, "step": 138790 }, { - "epoch": 1.5, - "learning_rate": 7.492378543166633e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.00019496042096553672, + "loss": 0.012, "step": 138800 }, { - "epoch": 1.5, - "learning_rate": 7.490756956606343e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.0001949528532725227, + "loss": 0.0134, "step": 138810 }, { - "epoch": 1.5, - "learning_rate": 7.489135370046052e-05, - "loss": 0.012, + "epoch": 0.7, + "learning_rate": 0.00019494528557950871, + "loss": 0.0138, "step": 138820 }, { - "epoch": 1.5, - "learning_rate": 7.487513783485761e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.0001949377178864947, + "loss": 0.0132, "step": 138830 }, { - "epoch": 1.5, - "learning_rate": 7.48589219692547e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.00019493015019348068, + "loss": 0.0143, "step": 138840 }, { - "epoch": 1.5, - "learning_rate": 7.484270610365181e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019492258250046669, + "loss": 0.0177, "step": 138850 }, { - "epoch": 1.5, - "learning_rate": 7.48264902380489e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019491501480745267, + "loss": 0.0126, "step": 138860 }, { - "epoch": 1.5, - "learning_rate": 7.4810274372446e-05, - "loss": 0.0102, + "epoch": 0.7, + "learning_rate": 0.00019490744711443865, + "loss": 0.0197, "step": 138870 }, { - "epoch": 1.5, - "learning_rate": 7.479405850684309e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019489987942142463, + "loss": 0.016, "step": 138880 }, { - "epoch": 1.5, - "learning_rate": 7.477784264124018e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.0001948923117284106, + "loss": 0.013, "step": 138890 }, { - "epoch": 1.5, - "learning_rate": 7.476162677563728e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.0001948847440353966, + "loss": 0.0131, "step": 138900 }, { - "epoch": 1.5, - "learning_rate": 7.474541091003437e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.00019487717634238258, + "loss": 0.0136, "step": 138910 }, { - "epoch": 1.5, - "learning_rate": 7.472919504443146e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019486960864936856, + "loss": 0.0137, "step": 138920 }, { - "epoch": 1.5, - "learning_rate": 7.471297917882855e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.00019486204095635457, + "loss": 0.0124, "step": 138930 }, { - "epoch": 1.5, - "learning_rate": 7.469676331322565e-05, - "loss": 0.0064, + "epoch": 0.7, + "learning_rate": 0.00019485447326334055, + "loss": 0.0102, "step": 138940 }, { - "epoch": 1.5, - "learning_rate": 7.468054744762274e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.00019484690557032653, + "loss": 0.0145, "step": 138950 }, { - "epoch": 1.5, - "learning_rate": 7.466433158201985e-05, - "loss": 0.0078, + "epoch": 0.7, + "learning_rate": 0.00019483933787731254, + "loss": 0.0114, "step": 138960 }, { - "epoch": 1.5, - "learning_rate": 7.464811571641694e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019483177018429852, + "loss": 0.0136, "step": 138970 }, { - "epoch": 1.5, - "learning_rate": 7.463189985081403e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.0001948242024912845, + "loss": 0.0131, "step": 138980 }, { - "epoch": 1.5, - "learning_rate": 7.461568398521112e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.0001948166347982705, + "loss": 0.0174, "step": 138990 }, { - "epoch": 1.5, - "learning_rate": 7.459946811960822e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.0001948090671052565, + "loss": 0.0138, "step": 139000 }, { - "epoch": 1.5, - "eval_cer": 0.9215234600972488, - "eval_loss": 0.006560348439961672, - "eval_runtime": 121.2617, - "eval_samples_per_second": 16.493, - "eval_steps_per_second": 4.123, + "epoch": 0.7, + "eval_cer": 0.9144751078837893, + "eval_loss": 0.009447253309190273, + "eval_runtime": 116.7733, + "eval_samples_per_second": 17.127, + "eval_steps_per_second": 4.282, "step": 139000 }, { - "epoch": 1.5, - "learning_rate": 7.458325225400531e-05, - "loss": 0.0064, + "epoch": 0.7, + "learning_rate": 0.00019480149941224247, + "loss": 0.0125, "step": 139010 }, { - "epoch": 1.5, - "learning_rate": 7.45670363884024e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019479393171922848, + "loss": 0.0135, "step": 139020 }, { - "epoch": 1.5, - "learning_rate": 7.45508205227995e-05, - "loss": 0.0058, + "epoch": 0.7, + "learning_rate": 0.00019478636402621446, + "loss": 0.0139, "step": 139030 }, { - "epoch": 1.5, - "learning_rate": 7.453460465719659e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.00019477879633320044, + "loss": 0.0116, "step": 139040 }, { - "epoch": 1.5, - "learning_rate": 7.451838879159368e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.00019477122864018645, + "loss": 0.0139, "step": 139050 }, { - "epoch": 1.5, - "learning_rate": 7.450217292599079e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.00019476366094717243, + "loss": 0.0141, "step": 139060 }, { - "epoch": 1.5, - "learning_rate": 7.448595706038788e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019475609325415841, + "loss": 0.0104, "step": 139070 }, { - "epoch": 1.5, - "learning_rate": 7.446974119478497e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.0001947485255611444, + "loss": 0.0156, "step": 139080 }, { - "epoch": 1.5, - "learning_rate": 7.445352532918206e-05, - "loss": 0.0098, + "epoch": 0.7, + "learning_rate": 0.0001947409578681304, + "loss": 0.0188, "step": 139090 }, { - "epoch": 1.5, - "learning_rate": 7.443730946357916e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.00019473339017511639, + "loss": 0.014, "step": 139100 }, { - "epoch": 1.5, - "learning_rate": 7.442109359797625e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.00019472582248210237, + "loss": 0.0193, "step": 139110 }, { - "epoch": 1.5, - "learning_rate": 7.440487773237334e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019471825478908838, + "loss": 0.0167, "step": 139120 }, { - "epoch": 1.5, - "learning_rate": 7.438866186677044e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019471068709607436, + "loss": 0.0139, "step": 139130 }, { - "epoch": 1.5, - "learning_rate": 7.437244600116753e-05, - "loss": 0.0095, + "epoch": 0.7, + "learning_rate": 0.00019470311940306034, + "loss": 0.0127, "step": 139140 }, { - "epoch": 1.5, - "learning_rate": 7.435623013556462e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019469555171004635, + "loss": 0.0144, "step": 139150 }, { - "epoch": 1.5, - "learning_rate": 7.434001426996171e-05, - "loss": 0.0124, + "epoch": 0.7, + "learning_rate": 0.00019468798401703233, + "loss": 0.0127, "step": 139160 }, { - "epoch": 1.5, - "learning_rate": 7.432379840435882e-05, - "loss": 0.0109, + "epoch": 0.7, + "learning_rate": 0.0001946804163240183, + "loss": 0.0117, "step": 139170 }, { - "epoch": 1.5, - "learning_rate": 7.430758253875591e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019467284863100432, + "loss": 0.0132, "step": 139180 }, { - "epoch": 1.5, - "learning_rate": 7.4291366673153e-05, - "loss": 0.0087, + "epoch": 0.7, + "learning_rate": 0.0001946652809379903, + "loss": 0.0188, "step": 139190 }, { - "epoch": 1.5, - "learning_rate": 7.42751508075501e-05, - "loss": 0.0092, + "epoch": 0.7, + "learning_rate": 0.00019465771324497628, + "loss": 0.0143, "step": 139200 }, { - "epoch": 1.5, - "learning_rate": 7.42589349419472e-05, - "loss": 0.0092, + "epoch": 0.7, + "learning_rate": 0.0001946501455519623, + "loss": 0.0135, "step": 139210 }, { - "epoch": 1.51, - "learning_rate": 7.42427190763443e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.00019464257785894827, + "loss": 0.0121, "step": 139220 }, { - "epoch": 1.51, - "learning_rate": 7.422650321074139e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.00019463501016593425, + "loss": 0.013, "step": 139230 }, { - "epoch": 1.51, - "learning_rate": 7.421028734513848e-05, - "loss": 0.0101, + "epoch": 0.7, + "learning_rate": 0.00019462744247292026, + "loss": 0.0142, "step": 139240 }, { - "epoch": 1.51, - "learning_rate": 7.419407147953558e-05, - "loss": 0.0106, + "epoch": 0.7, + "learning_rate": 0.00019461987477990624, + "loss": 0.016, "step": 139250 }, { - "epoch": 1.51, - "learning_rate": 7.417785561393267e-05, - "loss": 0.0099, + "epoch": 0.7, + "learning_rate": 0.00019461230708689222, + "loss": 0.0141, "step": 139260 }, { - "epoch": 1.51, - "learning_rate": 7.416163974832976e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.0001946047393938782, + "loss": 0.0132, "step": 139270 }, { - "epoch": 1.51, - "learning_rate": 7.414542388272685e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019459717170086421, + "loss": 0.0141, "step": 139280 }, { - "epoch": 1.51, - "learning_rate": 7.412920801712395e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.0001945896040078502, + "loss": 0.0149, "step": 139290 }, { - "epoch": 1.51, - "learning_rate": 7.411299215152104e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.00019458203631483618, + "loss": 0.0111, "step": 139300 }, { - "epoch": 1.51, - "learning_rate": 7.409677628591813e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019457446862182219, + "loss": 0.015, "step": 139310 }, { - "epoch": 1.51, - "learning_rate": 7.408056042031524e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019456690092880817, + "loss": 0.0106, "step": 139320 }, { - "epoch": 1.51, - "learning_rate": 7.406434455471233e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.00019455933323579415, + "loss": 0.0135, "step": 139330 }, { - "epoch": 1.51, - "learning_rate": 7.404812868910942e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019455176554278016, + "loss": 0.0112, "step": 139340 }, { - "epoch": 1.51, - "learning_rate": 7.403191282350652e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019454419784976614, + "loss": 0.0135, "step": 139350 }, { - "epoch": 1.51, - "learning_rate": 7.401569695790361e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.00019453663015675212, + "loss": 0.0117, "step": 139360 }, { - "epoch": 1.51, - "learning_rate": 7.39994810923007e-05, - "loss": 0.0061, + "epoch": 0.7, + "learning_rate": 0.00019452906246373813, + "loss": 0.0133, "step": 139370 }, { - "epoch": 1.51, - "learning_rate": 7.39832652266978e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.0001945214947707241, + "loss": 0.0123, "step": 139380 }, { - "epoch": 1.51, - "learning_rate": 7.396704936109489e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.0001945139270777101, + "loss": 0.0128, "step": 139390 }, { - "epoch": 1.51, - "learning_rate": 7.395083349549198e-05, - "loss": 0.0066, + "epoch": 0.7, + "learning_rate": 0.0001945063593846961, + "loss": 0.0141, "step": 139400 }, { - "epoch": 1.51, - "learning_rate": 7.393461762988907e-05, - "loss": 0.006, + "epoch": 0.7, + "learning_rate": 0.00019449879169168208, + "loss": 0.016, "step": 139410 }, { - "epoch": 1.51, - "learning_rate": 7.391840176428617e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019449122399866806, + "loss": 0.0145, "step": 139420 }, { - "epoch": 1.51, - "learning_rate": 7.390218589868327e-05, - "loss": 0.0116, + "epoch": 0.7, + "learning_rate": 0.00019448365630565404, + "loss": 0.0158, "step": 139430 }, { - "epoch": 1.51, - "learning_rate": 7.388597003308037e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.00019447608861264005, + "loss": 0.0159, "step": 139440 }, { - "epoch": 1.51, - "learning_rate": 7.386975416747746e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.00019446852091962603, + "loss": 0.0126, "step": 139450 }, { - "epoch": 1.51, - "learning_rate": 7.385353830187455e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.00019446095322661202, + "loss": 0.0143, "step": 139460 }, { - "epoch": 1.51, - "learning_rate": 7.383732243627164e-05, - "loss": 0.0092, + "epoch": 0.7, + "learning_rate": 0.00019445338553359802, + "loss": 0.0136, "step": 139470 }, { - "epoch": 1.51, - "learning_rate": 7.382110657066874e-05, - "loss": 0.0087, + "epoch": 0.7, + "learning_rate": 0.000194445817840584, + "loss": 0.0168, "step": 139480 }, { - "epoch": 1.51, - "learning_rate": 7.380489070506583e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.00019443825014757, + "loss": 0.0159, "step": 139490 }, { - "epoch": 1.51, - "learning_rate": 7.378867483946292e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.000194430682454556, + "loss": 0.0118, "step": 139500 }, { - "epoch": 1.51, - "learning_rate": 7.377245897386001e-05, - "loss": 0.01, + "epoch": 0.7, + "learning_rate": 0.00019442311476154198, + "loss": 0.015, "step": 139510 }, { - "epoch": 1.51, - "learning_rate": 7.375624310825711e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.00019441554706852796, + "loss": 0.0125, "step": 139520 }, { - "epoch": 1.51, - "learning_rate": 7.37400272426542e-05, - "loss": 0.0103, + "epoch": 0.7, + "learning_rate": 0.00019440797937551397, + "loss": 0.0141, "step": 139530 }, { - "epoch": 1.51, - "learning_rate": 7.37238113770513e-05, - "loss": 0.0099, + "epoch": 0.7, + "learning_rate": 0.00019440041168249995, + "loss": 0.0133, "step": 139540 }, { - "epoch": 1.51, - "learning_rate": 7.37075955114484e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.00019439284398948593, + "loss": 0.0126, "step": 139550 }, { - "epoch": 1.51, - "learning_rate": 7.369137964584549e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.00019438527629647194, + "loss": 0.0125, "step": 139560 }, { - "epoch": 1.51, - "learning_rate": 7.367516378024258e-05, - "loss": 0.0063, + "epoch": 0.7, + "learning_rate": 0.00019437770860345792, + "loss": 0.013, "step": 139570 }, { - "epoch": 1.51, - "learning_rate": 7.365894791463968e-05, - "loss": 0.0097, + "epoch": 0.7, + "learning_rate": 0.0001943701409104439, + "loss": 0.013, "step": 139580 }, { - "epoch": 1.51, - "learning_rate": 7.364273204903677e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.00019436257321742988, + "loss": 0.0138, "step": 139590 }, { - "epoch": 1.51, - "learning_rate": 7.362651618343386e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.0001943550055244159, + "loss": 0.0157, "step": 139600 }, { - "epoch": 1.51, - "learning_rate": 7.361030031783096e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.00019434743783140187, + "loss": 0.0139, "step": 139610 }, { - "epoch": 1.51, - "learning_rate": 7.359408445222805e-05, - "loss": 0.0095, + "epoch": 0.7, + "learning_rate": 0.00019433987013838785, + "loss": 0.0128, "step": 139620 }, { - "epoch": 1.51, - "learning_rate": 7.357786858662514e-05, - "loss": 0.0102, + "epoch": 0.7, + "learning_rate": 0.00019433230244537386, + "loss": 0.0127, "step": 139630 }, { - "epoch": 1.51, - "learning_rate": 7.356165272102225e-05, - "loss": 0.0092, + "epoch": 0.7, + "learning_rate": 0.00019432473475235984, + "loss": 0.0131, "step": 139640 }, { - "epoch": 1.51, - "learning_rate": 7.354543685541934e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019431716705934583, + "loss": 0.0135, "step": 139650 }, { - "epoch": 1.51, - "learning_rate": 7.352922098981643e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.00019430959936633183, + "loss": 0.0118, "step": 139660 }, { - "epoch": 1.51, - "learning_rate": 7.351300512421353e-05, - "loss": 0.0078, + "epoch": 0.7, + "learning_rate": 0.00019430203167331782, + "loss": 0.0101, "step": 139670 }, { - "epoch": 1.51, - "learning_rate": 7.349678925861062e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.0001942944639803038, + "loss": 0.0125, "step": 139680 }, { - "epoch": 1.51, - "learning_rate": 7.348057339300771e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.0001942868962872898, + "loss": 0.0119, "step": 139690 }, { - "epoch": 1.51, - "learning_rate": 7.34643575274048e-05, - "loss": 0.0093, + "epoch": 0.7, + "learning_rate": 0.0001942793285942758, + "loss": 0.0151, "step": 139700 }, { - "epoch": 1.51, - "learning_rate": 7.34481416618019e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019427176090126177, + "loss": 0.0141, "step": 139710 }, { - "epoch": 1.51, - "learning_rate": 7.343192579619899e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.00019426419320824778, + "loss": 0.0115, "step": 139720 }, { - "epoch": 1.51, - "learning_rate": 7.341570993059608e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.00019425662551523376, + "loss": 0.0163, "step": 139730 }, { - "epoch": 1.51, - "learning_rate": 7.339949406499317e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019424905782221974, + "loss": 0.0122, "step": 139740 }, { - "epoch": 1.51, - "learning_rate": 7.338327819939028e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.00019424149012920575, + "loss": 0.0147, "step": 139750 }, { - "epoch": 1.51, - "learning_rate": 7.336706233378737e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.00019423392243619173, + "loss": 0.0118, "step": 139760 }, { - "epoch": 1.51, - "learning_rate": 7.335084646818447e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.0001942263547431777, + "loss": 0.017, "step": 139770 }, { - "epoch": 1.51, - "learning_rate": 7.333463060258156e-05, - "loss": 0.0063, + "epoch": 0.71, + "learning_rate": 0.0001942187870501637, + "loss": 0.0108, "step": 139780 }, { - "epoch": 1.51, - "learning_rate": 7.331841473697865e-05, - "loss": 0.0098, + "epoch": 0.71, + "learning_rate": 0.0001942112193571497, + "loss": 0.0151, "step": 139790 }, { - "epoch": 1.51, - "learning_rate": 7.330219887137574e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019420365166413568, + "loss": 0.0142, "step": 139800 }, { - "epoch": 1.51, - "learning_rate": 7.328598300577284e-05, - "loss": 0.0096, + "epoch": 0.71, + "learning_rate": 0.00019419608397112166, + "loss": 0.0132, "step": 139810 }, { - "epoch": 1.51, - "learning_rate": 7.326976714016993e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019418851627810767, + "loss": 0.0099, "step": 139820 }, { - "epoch": 1.51, - "learning_rate": 7.325355127456702e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019418094858509365, + "loss": 0.0114, "step": 139830 }, { - "epoch": 1.51, - "learning_rate": 7.323733540896412e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.00019417338089207964, + "loss": 0.0124, "step": 139840 }, { - "epoch": 1.51, - "learning_rate": 7.322111954336121e-05, - "loss": 0.0065, + "epoch": 0.71, + "learning_rate": 0.00019416581319906564, + "loss": 0.0111, "step": 139850 }, { - "epoch": 1.51, - "learning_rate": 7.320490367775831e-05, - "loss": 0.0098, + "epoch": 0.71, + "learning_rate": 0.00019415824550605163, + "loss": 0.0131, "step": 139860 }, { - "epoch": 1.51, - "learning_rate": 7.318868781215541e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.0001941506778130376, + "loss": 0.0137, "step": 139870 }, { - "epoch": 1.51, - "learning_rate": 7.31724719465525e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.00019414311012002362, + "loss": 0.0105, "step": 139880 }, { - "epoch": 1.51, - "learning_rate": 7.315625608094959e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.0001941355424270096, + "loss": 0.0149, "step": 139890 }, { - "epoch": 1.51, - "learning_rate": 7.314004021534669e-05, - "loss": 0.0101, + "epoch": 0.71, + "learning_rate": 0.00019412797473399558, + "loss": 0.0131, "step": 139900 }, { - "epoch": 1.51, - "learning_rate": 7.312382434974379e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.0001941204070409816, + "loss": 0.0176, "step": 139910 }, { - "epoch": 1.51, - "learning_rate": 7.310760848414088e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019411283934796757, + "loss": 0.0124, "step": 139920 }, { - "epoch": 1.51, - "learning_rate": 7.309139261853798e-05, - "loss": 0.0114, + "epoch": 0.71, + "learning_rate": 0.00019410527165495355, + "loss": 0.0143, "step": 139930 }, { - "epoch": 1.51, - "learning_rate": 7.307517675293507e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019409770396193953, + "loss": 0.0131, "step": 139940 }, { - "epoch": 1.51, - "learning_rate": 7.305896088733216e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019409013626892554, + "loss": 0.0117, "step": 139950 }, { - "epoch": 1.51, - "learning_rate": 7.304274502172926e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019408256857591152, + "loss": 0.0114, "step": 139960 }, { - "epoch": 1.51, - "learning_rate": 7.302652915612635e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.0001940750008828975, + "loss": 0.0117, "step": 139970 }, { - "epoch": 1.51, - "learning_rate": 7.301031329052344e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.0001940674331898835, + "loss": 0.0121, "step": 139980 }, { - "epoch": 1.51, - "learning_rate": 7.299409742492053e-05, - "loss": 0.0112, + "epoch": 0.71, + "learning_rate": 0.0001940598654968695, + "loss": 0.0126, "step": 139990 }, { - "epoch": 1.51, - "learning_rate": 7.297788155931763e-05, - "loss": 0.009, + "epoch": 0.71, + "learning_rate": 0.00019405229780385547, + "loss": 0.0152, "step": 140000 }, { - "epoch": 1.51, - "eval_cer": 0.9215503867888964, - "eval_loss": 0.006375947035849094, - "eval_runtime": 121.158, - "eval_samples_per_second": 16.507, - "eval_steps_per_second": 4.127, + "epoch": 0.71, + "eval_cer": 0.9144741374876638, + "eval_loss": 0.009188586845993996, + "eval_runtime": 116.7594, + "eval_samples_per_second": 17.129, + "eval_steps_per_second": 4.282, "step": 140000 }, { - "epoch": 1.51, - "learning_rate": 7.296166569371473e-05, - "loss": 0.0093, + "epoch": 0.71, + "learning_rate": 0.00019404473011084148, + "loss": 0.015, "step": 140010 }, { - "epoch": 1.51, - "learning_rate": 7.294544982811183e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019403716241782746, + "loss": 0.0123, "step": 140020 }, { - "epoch": 1.51, - "learning_rate": 7.292923396250892e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019402959472481345, + "loss": 0.0155, "step": 140030 }, { - "epoch": 1.51, - "learning_rate": 7.291301809690601e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019402202703179945, + "loss": 0.0138, "step": 140040 }, { - "epoch": 1.51, - "learning_rate": 7.28968022313031e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.00019401445933878544, + "loss": 0.0173, "step": 140050 }, { - "epoch": 1.51, - "learning_rate": 7.28805863657002e-05, - "loss": 0.0111, + "epoch": 0.71, + "learning_rate": 0.00019400689164577142, + "loss": 0.0135, "step": 140060 }, { - "epoch": 1.51, - "learning_rate": 7.286437050009729e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019399932395275743, + "loss": 0.0115, "step": 140070 }, { - "epoch": 1.51, - "learning_rate": 7.284815463449438e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.0001939917562597434, + "loss": 0.0169, "step": 140080 }, { - "epoch": 1.51, - "learning_rate": 7.283193876889147e-05, - "loss": 0.0094, + "epoch": 0.71, + "learning_rate": 0.0001939841885667294, + "loss": 0.0127, "step": 140090 }, { - "epoch": 1.51, - "learning_rate": 7.281572290328857e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.00019397662087371537, + "loss": 0.0138, "step": 140100 }, { - "epoch": 1.51, - "learning_rate": 7.279950703768566e-05, - "loss": 0.0093, + "epoch": 0.71, + "learning_rate": 0.00019396905318070138, + "loss": 0.0135, "step": 140110 }, { - "epoch": 1.51, - "learning_rate": 7.278329117208277e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.00019396148548768736, + "loss": 0.0114, "step": 140120 }, { - "epoch": 1.51, - "learning_rate": 7.276707530647986e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.00019395391779467334, + "loss": 0.015, "step": 140130 }, { - "epoch": 1.51, - "learning_rate": 7.275085944087695e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.00019394635010165935, + "loss": 0.0135, "step": 140140 }, { - "epoch": 1.52, - "learning_rate": 7.273464357527404e-05, - "loss": 0.0105, + "epoch": 0.71, + "learning_rate": 0.0001939387824086453, + "loss": 0.0129, "step": 140150 }, { - "epoch": 1.52, - "learning_rate": 7.271842770967114e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019393121471563129, + "loss": 0.0104, "step": 140160 }, { - "epoch": 1.52, - "learning_rate": 7.270221184406823e-05, - "loss": 0.0062, + "epoch": 0.71, + "learning_rate": 0.00019392364702261727, + "loss": 0.0169, "step": 140170 }, { - "epoch": 1.52, - "learning_rate": 7.268599597846532e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019391607932960328, + "loss": 0.0121, "step": 140180 }, { - "epoch": 1.52, - "learning_rate": 7.266978011286242e-05, - "loss": 0.0064, + "epoch": 0.71, + "learning_rate": 0.00019390851163658926, + "loss": 0.0145, "step": 140190 }, { - "epoch": 1.52, - "learning_rate": 7.265356424725951e-05, - "loss": 0.0103, + "epoch": 0.71, + "learning_rate": 0.00019390094394357524, + "loss": 0.011, "step": 140200 }, { - "epoch": 1.52, - "learning_rate": 7.26373483816566e-05, - "loss": 0.0096, + "epoch": 0.71, + "learning_rate": 0.00019389337625056125, + "loss": 0.014, "step": 140210 }, { - "epoch": 1.52, - "learning_rate": 7.262113251605371e-05, - "loss": 0.0063, + "epoch": 0.71, + "learning_rate": 0.00019388580855754723, + "loss": 0.0134, "step": 140220 }, { - "epoch": 1.52, - "learning_rate": 7.26049166504508e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.0001938782408645332, + "loss": 0.0139, "step": 140230 }, { - "epoch": 1.52, - "learning_rate": 7.258870078484789e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019387067317151922, + "loss": 0.0191, "step": 140240 }, { - "epoch": 1.52, - "learning_rate": 7.257248491924499e-05, - "loss": 0.0094, + "epoch": 0.71, + "learning_rate": 0.0001938631054785052, + "loss": 0.0126, "step": 140250 }, { - "epoch": 1.52, - "learning_rate": 7.255626905364208e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.00019385553778549118, + "loss": 0.0164, "step": 140260 }, { - "epoch": 1.52, - "learning_rate": 7.254005318803917e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.0001938479700924772, + "loss": 0.0151, "step": 140270 }, { - "epoch": 1.52, - "learning_rate": 7.252383732243626e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.00019384040239946317, + "loss": 0.0122, "step": 140280 }, { - "epoch": 1.52, - "learning_rate": 7.250762145683336e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019383283470644915, + "loss": 0.014, "step": 140290 }, { - "epoch": 1.52, - "learning_rate": 7.249140559123045e-05, - "loss": 0.0092, + "epoch": 0.71, + "learning_rate": 0.00019382526701343516, + "loss": 0.0121, "step": 140300 }, { - "epoch": 1.52, - "learning_rate": 7.247518972562754e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019381769932042114, + "loss": 0.012, "step": 140310 }, { - "epoch": 1.52, - "learning_rate": 7.245897386002464e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019381013162740712, + "loss": 0.0141, "step": 140320 }, { - "epoch": 1.52, - "learning_rate": 7.244275799442174e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.0001938025639343931, + "loss": 0.0135, "step": 140330 }, { - "epoch": 1.52, - "learning_rate": 7.242654212881883e-05, - "loss": 0.0092, + "epoch": 0.71, + "learning_rate": 0.00019379499624137911, + "loss": 0.0094, "step": 140340 }, { - "epoch": 1.52, - "learning_rate": 7.241032626321593e-05, - "loss": 0.0096, + "epoch": 0.71, + "learning_rate": 0.0001937874285483651, + "loss": 0.0128, "step": 140350 }, { - "epoch": 1.52, - "learning_rate": 7.239411039761302e-05, - "loss": 0.0064, + "epoch": 0.71, + "learning_rate": 0.00019377986085535108, + "loss": 0.0149, "step": 140360 }, { - "epoch": 1.52, - "learning_rate": 7.237789453201011e-05, - "loss": 0.0086, + "epoch": 0.71, + "learning_rate": 0.00019377229316233709, + "loss": 0.0177, "step": 140370 }, { - "epoch": 1.52, - "learning_rate": 7.23616786664072e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019376472546932307, + "loss": 0.0164, "step": 140380 }, { - "epoch": 1.52, - "learning_rate": 7.23454628008043e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019375715777630905, + "loss": 0.0127, "step": 140390 }, { - "epoch": 1.52, - "learning_rate": 7.232924693520139e-05, - "loss": 0.0086, + "epoch": 0.71, + "learning_rate": 0.00019374959008329506, + "loss": 0.0131, "step": 140400 }, { - "epoch": 1.52, - "learning_rate": 7.231303106959848e-05, - "loss": 0.0117, + "epoch": 0.71, + "learning_rate": 0.00019374202239028104, + "loss": 0.013, "step": 140410 }, { - "epoch": 1.52, - "learning_rate": 7.229681520399558e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019373445469726702, + "loss": 0.0133, "step": 140420 }, { - "epoch": 1.52, - "learning_rate": 7.228059933839267e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019372688700425303, + "loss": 0.014, "step": 140430 }, { - "epoch": 1.52, - "learning_rate": 7.226438347278978e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.000193719319311239, + "loss": 0.013, "step": 140440 }, { - "epoch": 1.52, - "learning_rate": 7.224816760718687e-05, - "loss": 0.0064, + "epoch": 0.71, + "learning_rate": 0.000193711751618225, + "loss": 0.0145, "step": 140450 }, { - "epoch": 1.52, - "learning_rate": 7.223195174158396e-05, - "loss": 0.0086, + "epoch": 0.71, + "learning_rate": 0.000193704183925211, + "loss": 0.0134, "step": 140460 }, { - "epoch": 1.52, - "learning_rate": 7.221573587598105e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.00019369661623219698, + "loss": 0.0139, "step": 140470 }, { - "epoch": 1.52, - "learning_rate": 7.219952001037815e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.00019368904853918296, + "loss": 0.0159, "step": 140480 }, { - "epoch": 1.52, - "learning_rate": 7.218330414477524e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019368148084616894, + "loss": 0.0162, "step": 140490 }, { - "epoch": 1.52, - "learning_rate": 7.216708827917233e-05, - "loss": 0.0094, + "epoch": 0.71, + "learning_rate": 0.00019367391315315495, + "loss": 0.0142, "step": 140500 }, { - "epoch": 1.52, - "learning_rate": 7.215087241356942e-05, - "loss": 0.0092, + "epoch": 0.71, + "learning_rate": 0.00019366634546014093, + "loss": 0.0115, "step": 140510 }, { - "epoch": 1.52, - "learning_rate": 7.213465654796652e-05, - "loss": 0.0063, + "epoch": 0.71, + "learning_rate": 0.00019365877776712692, + "loss": 0.0145, "step": 140520 }, { - "epoch": 1.52, - "learning_rate": 7.211844068236361e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019365121007411292, + "loss": 0.0145, "step": 140530 }, { - "epoch": 1.52, - "learning_rate": 7.21022248167607e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.0001936436423810989, + "loss": 0.0166, "step": 140540 }, { - "epoch": 1.52, - "learning_rate": 7.208600895115781e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.0001936360746880849, + "loss": 0.0129, "step": 140550 }, { - "epoch": 1.52, - "learning_rate": 7.20697930855549e-05, - "loss": 0.006, + "epoch": 0.71, + "learning_rate": 0.0001936285069950709, + "loss": 0.0117, "step": 140560 }, { - "epoch": 1.52, - "learning_rate": 7.2053577219952e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019362093930205688, + "loss": 0.0149, "step": 140570 }, { - "epoch": 1.52, - "learning_rate": 7.203736135434909e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019361337160904286, + "loss": 0.0128, "step": 140580 }, { - "epoch": 1.52, - "learning_rate": 7.202114548874618e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019360580391602887, + "loss": 0.0128, "step": 140590 }, { - "epoch": 1.52, - "learning_rate": 7.200492962314327e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019359823622301485, + "loss": 0.0126, "step": 140600 }, { - "epoch": 1.52, - "learning_rate": 7.198871375754037e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019359066853000083, + "loss": 0.0108, "step": 140610 }, { - "epoch": 1.52, - "learning_rate": 7.197249789193746e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019358310083698684, + "loss": 0.0111, "step": 140620 }, { - "epoch": 1.52, - "learning_rate": 7.195628202633456e-05, - "loss": 0.006, + "epoch": 0.71, + "learning_rate": 0.00019357553314397282, + "loss": 0.0137, "step": 140630 }, { - "epoch": 1.52, - "learning_rate": 7.194006616073166e-05, - "loss": 0.0092, + "epoch": 0.71, + "learning_rate": 0.0001935679654509588, + "loss": 0.0139, "step": 140640 }, { - "epoch": 1.52, - "learning_rate": 7.192385029512875e-05, - "loss": 0.0053, + "epoch": 0.71, + "learning_rate": 0.0001935603977579448, + "loss": 0.0156, "step": 140650 }, { - "epoch": 1.52, - "learning_rate": 7.190763442952584e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.0001935528300649308, + "loss": 0.0108, "step": 140660 }, { - "epoch": 1.52, - "learning_rate": 7.189141856392294e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019354526237191677, + "loss": 0.0127, "step": 140670 }, { - "epoch": 1.52, - "learning_rate": 7.187520269832003e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019353769467890275, + "loss": 0.0103, "step": 140680 }, { - "epoch": 1.52, - "learning_rate": 7.185898683271713e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019353012698588876, + "loss": 0.0114, "step": 140690 }, { - "epoch": 1.52, - "learning_rate": 7.184277096711423e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019352255929287474, + "loss": 0.0127, "step": 140700 }, { - "epoch": 1.52, - "learning_rate": 7.182655510151132e-05, - "loss": 0.0065, + "epoch": 0.71, + "learning_rate": 0.00019351499159986073, + "loss": 0.0139, "step": 140710 }, { - "epoch": 1.52, - "learning_rate": 7.181033923590841e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.00019350742390684673, + "loss": 0.015, "step": 140720 }, { - "epoch": 1.52, - "learning_rate": 7.17941233703055e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.00019349985621383272, + "loss": 0.0135, "step": 140730 }, { - "epoch": 1.52, - "learning_rate": 7.17779075047026e-05, - "loss": 0.01, + "epoch": 0.71, + "learning_rate": 0.0001934922885208187, + "loss": 0.0119, "step": 140740 }, { - "epoch": 1.52, - "learning_rate": 7.176169163909969e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.0001934847208278047, + "loss": 0.0116, "step": 140750 }, { - "epoch": 1.52, - "learning_rate": 7.174547577349678e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.0001934771531347907, + "loss": 0.0139, "step": 140760 }, { - "epoch": 1.52, - "learning_rate": 7.172925990789388e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.00019346958544177667, + "loss": 0.0136, "step": 140770 }, { - "epoch": 1.52, - "learning_rate": 7.171304404229097e-05, - "loss": 0.0119, + "epoch": 0.71, + "learning_rate": 0.00019346201774876268, + "loss": 0.011, "step": 140780 }, { - "epoch": 1.52, - "learning_rate": 7.169682817668806e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019345445005574866, + "loss": 0.0107, "step": 140790 }, { - "epoch": 1.52, - "learning_rate": 7.168061231108517e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019344688236273464, + "loss": 0.0098, "step": 140800 }, { - "epoch": 1.52, - "learning_rate": 7.166439644548226e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019343931466972065, + "loss": 0.0113, "step": 140810 }, { - "epoch": 1.52, - "learning_rate": 7.164818057987935e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.00019343174697670663, + "loss": 0.0161, "step": 140820 }, { - "epoch": 1.52, - "learning_rate": 7.163196471427645e-05, - "loss": 0.0088, + "epoch": 0.71, + "learning_rate": 0.0001934241792836926, + "loss": 0.0159, "step": 140830 }, { - "epoch": 1.52, - "learning_rate": 7.161574884867354e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.0001934166115906786, + "loss": 0.013, "step": 140840 }, { - "epoch": 1.52, - "learning_rate": 7.159953298307063e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.0001934090438976646, + "loss": 0.0135, "step": 140850 }, { - "epoch": 1.52, - "learning_rate": 7.158331711746772e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019340147620465058, + "loss": 0.0126, "step": 140860 }, { - "epoch": 1.52, - "learning_rate": 7.156710125186482e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019339390851163656, + "loss": 0.0128, "step": 140870 }, { - "epoch": 1.52, - "learning_rate": 7.155088538626191e-05, - "loss": 0.0103, + "epoch": 0.71, + "learning_rate": 0.00019338634081862257, + "loss": 0.0126, "step": 140880 }, { - "epoch": 1.52, - "learning_rate": 7.1534669520659e-05, - "loss": 0.0053, + "epoch": 0.71, + "learning_rate": 0.00019337877312560855, + "loss": 0.0095, "step": 140890 }, { - "epoch": 1.52, - "learning_rate": 7.15184536550561e-05, - "loss": 0.0094, + "epoch": 0.71, + "learning_rate": 0.00019337120543259454, + "loss": 0.014, "step": 140900 }, { - "epoch": 1.52, - "learning_rate": 7.15022377894532e-05, - "loss": 0.0086, + "epoch": 0.71, + "learning_rate": 0.00019336363773958054, + "loss": 0.0139, "step": 140910 }, { - "epoch": 1.52, - "learning_rate": 7.14860219238503e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019335607004656653, + "loss": 0.0146, "step": 140920 }, { - "epoch": 1.52, - "learning_rate": 7.146980605824739e-05, - "loss": 0.0064, + "epoch": 0.71, + "learning_rate": 0.0001933485023535525, + "loss": 0.0119, "step": 140930 }, { - "epoch": 1.52, - "learning_rate": 7.145359019264448e-05, - "loss": 0.0088, + "epoch": 0.71, + "learning_rate": 0.00019334093466053852, + "loss": 0.0132, "step": 140940 }, { - "epoch": 1.52, - "learning_rate": 7.143737432704157e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.0001933333669675245, + "loss": 0.0131, "step": 140950 }, { - "epoch": 1.52, - "learning_rate": 7.142115846143867e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019332579927451048, + "loss": 0.0132, "step": 140960 }, { - "epoch": 1.52, - "learning_rate": 7.140494259583576e-05, - "loss": 0.0088, + "epoch": 0.71, + "learning_rate": 0.0001933182315814965, + "loss": 0.0111, "step": 140970 }, { - "epoch": 1.52, - "learning_rate": 7.138872673023285e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.00019331066388848247, + "loss": 0.0155, "step": 140980 }, { - "epoch": 1.52, - "learning_rate": 7.137251086462994e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019330309619546845, + "loss": 0.0134, "step": 140990 }, { - "epoch": 1.52, - "learning_rate": 7.135629499902704e-05, - "loss": 0.0062, + "epoch": 0.71, + "learning_rate": 0.00019329552850245443, + "loss": 0.0156, "step": 141000 }, { - "epoch": 1.52, - "eval_cer": 0.9215347519356817, - "eval_loss": 0.006414701230823994, - "eval_runtime": 121.2563, - "eval_samples_per_second": 16.494, - "eval_steps_per_second": 4.123, + "epoch": 0.71, + "eval_cer": 0.9144789894682909, + "eval_loss": 0.009155085310339928, + "eval_runtime": 116.8383, + "eval_samples_per_second": 17.118, + "eval_steps_per_second": 4.279, "step": 141000 }, { - "epoch": 1.52, - "learning_rate": 7.134007913342413e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019328796080944044, + "loss": 0.0143, "step": 141010 }, { - "epoch": 1.52, - "learning_rate": 7.132386326782124e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019328039311642642, + "loss": 0.0152, "step": 141020 }, { - "epoch": 1.52, - "learning_rate": 7.130764740221833e-05, - "loss": 0.0101, + "epoch": 0.71, + "learning_rate": 0.0001932728254234124, + "loss": 0.0157, "step": 141030 }, { - "epoch": 1.52, - "learning_rate": 7.129143153661542e-05, - "loss": 0.0109, + "epoch": 0.71, + "learning_rate": 0.0001932652577303984, + "loss": 0.0117, "step": 141040 }, { - "epoch": 1.52, - "learning_rate": 7.127521567101251e-05, - "loss": 0.009, + "epoch": 0.71, + "learning_rate": 0.0001932576900373844, + "loss": 0.0128, "step": 141050 }, { - "epoch": 1.52, - "learning_rate": 7.12589998054096e-05, - "loss": 0.0088, + "epoch": 0.71, + "learning_rate": 0.00019325012234437037, + "loss": 0.0142, "step": 141060 }, { - "epoch": 1.53, - "learning_rate": 7.12427839398067e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019324255465135638, + "loss": 0.0126, "step": 141070 }, { - "epoch": 1.53, - "learning_rate": 7.122656807420379e-05, - "loss": 0.0059, + "epoch": 0.71, + "learning_rate": 0.00019323498695834236, + "loss": 0.0138, "step": 141080 }, { - "epoch": 1.53, - "learning_rate": 7.121035220860088e-05, - "loss": 0.0065, + "epoch": 0.71, + "learning_rate": 0.00019322741926532835, + "loss": 0.0145, "step": 141090 }, { - "epoch": 1.53, - "learning_rate": 7.119413634299798e-05, - "loss": 0.0091, + "epoch": 0.71, + "learning_rate": 0.00019321985157231435, + "loss": 0.0108, "step": 141100 }, { - "epoch": 1.53, - "learning_rate": 7.117792047739507e-05, - "loss": 0.0109, + "epoch": 0.71, + "learning_rate": 0.00019321228387930034, + "loss": 0.0143, "step": 141110 }, { - "epoch": 1.53, - "learning_rate": 7.116170461179216e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019320471618628632, + "loss": 0.012, "step": 141120 }, { - "epoch": 1.53, - "learning_rate": 7.114548874618927e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.00019319714849327233, + "loss": 0.0135, "step": 141130 }, { - "epoch": 1.53, - "learning_rate": 7.112927288058636e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.0001931895808002583, + "loss": 0.0145, "step": 141140 }, { - "epoch": 1.53, - "learning_rate": 7.111305701498345e-05, - "loss": 0.0088, + "epoch": 0.71, + "learning_rate": 0.0001931820131072443, + "loss": 0.0112, "step": 141150 }, { - "epoch": 1.53, - "learning_rate": 7.109684114938055e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019317444541423027, + "loss": 0.0124, "step": 141160 }, { - "epoch": 1.53, - "learning_rate": 7.108062528377764e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019316687772121628, + "loss": 0.0108, "step": 141170 }, { - "epoch": 1.53, - "learning_rate": 7.106440941817473e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.00019315931002820226, + "loss": 0.0124, "step": 141180 }, { - "epoch": 1.53, - "learning_rate": 7.104819355257183e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019315174233518824, + "loss": 0.0145, "step": 141190 }, { - "epoch": 1.53, - "learning_rate": 7.103197768696892e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019314417464217425, + "loss": 0.0142, "step": 141200 }, { - "epoch": 1.53, - "learning_rate": 7.101576182136601e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.00019313660694916023, + "loss": 0.0146, "step": 141210 }, { - "epoch": 1.53, - "learning_rate": 7.09995459557631e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.0001931290392561462, + "loss": 0.0126, "step": 141220 }, { - "epoch": 1.53, - "learning_rate": 7.098333009016021e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019312147156313222, + "loss": 0.0134, "step": 141230 }, { - "epoch": 1.53, - "learning_rate": 7.09671142245573e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.0001931139038701182, + "loss": 0.0142, "step": 141240 }, { - "epoch": 1.53, - "learning_rate": 7.09508983589544e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019310633617710418, + "loss": 0.0144, "step": 141250 }, { - "epoch": 1.53, - "learning_rate": 7.093468249335149e-05, - "loss": 0.0055, + "epoch": 0.71, + "learning_rate": 0.0001930987684840902, + "loss": 0.0141, "step": 141260 }, { - "epoch": 1.53, - "learning_rate": 7.091846662774858e-05, - "loss": 0.0062, + "epoch": 0.71, + "learning_rate": 0.00019309120079107617, + "loss": 0.0141, "step": 141270 }, { - "epoch": 1.53, - "learning_rate": 7.090225076214567e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.00019308363309806216, + "loss": 0.0135, "step": 141280 }, { - "epoch": 1.53, - "learning_rate": 7.088603489654277e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.00019307606540504816, + "loss": 0.0129, "step": 141290 }, { - "epoch": 1.53, - "learning_rate": 7.086981903093986e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.00019306849771203415, + "loss": 0.0113, "step": 141300 }, { - "epoch": 1.53, - "learning_rate": 7.085360316533695e-05, - "loss": 0.0054, + "epoch": 0.71, + "learning_rate": 0.00019306093001902013, + "loss": 0.0134, "step": 141310 }, { - "epoch": 1.53, - "learning_rate": 7.083738729973404e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019305336232600614, + "loss": 0.0137, "step": 141320 }, { - "epoch": 1.53, - "learning_rate": 7.082117143413114e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.00019304579463299212, + "loss": 0.0137, "step": 141330 }, { - "epoch": 1.53, - "learning_rate": 7.080495556852824e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.0001930382269399781, + "loss": 0.0123, "step": 141340 }, { - "epoch": 1.53, - "learning_rate": 7.078873970292534e-05, - "loss": 0.0065, + "epoch": 0.71, + "learning_rate": 0.00019303065924696408, + "loss": 0.0129, "step": 141350 }, { - "epoch": 1.53, - "learning_rate": 7.077252383732243e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.0001930230915539501, + "loss": 0.0136, "step": 141360 }, { - "epoch": 1.53, - "learning_rate": 7.075630797171952e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.00019301552386093607, + "loss": 0.0127, "step": 141370 }, { - "epoch": 1.53, - "learning_rate": 7.074009210611663e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019300795616792205, + "loss": 0.0119, "step": 141380 }, { - "epoch": 1.53, - "learning_rate": 7.072387624051372e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019300038847490806, + "loss": 0.0146, "step": 141390 }, { - "epoch": 1.53, - "learning_rate": 7.070766037491081e-05, - "loss": 0.0059, + "epoch": 0.71, + "learning_rate": 0.00019299282078189401, + "loss": 0.0123, "step": 141400 }, { - "epoch": 1.53, - "learning_rate": 7.06914445093079e-05, - "loss": 0.0063, + "epoch": 0.71, + "learning_rate": 0.00019298525308888, + "loss": 0.0107, "step": 141410 }, { - "epoch": 1.53, - "learning_rate": 7.0675228643705e-05, - "loss": 0.0093, + "epoch": 0.71, + "learning_rate": 0.00019297768539586598, + "loss": 0.0132, "step": 141420 }, { - "epoch": 1.53, - "learning_rate": 7.065901277810209e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019297011770285199, + "loss": 0.0157, "step": 141430 }, { - "epoch": 1.53, - "learning_rate": 7.064279691249918e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019296255000983797, + "loss": 0.0114, "step": 141440 }, { - "epoch": 1.53, - "learning_rate": 7.062658104689628e-05, - "loss": 0.0088, + "epoch": 0.71, + "learning_rate": 0.00019295498231682395, + "loss": 0.0147, "step": 141450 }, { - "epoch": 1.53, - "learning_rate": 7.061036518129337e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.00019294741462380996, + "loss": 0.0173, "step": 141460 }, { - "epoch": 1.53, - "learning_rate": 7.059414931569046e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019293984693079594, + "loss": 0.0122, "step": 141470 }, { - "epoch": 1.53, - "learning_rate": 7.057793345008756e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.00019293227923778192, + "loss": 0.0114, "step": 141480 }, { - "epoch": 1.53, - "learning_rate": 7.056171758448466e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.00019292471154476793, + "loss": 0.0129, "step": 141490 }, { - "epoch": 1.53, - "learning_rate": 7.054550171888175e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.0001929171438517539, + "loss": 0.0169, "step": 141500 }, { - "epoch": 1.53, - "learning_rate": 7.052928585327885e-05, - "loss": 0.0076, + "epoch": 0.71, + "learning_rate": 0.0001929095761587399, + "loss": 0.0118, "step": 141510 }, { - "epoch": 1.53, - "learning_rate": 7.051306998767594e-05, - "loss": 0.0101, + "epoch": 0.71, + "learning_rate": 0.0001929020084657259, + "loss": 0.014, "step": 141520 }, { - "epoch": 1.53, - "learning_rate": 7.049685412207303e-05, - "loss": 0.0061, + "epoch": 0.71, + "learning_rate": 0.00019289444077271188, + "loss": 0.0137, "step": 141530 }, { - "epoch": 1.53, - "learning_rate": 7.048063825647013e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.00019288687307969786, + "loss": 0.0142, "step": 141540 }, { - "epoch": 1.53, - "learning_rate": 7.046442239086722e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019287930538668384, + "loss": 0.0145, "step": 141550 }, { - "epoch": 1.53, - "learning_rate": 7.044820652526431e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.00019287173769366985, + "loss": 0.0126, "step": 141560 }, { - "epoch": 1.53, - "learning_rate": 7.04319906596614e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.00019286417000065583, + "loss": 0.0119, "step": 141570 }, { - "epoch": 1.53, - "learning_rate": 7.04157747940585e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.00019285660230764182, + "loss": 0.0123, "step": 141580 }, { - "epoch": 1.53, - "learning_rate": 7.039955892845559e-05, - "loss": 0.0057, + "epoch": 0.71, + "learning_rate": 0.00019284903461462782, + "loss": 0.013, "step": 141590 }, { - "epoch": 1.53, - "learning_rate": 7.03833430628527e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.0001928414669216138, + "loss": 0.0117, "step": 141600 }, { - "epoch": 1.53, - "learning_rate": 7.036712719724979e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.0001928338992285998, + "loss": 0.0123, "step": 141610 }, { - "epoch": 1.53, - "learning_rate": 7.035091133164688e-05, - "loss": 0.0063, + "epoch": 0.71, + "learning_rate": 0.0001928263315355858, + "loss": 0.0122, "step": 141620 }, { - "epoch": 1.53, - "learning_rate": 7.033469546604397e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.00019281876384257178, + "loss": 0.0144, "step": 141630 }, { - "epoch": 1.53, - "learning_rate": 7.031847960044107e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.00019281119614955776, + "loss": 0.0118, "step": 141640 }, { - "epoch": 1.53, - "learning_rate": 7.030226373483816e-05, - "loss": 0.0123, + "epoch": 0.71, + "learning_rate": 0.00019280362845654377, + "loss": 0.0139, "step": 141650 }, { - "epoch": 1.53, - "learning_rate": 7.028604786923525e-05, - "loss": 0.0061, + "epoch": 0.71, + "learning_rate": 0.00019279606076352975, + "loss": 0.0135, "step": 141660 }, { - "epoch": 1.53, - "learning_rate": 7.026983200363235e-05, - "loss": 0.0059, + "epoch": 0.71, + "learning_rate": 0.00019278849307051573, + "loss": 0.0124, "step": 141670 }, { - "epoch": 1.53, - "learning_rate": 7.025361613802944e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019278092537750174, + "loss": 0.0122, "step": 141680 }, { - "epoch": 1.53, - "learning_rate": 7.023740027242653e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019277335768448772, + "loss": 0.0108, "step": 141690 }, { - "epoch": 1.53, - "learning_rate": 7.022118440682362e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.0001927657899914737, + "loss": 0.0142, "step": 141700 }, { - "epoch": 1.53, - "learning_rate": 7.020496854122073e-05, - "loss": 0.0086, + "epoch": 0.71, + "learning_rate": 0.0001927582222984597, + "loss": 0.0109, "step": 141710 }, { - "epoch": 1.53, - "learning_rate": 7.018875267561782e-05, - "loss": 0.0076, + "epoch": 0.71, + "learning_rate": 0.0001927506546054457, + "loss": 0.0122, "step": 141720 }, { - "epoch": 1.53, - "learning_rate": 7.017253681001492e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019274308691243167, + "loss": 0.0158, "step": 141730 }, { - "epoch": 1.53, - "learning_rate": 7.015632094441201e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019273551921941765, + "loss": 0.0124, "step": 141740 }, { - "epoch": 1.53, - "learning_rate": 7.01401050788091e-05, - "loss": 0.0094, + "epoch": 0.72, + "learning_rate": 0.00019272795152640366, + "loss": 0.0136, "step": 141750 }, { - "epoch": 1.53, - "learning_rate": 7.01238892132062e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019272038383338964, + "loss": 0.0113, "step": 141760 }, { - "epoch": 1.53, - "learning_rate": 7.010767334760329e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.00019271281614037563, + "loss": 0.0123, "step": 141770 }, { - "epoch": 1.53, - "learning_rate": 7.009145748200038e-05, - "loss": 0.0089, + "epoch": 0.72, + "learning_rate": 0.00019270524844736163, + "loss": 0.0123, "step": 141780 }, { - "epoch": 1.53, - "learning_rate": 7.007524161639747e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019269768075434762, + "loss": 0.0114, "step": 141790 }, { - "epoch": 1.53, - "learning_rate": 7.005902575079456e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.0001926901130613336, + "loss": 0.0109, "step": 141800 }, { - "epoch": 1.53, - "learning_rate": 7.004280988519167e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.0001926825453683196, + "loss": 0.0136, "step": 141810 }, { - "epoch": 1.53, - "learning_rate": 7.002659401958876e-05, - "loss": 0.0099, + "epoch": 0.72, + "learning_rate": 0.0001926749776753056, + "loss": 0.0123, "step": 141820 }, { - "epoch": 1.53, - "learning_rate": 7.001037815398586e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.00019266740998229157, + "loss": 0.0145, "step": 141830 }, { - "epoch": 1.53, - "learning_rate": 6.999416228838295e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019265984228927758, + "loss": 0.0155, "step": 141840 }, { - "epoch": 1.53, - "learning_rate": 6.997794642278004e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.00019265227459626356, + "loss": 0.0221, "step": 141850 }, { - "epoch": 1.53, - "learning_rate": 6.996173055717713e-05, - "loss": 0.0113, + "epoch": 0.72, + "learning_rate": 0.00019264470690324954, + "loss": 0.0091, "step": 141860 }, { - "epoch": 1.53, - "learning_rate": 6.994551469157423e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.00019263713921023555, + "loss": 0.014, "step": 141870 }, { - "epoch": 1.53, - "learning_rate": 6.992929882597132e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019262957151722153, + "loss": 0.0132, "step": 141880 }, { - "epoch": 1.53, - "learning_rate": 6.991308296036841e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.0001926220038242075, + "loss": 0.0193, "step": 141890 }, { - "epoch": 1.53, - "learning_rate": 6.98968670947655e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.0001926144361311935, + "loss": 0.0147, "step": 141900 }, { - "epoch": 1.53, - "learning_rate": 6.98806512291626e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.0001926068684381795, + "loss": 0.0123, "step": 141910 }, { - "epoch": 1.53, - "learning_rate": 6.98644353635597e-05, - "loss": 0.0065, + "epoch": 0.72, + "learning_rate": 0.00019259930074516548, + "loss": 0.0165, "step": 141920 }, { - "epoch": 1.53, - "learning_rate": 6.98482194979568e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019259173305215146, + "loss": 0.0159, "step": 141930 }, { - "epoch": 1.53, - "learning_rate": 6.983200363235389e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019258416535913747, + "loss": 0.0135, "step": 141940 }, { - "epoch": 1.53, - "learning_rate": 6.981578776675098e-05, - "loss": 0.0062, + "epoch": 0.72, + "learning_rate": 0.00019257659766612345, + "loss": 0.0166, "step": 141950 }, { - "epoch": 1.53, - "learning_rate": 6.979957190114808e-05, - "loss": 0.0104, + "epoch": 0.72, + "learning_rate": 0.00019256902997310944, + "loss": 0.0119, "step": 141960 }, { - "epoch": 1.53, - "learning_rate": 6.978335603554517e-05, - "loss": 0.0097, + "epoch": 0.72, + "learning_rate": 0.00019256146228009544, + "loss": 0.0129, "step": 141970 }, { - "epoch": 1.53, - "learning_rate": 6.976714016994226e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.00019255389458708143, + "loss": 0.0146, "step": 141980 }, { - "epoch": 1.53, - "learning_rate": 6.975092430433935e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.0001925463268940674, + "loss": 0.015, "step": 141990 }, { - "epoch": 1.54, - "learning_rate": 6.973470843873645e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.00019253875920105342, + "loss": 0.0109, "step": 142000 }, { - "epoch": 1.54, - "eval_cer": 0.9215330147297689, - "eval_loss": 0.0063419705256819725, - "eval_runtime": 121.1571, - "eval_samples_per_second": 16.507, - "eval_steps_per_second": 4.127, + "epoch": 0.72, + "eval_cer": 0.9144751078837893, + "eval_loss": 0.009451182559132576, + "eval_runtime": 116.6955, + "eval_samples_per_second": 17.139, + "eval_steps_per_second": 4.285, "step": 142000 }, { - "epoch": 1.54, - "learning_rate": 6.971849257313354e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.0001925311915080394, + "loss": 0.0138, "step": 142010 }, { - "epoch": 1.54, - "learning_rate": 6.970227670753063e-05, - "loss": 0.0063, + "epoch": 0.72, + "learning_rate": 0.00019252362381502538, + "loss": 0.014, "step": 142020 }, { - "epoch": 1.54, - "learning_rate": 6.968606084192774e-05, - "loss": 0.0055, + "epoch": 0.72, + "learning_rate": 0.0001925160561220114, + "loss": 0.0146, "step": 142030 }, { - "epoch": 1.54, - "learning_rate": 6.966984497632483e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019250848842899737, + "loss": 0.0153, "step": 142040 }, { - "epoch": 1.54, - "learning_rate": 6.965362911072192e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019250092073598335, + "loss": 0.0132, "step": 142050 }, { - "epoch": 1.54, - "learning_rate": 6.963741324511902e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019249335304296933, + "loss": 0.0153, "step": 142060 }, { - "epoch": 1.54, - "learning_rate": 6.962119737951612e-05, - "loss": 0.0097, + "epoch": 0.72, + "learning_rate": 0.00019248578534995534, + "loss": 0.0151, "step": 142070 }, { - "epoch": 1.54, - "learning_rate": 6.960498151391322e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019247821765694132, + "loss": 0.0142, "step": 142080 }, { - "epoch": 1.54, - "learning_rate": 6.958876564831031e-05, - "loss": 0.0089, + "epoch": 0.72, + "learning_rate": 0.0001924706499639273, + "loss": 0.0145, "step": 142090 }, { - "epoch": 1.54, - "learning_rate": 6.95725497827074e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.0001924630822709133, + "loss": 0.0106, "step": 142100 }, { - "epoch": 1.54, - "learning_rate": 6.95563339171045e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.0001924555145778993, + "loss": 0.0153, "step": 142110 }, { - "epoch": 1.54, - "learning_rate": 6.954011805150159e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.00019244794688488527, + "loss": 0.0152, "step": 142120 }, { - "epoch": 1.54, - "learning_rate": 6.952390218589868e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019244037919187128, + "loss": 0.0128, "step": 142130 }, { - "epoch": 1.54, - "learning_rate": 6.950768632029577e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019243281149885726, + "loss": 0.014, "step": 142140 }, { - "epoch": 1.54, - "learning_rate": 6.949147045469286e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019242524380584325, + "loss": 0.0126, "step": 142150 }, { - "epoch": 1.54, - "learning_rate": 6.947525458908996e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.00019241767611282925, + "loss": 0.0171, "step": 142160 }, { - "epoch": 1.54, - "learning_rate": 6.945903872348705e-05, - "loss": 0.0085, + "epoch": 0.72, + "learning_rate": 0.00019241010841981524, + "loss": 0.0135, "step": 142170 }, { - "epoch": 1.54, - "learning_rate": 6.944282285788416e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019240254072680122, + "loss": 0.0184, "step": 142180 }, { - "epoch": 1.54, - "learning_rate": 6.942660699228125e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.00019239497303378723, + "loss": 0.013, "step": 142190 }, { - "epoch": 1.54, - "learning_rate": 6.941039112667834e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.0001923874053407732, + "loss": 0.0143, "step": 142200 }, { - "epoch": 1.54, - "learning_rate": 6.939417526107543e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.0001923798376477592, + "loss": 0.018, "step": 142210 }, { - "epoch": 1.54, - "learning_rate": 6.937795939547253e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.0001923722699547452, + "loss": 0.014, "step": 142220 }, { - "epoch": 1.54, - "learning_rate": 6.936174352986962e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019236470226173118, + "loss": 0.0103, "step": 142230 }, { - "epoch": 1.54, - "learning_rate": 6.934552766426671e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019235713456871716, + "loss": 0.0136, "step": 142240 }, { - "epoch": 1.54, - "learning_rate": 6.93293117986638e-05, - "loss": 0.0102, + "epoch": 0.72, + "learning_rate": 0.00019234956687570314, + "loss": 0.0144, "step": 142250 }, { - "epoch": 1.54, - "learning_rate": 6.93130959330609e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019234199918268915, + "loss": 0.0158, "step": 142260 }, { - "epoch": 1.54, - "learning_rate": 6.929688006745799e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019233443148967513, + "loss": 0.0122, "step": 142270 }, { - "epoch": 1.54, - "learning_rate": 6.92806642018551e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.0001923268637966611, + "loss": 0.0139, "step": 142280 }, { - "epoch": 1.54, - "learning_rate": 6.926444833625219e-05, - "loss": 0.0095, + "epoch": 0.72, + "learning_rate": 0.00019231929610364712, + "loss": 0.0112, "step": 142290 }, { - "epoch": 1.54, - "learning_rate": 6.924823247064928e-05, - "loss": 0.0101, + "epoch": 0.72, + "learning_rate": 0.0001923117284106331, + "loss": 0.0123, "step": 142300 }, { - "epoch": 1.54, - "learning_rate": 6.923201660504638e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019230416071761908, + "loss": 0.0143, "step": 142310 }, { - "epoch": 1.54, - "learning_rate": 6.921580073944347e-05, - "loss": 0.0085, + "epoch": 0.72, + "learning_rate": 0.0001922965930246051, + "loss": 0.0179, "step": 142320 }, { - "epoch": 1.54, - "learning_rate": 6.919958487384056e-05, - "loss": 0.0096, + "epoch": 0.72, + "learning_rate": 0.00019228902533159107, + "loss": 0.0118, "step": 142330 }, { - "epoch": 1.54, - "learning_rate": 6.918336900823765e-05, - "loss": 0.0058, + "epoch": 0.72, + "learning_rate": 0.00019228145763857706, + "loss": 0.013, "step": 142340 }, { - "epoch": 1.54, - "learning_rate": 6.916715314263475e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019227388994556306, + "loss": 0.0128, "step": 142350 }, { - "epoch": 1.54, - "learning_rate": 6.915093727703184e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.00019226632225254905, + "loss": 0.011, "step": 142360 }, { - "epoch": 1.54, - "learning_rate": 6.913472141142893e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019225875455953503, + "loss": 0.0148, "step": 142370 }, { - "epoch": 1.54, - "learning_rate": 6.911850554582602e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.00019225118686652104, + "loss": 0.0181, "step": 142380 }, { - "epoch": 1.54, - "learning_rate": 6.910228968022313e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019224361917350702, + "loss": 0.0131, "step": 142390 }, { - "epoch": 1.54, - "learning_rate": 6.908607381462022e-05, - "loss": 0.0109, + "epoch": 0.72, + "learning_rate": 0.000192236051480493, + "loss": 0.0149, "step": 142400 }, { - "epoch": 1.54, - "learning_rate": 6.906985794901732e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.00019222848378747898, + "loss": 0.0153, "step": 142410 }, { - "epoch": 1.54, - "learning_rate": 6.905364208341441e-05, - "loss": 0.006, + "epoch": 0.72, + "learning_rate": 0.000192220916094465, + "loss": 0.0126, "step": 142420 }, { - "epoch": 1.54, - "learning_rate": 6.90374262178115e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019221334840145097, + "loss": 0.0121, "step": 142430 }, { - "epoch": 1.54, - "learning_rate": 6.90212103522086e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019220578070843695, + "loss": 0.011, "step": 142440 }, { - "epoch": 1.54, - "learning_rate": 6.900499448660569e-05, - "loss": 0.0086, + "epoch": 0.72, + "learning_rate": 0.00019219821301542296, + "loss": 0.0117, "step": 142450 }, { - "epoch": 1.54, - "learning_rate": 6.898877862100278e-05, - "loss": 0.0056, + "epoch": 0.72, + "learning_rate": 0.00019219064532240894, + "loss": 0.0129, "step": 142460 }, { - "epoch": 1.54, - "learning_rate": 6.897256275539987e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.00019218307762939492, + "loss": 0.0139, "step": 142470 }, { - "epoch": 1.54, - "learning_rate": 6.895634688979697e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019217550993638093, + "loss": 0.0126, "step": 142480 }, { - "epoch": 1.54, - "learning_rate": 6.894013102419406e-05, - "loss": 0.0103, + "epoch": 0.72, + "learning_rate": 0.0001921679422433669, + "loss": 0.0118, "step": 142490 }, { - "epoch": 1.54, - "learning_rate": 6.892391515859116e-05, - "loss": 0.0106, + "epoch": 0.72, + "learning_rate": 0.0001921603745503529, + "loss": 0.0116, "step": 142500 }, { - "epoch": 1.54, - "learning_rate": 6.890769929298826e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.0001921528068573389, + "loss": 0.0144, "step": 142510 }, { - "epoch": 1.54, - "learning_rate": 6.889148342738535e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019214523916432488, + "loss": 0.014, "step": 142520 }, { - "epoch": 1.54, - "learning_rate": 6.887526756178244e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019213767147131087, + "loss": 0.0122, "step": 142530 }, { - "epoch": 1.54, - "learning_rate": 6.885905169617954e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.00019213010377829687, + "loss": 0.016, "step": 142540 }, { - "epoch": 1.54, - "learning_rate": 6.884283583057663e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.00019212253608528286, + "loss": 0.0103, "step": 142550 }, { - "epoch": 1.54, - "learning_rate": 6.882661996497372e-05, - "loss": 0.0104, + "epoch": 0.72, + "learning_rate": 0.00019211496839226884, + "loss": 0.0127, "step": 142560 }, { - "epoch": 1.54, - "learning_rate": 6.881040409937081e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019210740069925482, + "loss": 0.0114, "step": 142570 }, { - "epoch": 1.54, - "learning_rate": 6.87941882337679e-05, - "loss": 0.0101, + "epoch": 0.72, + "learning_rate": 0.00019209983300624083, + "loss": 0.0091, "step": 142580 }, { - "epoch": 1.54, - "learning_rate": 6.8777972368165e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.0001920922653132268, + "loss": 0.014, "step": 142590 }, { - "epoch": 1.54, - "learning_rate": 6.876175650256209e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.0001920846976202128, + "loss": 0.0124, "step": 142600 }, { - "epoch": 1.54, - "learning_rate": 6.87455406369592e-05, - "loss": 0.0062, + "epoch": 0.72, + "learning_rate": 0.0001920771299271988, + "loss": 0.013, "step": 142610 }, { - "epoch": 1.54, - "learning_rate": 6.872932477135629e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.00019206956223418478, + "loss": 0.01, "step": 142620 }, { - "epoch": 1.54, - "learning_rate": 6.871310890575338e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.00019206199454117076, + "loss": 0.0132, "step": 142630 }, { - "epoch": 1.54, - "learning_rate": 6.869689304015048e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019205442684815677, + "loss": 0.0143, "step": 142640 }, { - "epoch": 1.54, - "learning_rate": 6.868067717454757e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.00019204685915514275, + "loss": 0.0164, "step": 142650 }, { - "epoch": 1.54, - "learning_rate": 6.866446130894466e-05, - "loss": 0.0093, + "epoch": 0.72, + "learning_rate": 0.0001920392914621287, + "loss": 0.0102, "step": 142660 }, { - "epoch": 1.54, - "learning_rate": 6.864824544334176e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.0001920317237691147, + "loss": 0.0154, "step": 142670 }, { - "epoch": 1.54, - "learning_rate": 6.863202957773885e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.0001920241560761007, + "loss": 0.0115, "step": 142680 }, { - "epoch": 1.54, - "learning_rate": 6.861581371213594e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019201658838308668, + "loss": 0.0125, "step": 142690 }, { - "epoch": 1.54, - "learning_rate": 6.859959784653303e-05, - "loss": 0.0116, + "epoch": 0.72, + "learning_rate": 0.00019200902069007266, + "loss": 0.0144, "step": 142700 }, { - "epoch": 1.54, - "learning_rate": 6.858338198093013e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019200145299705867, + "loss": 0.0121, "step": 142710 }, { - "epoch": 1.54, - "learning_rate": 6.856716611532723e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019199388530404465, + "loss": 0.0112, "step": 142720 }, { - "epoch": 1.54, - "learning_rate": 6.855095024972433e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019198631761103063, + "loss": 0.0116, "step": 142730 }, { - "epoch": 1.54, - "learning_rate": 6.853473438412142e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.00019197874991801664, + "loss": 0.0134, "step": 142740 }, { - "epoch": 1.54, - "learning_rate": 6.851851851851851e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019197118222500262, + "loss": 0.0114, "step": 142750 }, { - "epoch": 1.54, - "learning_rate": 6.85023026529156e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.0001919636145319886, + "loss": 0.012, "step": 142760 }, { - "epoch": 1.54, - "learning_rate": 6.84860867873127e-05, - "loss": 0.0091, + "epoch": 0.72, + "learning_rate": 0.0001919560468389746, + "loss": 0.0119, "step": 142770 }, { - "epoch": 1.54, - "learning_rate": 6.846987092170979e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.0001919484791459606, + "loss": 0.0134, "step": 142780 }, { - "epoch": 1.54, - "learning_rate": 6.84536550561069e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019194091145294657, + "loss": 0.0118, "step": 142790 }, { - "epoch": 1.54, - "learning_rate": 6.843743919050399e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.00019193334375993255, + "loss": 0.0128, "step": 142800 }, { - "epoch": 1.54, - "learning_rate": 6.842122332490108e-05, - "loss": 0.0063, + "epoch": 0.72, + "learning_rate": 0.00019192577606691856, + "loss": 0.0123, "step": 142810 }, { - "epoch": 1.54, - "learning_rate": 6.840500745929817e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019191820837390454, + "loss": 0.0112, "step": 142820 }, { - "epoch": 1.54, - "learning_rate": 6.838879159369527e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019191064068089053, + "loss": 0.0137, "step": 142830 }, { - "epoch": 1.54, - "learning_rate": 6.837257572809236e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019190307298787653, + "loss": 0.0129, "step": 142840 }, { - "epoch": 1.54, - "learning_rate": 6.835635986248945e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.00019189550529486252, + "loss": 0.0115, "step": 142850 }, { - "epoch": 1.54, - "learning_rate": 6.834014399688656e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.0001918879376018485, + "loss": 0.0116, "step": 142860 }, { - "epoch": 1.54, - "learning_rate": 6.832392813128365e-05, - "loss": 0.0091, + "epoch": 0.72, + "learning_rate": 0.0001918803699088345, + "loss": 0.0101, "step": 142870 }, { - "epoch": 1.54, - "learning_rate": 6.830771226568074e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.0001918728022158205, + "loss": 0.0141, "step": 142880 }, { - "epoch": 1.54, - "learning_rate": 6.829149640007784e-05, - "loss": 0.0117, + "epoch": 0.72, + "learning_rate": 0.00019186523452280647, + "loss": 0.0137, "step": 142890 }, { - "epoch": 1.54, - "learning_rate": 6.827528053447493e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019185766682979248, + "loss": 0.0127, "step": 142900 }, { - "epoch": 1.54, - "learning_rate": 6.825906466887202e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019185009913677846, + "loss": 0.0171, "step": 142910 }, { - "epoch": 1.55, - "learning_rate": 6.824284880326911e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.00019184253144376444, + "loss": 0.0109, "step": 142920 }, { - "epoch": 1.55, - "learning_rate": 6.822663293766621e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019183496375075045, + "loss": 0.0139, "step": 142930 }, { - "epoch": 1.55, - "learning_rate": 6.82104170720633e-05, - "loss": 0.011, + "epoch": 0.72, + "learning_rate": 0.00019182739605773643, + "loss": 0.0149, "step": 142940 }, { - "epoch": 1.55, - "learning_rate": 6.819420120646039e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.0001918198283647224, + "loss": 0.0144, "step": 142950 }, { - "epoch": 1.55, - "learning_rate": 6.817798534085749e-05, - "loss": 0.006, + "epoch": 0.72, + "learning_rate": 0.0001918122606717084, + "loss": 0.012, "step": 142960 }, { - "epoch": 1.55, - "learning_rate": 6.816176947525459e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.0001918046929786944, + "loss": 0.0132, "step": 142970 }, { - "epoch": 1.55, - "learning_rate": 6.814555360965168e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019179712528568038, + "loss": 0.0132, "step": 142980 }, { - "epoch": 1.55, - "learning_rate": 6.812933774404878e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019178955759266636, + "loss": 0.0131, "step": 142990 }, { - "epoch": 1.55, - "learning_rate": 6.811312187844587e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019178198989965237, + "loss": 0.0133, "step": 143000 }, { - "epoch": 1.55, - "eval_cer": 0.9215269345090743, - "eval_loss": 0.00622851075604558, - "eval_runtime": 121.148, - "eval_samples_per_second": 16.509, - "eval_steps_per_second": 4.127, + "epoch": 0.72, + "eval_cer": 0.9144770486760401, + "eval_loss": 0.00942008476704359, + "eval_runtime": 116.7292, + "eval_samples_per_second": 17.134, + "eval_steps_per_second": 4.283, "step": 143000 }, { - "epoch": 1.55, - "learning_rate": 6.809690601284296e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.00019177442220663835, + "loss": 0.0117, "step": 143010 }, { - "epoch": 1.55, - "learning_rate": 6.808069014724006e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019176685451362434, + "loss": 0.0151, "step": 143020 }, { - "epoch": 1.55, - "learning_rate": 6.806447428163715e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019175928682061034, + "loss": 0.0119, "step": 143030 }, { - "epoch": 1.55, - "learning_rate": 6.804825841603424e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019175171912759633, + "loss": 0.0118, "step": 143040 }, { - "epoch": 1.55, - "learning_rate": 6.803204255043133e-05, - "loss": 0.0053, + "epoch": 0.72, + "learning_rate": 0.0001917441514345823, + "loss": 0.0126, "step": 143050 }, { - "epoch": 1.55, - "learning_rate": 6.801582668482843e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.00019173658374156832, + "loss": 0.0122, "step": 143060 }, { - "epoch": 1.55, - "learning_rate": 6.799961081922552e-05, - "loss": 0.0106, + "epoch": 0.72, + "learning_rate": 0.0001917290160485543, + "loss": 0.014, "step": 143070 }, { - "epoch": 1.55, - "learning_rate": 6.798339495362263e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019172144835554028, + "loss": 0.0141, "step": 143080 }, { - "epoch": 1.55, - "learning_rate": 6.796717908801972e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.0001917138806625263, + "loss": 0.0156, "step": 143090 }, { - "epoch": 1.55, - "learning_rate": 6.795096322241681e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019170631296951227, + "loss": 0.0138, "step": 143100 }, { - "epoch": 1.55, - "learning_rate": 6.79347473568139e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019169874527649825, + "loss": 0.0142, "step": 143110 }, { - "epoch": 1.55, - "learning_rate": 6.7918531491211e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019169117758348426, + "loss": 0.0129, "step": 143120 }, { - "epoch": 1.55, - "learning_rate": 6.790231562560809e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019168360989047024, + "loss": 0.0148, "step": 143130 }, { - "epoch": 1.55, - "learning_rate": 6.788609976000518e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019167604219745622, + "loss": 0.0118, "step": 143140 }, { - "epoch": 1.55, - "learning_rate": 6.786988389440227e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.0001916684745044422, + "loss": 0.0114, "step": 143150 }, { - "epoch": 1.55, - "learning_rate": 6.785366802879937e-05, - "loss": 0.0089, + "epoch": 0.72, + "learning_rate": 0.0001916609068114282, + "loss": 0.0154, "step": 143160 }, { - "epoch": 1.55, - "learning_rate": 6.783745216319646e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.0001916533391184142, + "loss": 0.0101, "step": 143170 }, { - "epoch": 1.55, - "learning_rate": 6.782123629759355e-05, - "loss": 0.0096, + "epoch": 0.72, + "learning_rate": 0.00019164577142540017, + "loss": 0.0117, "step": 143180 }, { - "epoch": 1.55, - "learning_rate": 6.780502043199066e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.00019163820373238618, + "loss": 0.013, "step": 143190 }, { - "epoch": 1.55, - "learning_rate": 6.778880456638775e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019163063603937216, + "loss": 0.0107, "step": 143200 }, { - "epoch": 1.55, - "learning_rate": 6.777258870078484e-05, - "loss": 0.0099, + "epoch": 0.72, + "learning_rate": 0.00019162306834635815, + "loss": 0.0127, "step": 143210 }, { - "epoch": 1.55, - "learning_rate": 6.775637283518194e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019161550065334415, + "loss": 0.0124, "step": 143220 }, { - "epoch": 1.55, - "learning_rate": 6.774015696957903e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.00019160793296033014, + "loss": 0.0114, "step": 143230 }, { - "epoch": 1.55, - "learning_rate": 6.772394110397612e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.00019160036526731612, + "loss": 0.0146, "step": 143240 }, { - "epoch": 1.55, - "learning_rate": 6.770772523837322e-05, - "loss": 0.0065, + "epoch": 0.72, + "learning_rate": 0.00019159279757430213, + "loss": 0.0129, "step": 143250 }, { - "epoch": 1.55, - "learning_rate": 6.769150937277031e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.0001915852298812881, + "loss": 0.0117, "step": 143260 }, { - "epoch": 1.55, - "learning_rate": 6.76752935071674e-05, - "loss": 0.0086, + "epoch": 0.72, + "learning_rate": 0.0001915776621882741, + "loss": 0.0119, "step": 143270 }, { - "epoch": 1.55, - "learning_rate": 6.76590776415645e-05, - "loss": 0.0092, + "epoch": 0.72, + "learning_rate": 0.0001915700944952601, + "loss": 0.014, "step": 143280 }, { - "epoch": 1.55, - "learning_rate": 6.764286177596159e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019156252680224608, + "loss": 0.0117, "step": 143290 }, { - "epoch": 1.55, - "learning_rate": 6.762664591035869e-05, - "loss": 0.0092, + "epoch": 0.72, + "learning_rate": 0.00019155495910923206, + "loss": 0.0136, "step": 143300 }, { - "epoch": 1.55, - "learning_rate": 6.761043004475579e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019154739141621804, + "loss": 0.0107, "step": 143310 }, { - "epoch": 1.55, - "learning_rate": 6.759421417915288e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.00019153982372320405, + "loss": 0.0184, "step": 143320 }, { - "epoch": 1.55, - "learning_rate": 6.757799831354997e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019153225603019003, + "loss": 0.013, "step": 143330 }, { - "epoch": 1.55, - "learning_rate": 6.756178244794706e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.000191524688337176, + "loss": 0.0119, "step": 143340 }, { - "epoch": 1.55, - "learning_rate": 6.754556658234416e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.00019151712064416202, + "loss": 0.0107, "step": 143350 }, { - "epoch": 1.55, - "learning_rate": 6.752935071674125e-05, - "loss": 0.0085, + "epoch": 0.72, + "learning_rate": 0.000191509552951148, + "loss": 0.0104, "step": 143360 }, { - "epoch": 1.55, - "learning_rate": 6.751313485113834e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019150198525813398, + "loss": 0.0135, "step": 143370 }, { - "epoch": 1.55, - "learning_rate": 6.749691898553543e-05, - "loss": 0.0065, + "epoch": 0.72, + "learning_rate": 0.00019149441756512, + "loss": 0.0128, "step": 143380 }, { - "epoch": 1.55, - "learning_rate": 6.748070311993253e-05, - "loss": 0.0085, + "epoch": 0.72, + "learning_rate": 0.00019148684987210597, + "loss": 0.0124, "step": 143390 }, { - "epoch": 1.55, - "learning_rate": 6.746448725432963e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019147928217909196, + "loss": 0.0147, "step": 143400 }, { - "epoch": 1.55, - "learning_rate": 6.744827138872673e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.00019147171448607796, + "loss": 0.0101, "step": 143410 }, { - "epoch": 1.55, - "learning_rate": 6.743205552312382e-05, - "loss": 0.0094, + "epoch": 0.72, + "learning_rate": 0.00019146414679306395, + "loss": 0.0112, "step": 143420 }, { - "epoch": 1.55, - "learning_rate": 6.741583965752091e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019145657910004993, + "loss": 0.0129, "step": 143430 }, { - "epoch": 1.55, - "learning_rate": 6.7399623791918e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019144901140703594, + "loss": 0.0153, "step": 143440 }, { - "epoch": 1.55, - "learning_rate": 6.73834079263151e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019144144371402192, + "loss": 0.0125, "step": 143450 }, { - "epoch": 1.55, - "learning_rate": 6.736719206071219e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.0001914338760210079, + "loss": 0.0118, "step": 143460 }, { - "epoch": 1.55, - "learning_rate": 6.735097619510928e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019142630832799388, + "loss": 0.0151, "step": 143470 }, { - "epoch": 1.55, - "learning_rate": 6.733476032950638e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.0001914187406349799, + "loss": 0.0118, "step": 143480 }, { - "epoch": 1.55, - "learning_rate": 6.731854446390347e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019141117294196587, + "loss": 0.0106, "step": 143490 }, { - "epoch": 1.55, - "learning_rate": 6.730232859830056e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019140360524895185, + "loss": 0.0139, "step": 143500 }, { - "epoch": 1.55, - "learning_rate": 6.728611273269767e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019139603755593786, + "loss": 0.0128, "step": 143510 }, { - "epoch": 1.55, - "learning_rate": 6.726989686709476e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019138846986292384, + "loss": 0.0123, "step": 143520 }, { - "epoch": 1.55, - "learning_rate": 6.725368100149185e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019138090216990982, + "loss": 0.0137, "step": 143530 }, { - "epoch": 1.55, - "learning_rate": 6.723746513588895e-05, - "loss": 0.0055, + "epoch": 0.72, + "learning_rate": 0.00019137333447689583, + "loss": 0.0155, "step": 143540 }, { - "epoch": 1.55, - "learning_rate": 6.722124927028605e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.0001913657667838818, + "loss": 0.0148, "step": 143550 }, { - "epoch": 1.55, - "learning_rate": 6.720503340468314e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.0001913581990908678, + "loss": 0.0126, "step": 143560 }, { - "epoch": 1.55, - "learning_rate": 6.718881753908024e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.0001913506313978538, + "loss": 0.0119, "step": 143570 }, { - "epoch": 1.55, - "learning_rate": 6.717260167347733e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019134306370483978, + "loss": 0.0104, "step": 143580 }, { - "epoch": 1.55, - "learning_rate": 6.715638580787442e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019133549601182577, + "loss": 0.0147, "step": 143590 }, { - "epoch": 1.55, - "learning_rate": 6.714016994227152e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019132792831881177, + "loss": 0.0133, "step": 143600 }, { - "epoch": 1.55, - "learning_rate": 6.712395407666861e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019132036062579776, + "loss": 0.0133, "step": 143610 }, { - "epoch": 1.55, - "learning_rate": 6.71077382110657e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.00019131279293278374, + "loss": 0.0137, "step": 143620 }, { - "epoch": 1.55, - "learning_rate": 6.70915223454628e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019130522523976975, + "loss": 0.0189, "step": 143630 }, { - "epoch": 1.55, - "learning_rate": 6.707530647985989e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019129765754675573, + "loss": 0.0178, "step": 143640 }, { - "epoch": 1.55, - "learning_rate": 6.705909061425698e-05, - "loss": 0.0142, + "epoch": 0.72, + "learning_rate": 0.0001912900898537417, + "loss": 0.0132, "step": 143650 }, { - "epoch": 1.55, - "learning_rate": 6.704287474865409e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.0001912825221607277, + "loss": 0.0116, "step": 143660 }, { - "epoch": 1.55, - "learning_rate": 6.702665888305118e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.0001912749544677137, + "loss": 0.0155, "step": 143670 }, { - "epoch": 1.55, - "learning_rate": 6.701044301744827e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019126738677469968, + "loss": 0.0131, "step": 143680 }, { - "epoch": 1.55, - "learning_rate": 6.699422715184536e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019125981908168566, + "loss": 0.0139, "step": 143690 }, { - "epoch": 1.55, - "learning_rate": 6.697801128624246e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019125225138867167, + "loss": 0.0125, "step": 143700 }, { - "epoch": 1.55, - "learning_rate": 6.696179542063955e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019124468369565765, + "loss": 0.0117, "step": 143710 }, { - "epoch": 1.55, - "learning_rate": 6.694557955503664e-05, - "loss": 0.0064, + "epoch": 0.73, + "learning_rate": 0.00019123711600264363, + "loss": 0.0148, "step": 143720 }, { - "epoch": 1.55, - "learning_rate": 6.692936368943373e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00019122954830962964, + "loss": 0.0123, "step": 143730 }, { - "epoch": 1.55, - "learning_rate": 6.691314782383083e-05, - "loss": 0.0086, + "epoch": 0.73, + "learning_rate": 0.00019122198061661562, + "loss": 0.0124, "step": 143740 }, { - "epoch": 1.55, - "learning_rate": 6.689693195822792e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.0001912144129236016, + "loss": 0.0141, "step": 143750 }, { - "epoch": 1.55, - "learning_rate": 6.688071609262501e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.0001912068452305876, + "loss": 0.0107, "step": 143760 }, { - "epoch": 1.55, - "learning_rate": 6.686450022702212e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.0001911992775375736, + "loss": 0.0144, "step": 143770 }, { - "epoch": 1.55, - "learning_rate": 6.684828436141921e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019119170984455958, + "loss": 0.0149, "step": 143780 }, { - "epoch": 1.55, - "learning_rate": 6.68320684958163e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019118414215154558, + "loss": 0.0112, "step": 143790 }, { - "epoch": 1.55, - "learning_rate": 6.68158526302134e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.00019117657445853157, + "loss": 0.0141, "step": 143800 }, { - "epoch": 1.55, - "learning_rate": 6.679963676461049e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019116900676551755, + "loss": 0.0118, "step": 143810 }, { - "epoch": 1.55, - "learning_rate": 6.678342089900758e-05, - "loss": 0.0103, + "epoch": 0.73, + "learning_rate": 0.00019116143907250353, + "loss": 0.012, "step": 143820 }, { - "epoch": 1.55, - "learning_rate": 6.676720503340468e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019115387137948954, + "loss": 0.0146, "step": 143830 }, { - "epoch": 1.55, - "learning_rate": 6.675098916780177e-05, - "loss": 0.0064, + "epoch": 0.73, + "learning_rate": 0.00019114630368647552, + "loss": 0.011, "step": 143840 }, { - "epoch": 1.56, - "learning_rate": 6.673477330219886e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.0001911387359934615, + "loss": 0.0112, "step": 143850 }, { - "epoch": 1.56, - "learning_rate": 6.671855743659595e-05, - "loss": 0.0097, + "epoch": 0.73, + "learning_rate": 0.0001911311683004475, + "loss": 0.0162, "step": 143860 }, { - "epoch": 1.56, - "learning_rate": 6.670234157099306e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.0001911236006074335, + "loss": 0.0139, "step": 143870 }, { - "epoch": 1.56, - "learning_rate": 6.668612570539015e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019111603291441947, + "loss": 0.0144, "step": 143880 }, { - "epoch": 1.56, - "learning_rate": 6.666990983978725e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019110846522140548, + "loss": 0.0134, "step": 143890 }, { - "epoch": 1.56, - "learning_rate": 6.665369397418434e-05, - "loss": 0.0101, + "epoch": 0.73, + "learning_rate": 0.00019110089752839146, + "loss": 0.0126, "step": 143900 }, { - "epoch": 1.56, - "learning_rate": 6.663747810858143e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.00019109332983537744, + "loss": 0.0127, "step": 143910 }, { - "epoch": 1.56, - "learning_rate": 6.662126224297852e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.0001910857621423634, + "loss": 0.0119, "step": 143920 }, { - "epoch": 1.56, - "learning_rate": 6.660504637737562e-05, - "loss": 0.0082, + "epoch": 0.73, + "learning_rate": 0.0001910781944493494, + "loss": 0.016, "step": 143930 }, { - "epoch": 1.56, - "learning_rate": 6.658883051177271e-05, - "loss": 0.0095, + "epoch": 0.73, + "learning_rate": 0.0001910706267563354, + "loss": 0.0108, "step": 143940 }, { - "epoch": 1.56, - "learning_rate": 6.65726146461698e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.00019106305906332137, + "loss": 0.0166, "step": 143950 }, { - "epoch": 1.56, - "learning_rate": 6.65563987805669e-05, - "loss": 0.0058, + "epoch": 0.73, + "learning_rate": 0.00019105549137030738, + "loss": 0.0135, "step": 143960 }, { - "epoch": 1.56, - "learning_rate": 6.654018291496399e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019104792367729336, + "loss": 0.0133, "step": 143970 }, { - "epoch": 1.56, - "learning_rate": 6.65239670493611e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019104035598427934, + "loss": 0.0134, "step": 143980 }, { - "epoch": 1.56, - "learning_rate": 6.650775118375819e-05, - "loss": 0.0103, + "epoch": 0.73, + "learning_rate": 0.00019103278829126535, + "loss": 0.0121, "step": 143990 }, { - "epoch": 1.56, - "learning_rate": 6.649153531815528e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019102522059825133, + "loss": 0.0111, "step": 144000 }, { - "epoch": 1.56, - "eval_cer": 0.9214974020085575, - "eval_loss": 0.006375683005899191, - "eval_runtime": 121.1626, - "eval_samples_per_second": 16.507, - "eval_steps_per_second": 4.127, + "epoch": 0.73, + "eval_cer": 0.914481900656667, + "eval_loss": 0.009388601407408714, + "eval_runtime": 116.6959, + "eval_samples_per_second": 17.139, + "eval_steps_per_second": 4.285, "step": 144000 }, { - "epoch": 1.56, - "learning_rate": 6.647531945255237e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.0001910176529052373, + "loss": 0.01, "step": 144010 }, { - "epoch": 1.56, - "learning_rate": 6.645910358694947e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.00019101008521222332, + "loss": 0.0112, "step": 144020 }, { - "epoch": 1.56, - "learning_rate": 6.644288772134656e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.0001910025175192093, + "loss": 0.012, "step": 144030 }, { - "epoch": 1.56, - "learning_rate": 6.642667185574365e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019099494982619528, + "loss": 0.0141, "step": 144040 }, { - "epoch": 1.56, - "learning_rate": 6.641045599014074e-05, - "loss": 0.0087, + "epoch": 0.73, + "learning_rate": 0.00019098738213318126, + "loss": 0.0147, "step": 144050 }, { - "epoch": 1.56, - "learning_rate": 6.639424012453784e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.00019097981444016727, + "loss": 0.0136, "step": 144060 }, { - "epoch": 1.56, - "learning_rate": 6.637802425893493e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.00019097224674715325, + "loss": 0.011, "step": 144070 }, { - "epoch": 1.56, - "learning_rate": 6.636180839333202e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019096467905413924, + "loss": 0.0129, "step": 144080 }, { - "epoch": 1.56, - "learning_rate": 6.634559252772913e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00019095711136112524, + "loss": 0.012, "step": 144090 }, { - "epoch": 1.56, - "learning_rate": 6.632937666212622e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019094954366811123, + "loss": 0.0137, "step": 144100 }, { - "epoch": 1.56, - "learning_rate": 6.631316079652331e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.0001909419759750972, + "loss": 0.0132, "step": 144110 }, { - "epoch": 1.56, - "learning_rate": 6.62969449309204e-05, - "loss": 0.0111, + "epoch": 0.73, + "learning_rate": 0.00019093440828208322, + "loss": 0.0133, "step": 144120 }, { - "epoch": 1.56, - "learning_rate": 6.62807290653175e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.0001909268405890692, + "loss": 0.0107, "step": 144130 }, { - "epoch": 1.56, - "learning_rate": 6.626451319971459e-05, - "loss": 0.0115, + "epoch": 0.73, + "learning_rate": 0.00019091927289605518, + "loss": 0.0116, "step": 144140 }, { - "epoch": 1.56, - "learning_rate": 6.624829733411168e-05, - "loss": 0.005, + "epoch": 0.73, + "learning_rate": 0.0001909117052030412, + "loss": 0.0114, "step": 144150 }, { - "epoch": 1.56, - "learning_rate": 6.623208146850878e-05, - "loss": 0.0087, + "epoch": 0.73, + "learning_rate": 0.00019090413751002717, + "loss": 0.0115, "step": 144160 }, { - "epoch": 1.56, - "learning_rate": 6.621586560290587e-05, - "loss": 0.0097, + "epoch": 0.73, + "learning_rate": 0.00019089656981701315, + "loss": 0.0125, "step": 144170 }, { - "epoch": 1.56, - "learning_rate": 6.619964973730296e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019088900212399916, + "loss": 0.0101, "step": 144180 }, { - "epoch": 1.56, - "learning_rate": 6.618343387170006e-05, - "loss": 0.0063, + "epoch": 0.73, + "learning_rate": 0.00019088143443098514, + "loss": 0.016, "step": 144190 }, { - "epoch": 1.56, - "learning_rate": 6.616721800609716e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019087386673797112, + "loss": 0.0162, "step": 144200 }, { - "epoch": 1.56, - "learning_rate": 6.615100214049425e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.0001908662990449571, + "loss": 0.0118, "step": 144210 }, { - "epoch": 1.56, - "learning_rate": 6.613478627489135e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.0001908587313519431, + "loss": 0.0122, "step": 144220 }, { - "epoch": 1.56, - "learning_rate": 6.611857040928844e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.0001908511636589291, + "loss": 0.0149, "step": 144230 }, { - "epoch": 1.56, - "learning_rate": 6.610235454368555e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00019084359596591507, + "loss": 0.012, "step": 144240 }, { - "epoch": 1.56, - "learning_rate": 6.608613867808264e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.00019083602827290108, + "loss": 0.0141, "step": 144250 }, { - "epoch": 1.56, - "learning_rate": 6.606992281247973e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019082846057988706, + "loss": 0.0098, "step": 144260 }, { - "epoch": 1.56, - "learning_rate": 6.605370694687682e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.00019082089288687305, + "loss": 0.0121, "step": 144270 }, { - "epoch": 1.56, - "learning_rate": 6.603749108127392e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.00019081332519385905, + "loss": 0.0129, "step": 144280 }, { - "epoch": 1.56, - "learning_rate": 6.602127521567101e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019080575750084504, + "loss": 0.0143, "step": 144290 }, { - "epoch": 1.56, - "learning_rate": 6.60050593500681e-05, - "loss": 0.0087, + "epoch": 0.73, + "learning_rate": 0.00019079818980783102, + "loss": 0.012, "step": 144300 }, { - "epoch": 1.56, - "learning_rate": 6.59888434844652e-05, - "loss": 0.0057, + "epoch": 0.73, + "learning_rate": 0.00019079062211481703, + "loss": 0.0132, "step": 144310 }, { - "epoch": 1.56, - "learning_rate": 6.597262761886229e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.000190783054421803, + "loss": 0.0128, "step": 144320 }, { - "epoch": 1.56, - "learning_rate": 6.595641175325938e-05, - "loss": 0.0087, + "epoch": 0.73, + "learning_rate": 0.000190775486728789, + "loss": 0.0153, "step": 144330 }, { - "epoch": 1.56, - "learning_rate": 6.594019588765647e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.000190767919035775, + "loss": 0.014, "step": 144340 }, { - "epoch": 1.56, - "learning_rate": 6.592398002205358e-05, - "loss": 0.0061, + "epoch": 0.73, + "learning_rate": 0.00019076035134276098, + "loss": 0.0125, "step": 144350 }, { - "epoch": 1.56, - "learning_rate": 6.590776415645067e-05, - "loss": 0.0064, + "epoch": 0.73, + "learning_rate": 0.00019075278364974696, + "loss": 0.0138, "step": 144360 }, { - "epoch": 1.56, - "learning_rate": 6.589154829084777e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019074521595673294, + "loss": 0.0145, "step": 144370 }, { - "epoch": 1.56, - "learning_rate": 6.587533242524486e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.00019073764826371895, + "loss": 0.0121, "step": 144380 }, { - "epoch": 1.56, - "learning_rate": 6.585911655964195e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.00019073008057070493, + "loss": 0.0144, "step": 144390 }, { - "epoch": 1.56, - "learning_rate": 6.584290069403904e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.0001907225128776909, + "loss": 0.0141, "step": 144400 }, { - "epoch": 1.56, - "learning_rate": 6.582668482843614e-05, - "loss": 0.0085, + "epoch": 0.73, + "learning_rate": 0.00019071494518467692, + "loss": 0.0119, "step": 144410 }, { - "epoch": 1.56, - "learning_rate": 6.581046896283323e-05, - "loss": 0.0104, + "epoch": 0.73, + "learning_rate": 0.0001907073774916629, + "loss": 0.0145, "step": 144420 }, { - "epoch": 1.56, - "learning_rate": 6.579425309723032e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019069980979864888, + "loss": 0.0189, "step": 144430 }, { - "epoch": 1.56, - "learning_rate": 6.577803723162741e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.0001906922421056349, + "loss": 0.0111, "step": 144440 }, { - "epoch": 1.56, - "learning_rate": 6.576182136602452e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019068467441262087, + "loss": 0.0135, "step": 144450 }, { - "epoch": 1.56, - "learning_rate": 6.574560550042161e-05, - "loss": 0.0111, + "epoch": 0.73, + "learning_rate": 0.00019067710671960686, + "loss": 0.0128, "step": 144460 }, { - "epoch": 1.56, - "learning_rate": 6.57293896348187e-05, - "loss": 0.0124, + "epoch": 0.73, + "learning_rate": 0.00019066953902659286, + "loss": 0.0092, "step": 144470 }, { - "epoch": 1.56, - "learning_rate": 6.57131737692158e-05, - "loss": 0.0085, + "epoch": 0.73, + "learning_rate": 0.00019066197133357885, + "loss": 0.0114, "step": 144480 }, { - "epoch": 1.56, - "learning_rate": 6.569695790361289e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019065440364056483, + "loss": 0.0122, "step": 144490 }, { - "epoch": 1.56, - "learning_rate": 6.568074203800998e-05, - "loss": 0.0058, + "epoch": 0.73, + "learning_rate": 0.00019064683594755084, + "loss": 0.0118, "step": 144500 }, { - "epoch": 1.56, - "learning_rate": 6.566452617240708e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019063926825453682, + "loss": 0.0137, "step": 144510 }, { - "epoch": 1.56, - "learning_rate": 6.564831030680417e-05, - "loss": 0.0066, + "epoch": 0.73, + "learning_rate": 0.0001906317005615228, + "loss": 0.0118, "step": 144520 }, { - "epoch": 1.56, - "learning_rate": 6.563209444120126e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.0001906241328685088, + "loss": 0.0152, "step": 144530 }, { - "epoch": 1.56, - "learning_rate": 6.561587857559836e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.0001906165651754948, + "loss": 0.0183, "step": 144540 }, { - "epoch": 1.56, - "learning_rate": 6.559966270999545e-05, - "loss": 0.006, + "epoch": 0.73, + "learning_rate": 0.00019060899748248077, + "loss": 0.0167, "step": 144550 }, { - "epoch": 1.56, - "learning_rate": 6.558344684439255e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.00019060142978946675, + "loss": 0.0118, "step": 144560 }, { - "epoch": 1.56, - "learning_rate": 6.556723097878965e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019059386209645276, + "loss": 0.0128, "step": 144570 }, { - "epoch": 1.56, - "learning_rate": 6.555101511318674e-05, - "loss": 0.009, + "epoch": 0.73, + "learning_rate": 0.00019058629440343874, + "loss": 0.0116, "step": 144580 }, { - "epoch": 1.56, - "learning_rate": 6.553479924758383e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.00019057872671042472, + "loss": 0.0121, "step": 144590 }, { - "epoch": 1.56, - "learning_rate": 6.551858338198093e-05, - "loss": 0.0082, + "epoch": 0.73, + "learning_rate": 0.00019057115901741073, + "loss": 0.0132, "step": 144600 }, { - "epoch": 1.56, - "learning_rate": 6.550236751637802e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.0001905635913243967, + "loss": 0.0143, "step": 144610 }, { - "epoch": 1.56, - "learning_rate": 6.548615165077511e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.0001905560236313827, + "loss": 0.0125, "step": 144620 }, { - "epoch": 1.56, - "learning_rate": 6.54699357851722e-05, - "loss": 0.0049, + "epoch": 0.73, + "learning_rate": 0.0001905484559383687, + "loss": 0.0147, "step": 144630 }, { - "epoch": 1.56, - "learning_rate": 6.54537199195693e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00019054088824535468, + "loss": 0.0128, "step": 144640 }, { - "epoch": 1.56, - "learning_rate": 6.543750405396639e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.00019053332055234067, + "loss": 0.0147, "step": 144650 }, { - "epoch": 1.56, - "learning_rate": 6.542128818836348e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019052575285932667, + "loss": 0.0123, "step": 144660 }, { - "epoch": 1.56, - "learning_rate": 6.540507232276059e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019051818516631266, + "loss": 0.0182, "step": 144670 }, { - "epoch": 1.56, - "learning_rate": 6.538885645715768e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019051061747329864, + "loss": 0.0139, "step": 144680 }, { - "epoch": 1.56, - "learning_rate": 6.537264059155477e-05, - "loss": 0.0092, + "epoch": 0.73, + "learning_rate": 0.00019050304978028465, + "loss": 0.0118, "step": 144690 }, { - "epoch": 1.56, - "learning_rate": 6.535642472595187e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00019049548208727063, + "loss": 0.0149, "step": 144700 }, { - "epoch": 1.56, - "learning_rate": 6.534020886034896e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.0001904879143942566, + "loss": 0.0144, "step": 144710 }, { - "epoch": 1.56, - "learning_rate": 6.532399299474605e-05, - "loss": 0.0092, + "epoch": 0.73, + "learning_rate": 0.0001904803467012426, + "loss": 0.0136, "step": 144720 }, { - "epoch": 1.56, - "learning_rate": 6.530777712914314e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.0001904727790082286, + "loss": 0.0174, "step": 144730 }, { - "epoch": 1.56, - "learning_rate": 6.529156126354024e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019046521131521458, + "loss": 0.0144, "step": 144740 }, { - "epoch": 1.56, - "learning_rate": 6.527534539793733e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00019045764362220056, + "loss": 0.0121, "step": 144750 }, { - "epoch": 1.56, - "learning_rate": 6.525912953233442e-05, - "loss": 0.0058, + "epoch": 0.73, + "learning_rate": 0.00019045007592918657, + "loss": 0.0161, "step": 144760 }, { - "epoch": 1.57, - "learning_rate": 6.524291366673152e-05, - "loss": 0.0109, + "epoch": 0.73, + "learning_rate": 0.00019044250823617255, + "loss": 0.0108, "step": 144770 }, { - "epoch": 1.57, - "learning_rate": 6.522669780112862e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.00019043494054315853, + "loss": 0.0159, "step": 144780 }, { - "epoch": 1.57, - "learning_rate": 6.521048193552571e-05, - "loss": 0.01, + "epoch": 0.73, + "learning_rate": 0.00019042737285014454, + "loss": 0.0115, "step": 144790 }, { - "epoch": 1.57, - "learning_rate": 6.519426606992281e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.00019041980515713052, + "loss": 0.0113, "step": 144800 }, { - "epoch": 1.57, - "learning_rate": 6.51780502043199e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.0001904122374641165, + "loss": 0.0127, "step": 144810 }, { - "epoch": 1.57, - "learning_rate": 6.516183433871699e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00019040466977110251, + "loss": 0.0158, "step": 144820 }, { - "epoch": 1.57, - "learning_rate": 6.514561847311409e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.0001903971020780885, + "loss": 0.0134, "step": 144830 }, { - "epoch": 1.57, - "learning_rate": 6.512940260751118e-05, - "loss": 0.0082, + "epoch": 0.73, + "learning_rate": 0.00019038953438507448, + "loss": 0.0149, "step": 144840 }, { - "epoch": 1.57, - "learning_rate": 6.511318674190827e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00019038196669206049, + "loss": 0.0154, "step": 144850 }, { - "epoch": 1.57, - "learning_rate": 6.509697087630536e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.00019037439899904647, + "loss": 0.0132, "step": 144860 }, { - "epoch": 1.57, - "learning_rate": 6.508075501070246e-05, - "loss": 0.0101, + "epoch": 0.73, + "learning_rate": 0.00019036683130603245, + "loss": 0.0134, "step": 144870 }, { - "epoch": 1.57, - "learning_rate": 6.506453914509955e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019035926361301843, + "loss": 0.014, "step": 144880 }, { - "epoch": 1.57, - "learning_rate": 6.504832327949666e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019035169592000444, + "loss": 0.0122, "step": 144890 }, { - "epoch": 1.57, - "learning_rate": 6.503210741389375e-05, - "loss": 0.0087, + "epoch": 0.73, + "learning_rate": 0.00019034412822699042, + "loss": 0.0125, "step": 144900 }, { - "epoch": 1.57, - "learning_rate": 6.501589154829084e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.0001903365605339764, + "loss": 0.0123, "step": 144910 }, { - "epoch": 1.57, - "learning_rate": 6.499967568268793e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.0001903289928409624, + "loss": 0.0155, "step": 144920 }, { - "epoch": 1.57, - "learning_rate": 6.498345981708503e-05, - "loss": 0.0085, + "epoch": 0.73, + "learning_rate": 0.0001903214251479484, + "loss": 0.0157, "step": 144930 }, { - "epoch": 1.57, - "learning_rate": 6.496724395148213e-05, - "loss": 0.0101, + "epoch": 0.73, + "learning_rate": 0.00019031385745493437, + "loss": 0.0114, "step": 144940 }, { - "epoch": 1.57, - "learning_rate": 6.495102808587923e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.00019030628976192038, + "loss": 0.0132, "step": 144950 }, { - "epoch": 1.57, - "learning_rate": 6.493481222027632e-05, - "loss": 0.0085, + "epoch": 0.73, + "learning_rate": 0.00019029872206890636, + "loss": 0.0115, "step": 144960 }, { - "epoch": 1.57, - "learning_rate": 6.491859635467341e-05, - "loss": 0.0086, + "epoch": 0.73, + "learning_rate": 0.00019029115437589234, + "loss": 0.011, "step": 144970 }, { - "epoch": 1.57, - "learning_rate": 6.49023804890705e-05, - "loss": 0.0085, + "epoch": 0.73, + "learning_rate": 0.00019028358668287835, + "loss": 0.0123, "step": 144980 }, { - "epoch": 1.57, - "learning_rate": 6.48861646234676e-05, - "loss": 0.0101, + "epoch": 0.73, + "learning_rate": 0.00019027601898986433, + "loss": 0.0121, "step": 144990 }, { - "epoch": 1.57, - "learning_rate": 6.486994875786469e-05, - "loss": 0.0094, + "epoch": 0.73, + "learning_rate": 0.00019026845129685032, + "loss": 0.0122, "step": 145000 }, { - "epoch": 1.57, - "eval_cer": 0.9215243287002052, - "eval_loss": 0.006177145056426525, - "eval_runtime": 121.3378, - "eval_samples_per_second": 16.483, - "eval_steps_per_second": 4.121, + "epoch": 0.73, + "eval_cer": 0.9144566703574066, + "eval_loss": 0.00918771605938673, + "eval_runtime": 116.6602, + "eval_samples_per_second": 17.144, + "eval_steps_per_second": 4.286, "step": 145000 }, { - "epoch": 1.57, - "learning_rate": 6.485373289226178e-05, - "loss": 0.0086, + "epoch": 0.73, + "learning_rate": 0.00019026088360383632, + "loss": 0.0124, "step": 145010 }, { - "epoch": 1.57, - "learning_rate": 6.483751702665887e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.0001902533159108223, + "loss": 0.0144, "step": 145020 }, { - "epoch": 1.57, - "learning_rate": 6.482130116105598e-05, - "loss": 0.0105, + "epoch": 0.73, + "learning_rate": 0.0001902457482178083, + "loss": 0.0127, "step": 145030 }, { - "epoch": 1.57, - "learning_rate": 6.480508529545307e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019023818052479427, + "loss": 0.0136, "step": 145040 }, { - "epoch": 1.57, - "learning_rate": 6.478886942985017e-05, - "loss": 0.0086, + "epoch": 0.73, + "learning_rate": 0.00019023061283178028, + "loss": 0.011, "step": 145050 }, { - "epoch": 1.57, - "learning_rate": 6.477265356424726e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019022304513876626, + "loss": 0.0146, "step": 145060 }, { - "epoch": 1.57, - "learning_rate": 6.475643769864435e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00019021547744575224, + "loss": 0.0122, "step": 145070 }, { - "epoch": 1.57, - "learning_rate": 6.474022183304144e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.00019020790975273825, + "loss": 0.0126, "step": 145080 }, { - "epoch": 1.57, - "learning_rate": 6.472400596743854e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019020034205972423, + "loss": 0.0142, "step": 145090 }, { - "epoch": 1.57, - "learning_rate": 6.470779010183563e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.0001901927743667102, + "loss": 0.0154, "step": 145100 }, { - "epoch": 1.57, - "learning_rate": 6.469157423623272e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019018520667369622, + "loss": 0.0162, "step": 145110 }, { - "epoch": 1.57, - "learning_rate": 6.467535837062982e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.0001901776389806822, + "loss": 0.0114, "step": 145120 }, { - "epoch": 1.57, - "learning_rate": 6.465914250502691e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.00019017007128766818, + "loss": 0.0099, "step": 145130 }, { - "epoch": 1.57, - "learning_rate": 6.464292663942402e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.0001901625035946542, + "loss": 0.0117, "step": 145140 }, { - "epoch": 1.57, - "learning_rate": 6.462671077382111e-05, - "loss": 0.0098, + "epoch": 0.73, + "learning_rate": 0.00019015493590164017, + "loss": 0.0137, "step": 145150 }, { - "epoch": 1.57, - "learning_rate": 6.46104949082182e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.00019014736820862615, + "loss": 0.0133, "step": 145160 }, { - "epoch": 1.57, - "learning_rate": 6.45942790426153e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00019013980051561216, + "loss": 0.0083, "step": 145170 }, { - "epoch": 1.57, - "learning_rate": 6.457806317701239e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.00019013223282259812, + "loss": 0.0161, "step": 145180 }, { - "epoch": 1.57, - "learning_rate": 6.456184731140948e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.0001901246651295841, + "loss": 0.0127, "step": 145190 }, { - "epoch": 1.57, - "learning_rate": 6.454563144580657e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019011709743657008, + "loss": 0.0132, "step": 145200 }, { - "epoch": 1.57, - "learning_rate": 6.452941558020366e-05, - "loss": 0.0094, + "epoch": 0.73, + "learning_rate": 0.0001901095297435561, + "loss": 0.0121, "step": 145210 }, { - "epoch": 1.57, - "learning_rate": 6.451319971460076e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.00019010196205054207, + "loss": 0.0138, "step": 145220 }, { - "epoch": 1.57, - "learning_rate": 6.449698384899785e-05, - "loss": 0.0051, + "epoch": 0.73, + "learning_rate": 0.00019009439435752805, + "loss": 0.0111, "step": 145230 }, { - "epoch": 1.57, - "learning_rate": 6.448076798339494e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019008682666451406, + "loss": 0.0104, "step": 145240 }, { - "epoch": 1.57, - "learning_rate": 6.446455211779205e-05, - "loss": 0.0061, + "epoch": 0.73, + "learning_rate": 0.00019007925897150004, + "loss": 0.0138, "step": 145250 }, { - "epoch": 1.57, - "learning_rate": 6.444833625218914e-05, - "loss": 0.0085, + "epoch": 0.73, + "learning_rate": 0.00019007169127848602, + "loss": 0.0134, "step": 145260 }, { - "epoch": 1.57, - "learning_rate": 6.443212038658623e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.000190064123585472, + "loss": 0.0118, "step": 145270 }, { - "epoch": 1.57, - "learning_rate": 6.441590452098333e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.000190056555892458, + "loss": 0.0102, "step": 145280 }, { - "epoch": 1.57, - "learning_rate": 6.439968865538042e-05, - "loss": 0.0064, + "epoch": 0.73, + "learning_rate": 0.000190048988199444, + "loss": 0.0148, "step": 145290 }, { - "epoch": 1.57, - "learning_rate": 6.438347278977751e-05, - "loss": 0.0085, + "epoch": 0.73, + "learning_rate": 0.00019004142050642998, + "loss": 0.0117, "step": 145300 }, { - "epoch": 1.57, - "learning_rate": 6.43672569241746e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00019003385281341598, + "loss": 0.0125, "step": 145310 }, { - "epoch": 1.57, - "learning_rate": 6.43510410585717e-05, - "loss": 0.0098, + "epoch": 0.73, + "learning_rate": 0.00019002628512040197, + "loss": 0.0093, "step": 145320 }, { - "epoch": 1.57, - "learning_rate": 6.433482519296879e-05, - "loss": 0.0061, + "epoch": 0.73, + "learning_rate": 0.00019001871742738795, + "loss": 0.0128, "step": 145330 }, { - "epoch": 1.57, - "learning_rate": 6.431860932736588e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019001114973437396, + "loss": 0.0137, "step": 145340 }, { - "epoch": 1.57, - "learning_rate": 6.430239346176298e-05, - "loss": 0.0082, + "epoch": 0.73, + "learning_rate": 0.00019000358204135994, + "loss": 0.0143, "step": 145350 }, { - "epoch": 1.57, - "learning_rate": 6.428617759616008e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00018999601434834592, + "loss": 0.0134, "step": 145360 }, { - "epoch": 1.57, - "learning_rate": 6.426996173055718e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00018998844665533193, + "loss": 0.0143, "step": 145370 }, { - "epoch": 1.57, - "learning_rate": 6.425374586495427e-05, - "loss": 0.0102, + "epoch": 0.73, + "learning_rate": 0.0001899808789623179, + "loss": 0.0155, "step": 145380 }, { - "epoch": 1.57, - "learning_rate": 6.423752999935136e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.0001899733112693039, + "loss": 0.0134, "step": 145390 }, { - "epoch": 1.57, - "learning_rate": 6.422131413374845e-05, - "loss": 0.0059, + "epoch": 0.73, + "learning_rate": 0.0001899657435762899, + "loss": 0.0108, "step": 145400 }, { - "epoch": 1.57, - "learning_rate": 6.420509826814555e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00018995817588327588, + "loss": 0.0098, "step": 145410 }, { - "epoch": 1.57, - "learning_rate": 6.418888240254264e-05, - "loss": 0.009, + "epoch": 0.73, + "learning_rate": 0.00018995060819026186, + "loss": 0.0128, "step": 145420 }, { - "epoch": 1.57, - "learning_rate": 6.417266653693973e-05, - "loss": 0.0057, + "epoch": 0.73, + "learning_rate": 0.00018994304049724784, + "loss": 0.0108, "step": 145430 }, { - "epoch": 1.57, - "learning_rate": 6.415645067133682e-05, - "loss": 0.0057, + "epoch": 0.73, + "learning_rate": 0.00018993547280423385, + "loss": 0.0138, "step": 145440 }, { - "epoch": 1.57, - "learning_rate": 6.414023480573392e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00018992790511121983, + "loss": 0.0129, "step": 145450 }, { - "epoch": 1.57, - "learning_rate": 6.412401894013102e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00018992033741820581, + "loss": 0.0134, "step": 145460 }, { - "epoch": 1.57, - "learning_rate": 6.410780307452812e-05, - "loss": 0.0082, + "epoch": 0.73, + "learning_rate": 0.00018991276972519182, + "loss": 0.0147, "step": 145470 }, { - "epoch": 1.57, - "learning_rate": 6.409158720892521e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.0001899052020321778, + "loss": 0.011, "step": 145480 }, { - "epoch": 1.57, - "learning_rate": 6.40753713433223e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00018989763433916379, + "loss": 0.0132, "step": 145490 }, { - "epoch": 1.57, - "learning_rate": 6.40591554777194e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.0001898900666461498, + "loss": 0.0127, "step": 145500 }, { - "epoch": 1.57, - "learning_rate": 6.404293961211649e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.00018988249895313578, + "loss": 0.0114, "step": 145510 }, { - "epoch": 1.57, - "learning_rate": 6.402672374651358e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00018987493126012176, + "loss": 0.0111, "step": 145520 }, { - "epoch": 1.57, - "learning_rate": 6.401050788091067e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00018986736356710777, + "loss": 0.0169, "step": 145530 }, { - "epoch": 1.57, - "learning_rate": 6.399429201530777e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00018985979587409375, + "loss": 0.0125, "step": 145540 }, { - "epoch": 1.57, - "learning_rate": 6.397807614970486e-05, - "loss": 0.0143, + "epoch": 0.73, + "learning_rate": 0.00018985222818107973, + "loss": 0.0183, "step": 145550 }, { - "epoch": 1.57, - "learning_rate": 6.396186028410195e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00018984466048806574, + "loss": 0.0129, "step": 145560 }, { - "epoch": 1.57, - "learning_rate": 6.394564441849906e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00018983709279505172, + "loss": 0.0134, "step": 145570 }, { - "epoch": 1.57, - "learning_rate": 6.392942855289615e-05, - "loss": 0.0066, + "epoch": 0.73, + "learning_rate": 0.0001898295251020377, + "loss": 0.0119, "step": 145580 }, { - "epoch": 1.57, - "learning_rate": 6.391321268729324e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.0001898219574090237, + "loss": 0.014, "step": 145590 }, { - "epoch": 1.57, - "learning_rate": 6.389699682169034e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.0001898143897160097, + "loss": 0.0116, "step": 145600 }, { - "epoch": 1.57, - "learning_rate": 6.388078095608743e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00018980682202299567, + "loss": 0.013, "step": 145610 }, { - "epoch": 1.57, - "learning_rate": 6.386456509048452e-05, - "loss": 0.0066, + "epoch": 0.73, + "learning_rate": 0.00018979925432998165, + "loss": 0.0135, "step": 145620 }, { - "epoch": 1.57, - "learning_rate": 6.384834922488161e-05, - "loss": 0.0099, + "epoch": 0.73, + "learning_rate": 0.00018979168663696766, + "loss": 0.0126, "step": 145630 }, { - "epoch": 1.57, - "learning_rate": 6.38321333592787e-05, - "loss": 0.0063, + "epoch": 0.73, + "learning_rate": 0.00018978411894395364, + "loss": 0.0169, "step": 145640 }, { - "epoch": 1.57, - "learning_rate": 6.38159174936758e-05, - "loss": 0.0059, + "epoch": 0.73, + "learning_rate": 0.00018977655125093962, + "loss": 0.0104, "step": 145650 }, { - "epoch": 1.57, - "learning_rate": 6.37997016280729e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00018976898355792563, + "loss": 0.0143, "step": 145660 }, { - "epoch": 1.57, - "learning_rate": 6.378348576247e-05, - "loss": 0.0095, + "epoch": 0.73, + "learning_rate": 0.00018976141586491161, + "loss": 0.0128, "step": 145670 }, { - "epoch": 1.57, - "learning_rate": 6.376726989686709e-05, - "loss": 0.009, + "epoch": 0.73, + "learning_rate": 0.0001897538481718976, + "loss": 0.0149, "step": 145680 }, { - "epoch": 1.57, - "learning_rate": 6.375105403126418e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.0001897462804788836, + "loss": 0.0128, "step": 145690 }, { - "epoch": 1.58, - "learning_rate": 6.373483816566128e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018973871278586959, + "loss": 0.0147, "step": 145700 }, { - "epoch": 1.58, - "learning_rate": 6.371862230005837e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018973114509285557, + "loss": 0.0128, "step": 145710 }, { - "epoch": 1.58, - "learning_rate": 6.370240643445548e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018972357739984158, + "loss": 0.0137, "step": 145720 }, { - "epoch": 1.58, - "learning_rate": 6.368619056885257e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.00018971600970682756, + "loss": 0.0156, "step": 145730 }, { - "epoch": 1.58, - "learning_rate": 6.366997470324966e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018970844201381354, + "loss": 0.0128, "step": 145740 }, { - "epoch": 1.58, - "learning_rate": 6.365375883764675e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018970087432079955, + "loss": 0.0138, "step": 145750 }, { - "epoch": 1.58, - "learning_rate": 6.363754297204385e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018969330662778553, + "loss": 0.0172, "step": 145760 }, { - "epoch": 1.58, - "learning_rate": 6.362132710644094e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.0001896857389347715, + "loss": 0.0127, "step": 145770 }, { - "epoch": 1.58, - "learning_rate": 6.360511124083803e-05, - "loss": 0.0111, + "epoch": 0.74, + "learning_rate": 0.0001896781712417575, + "loss": 0.0116, "step": 145780 }, { - "epoch": 1.58, - "learning_rate": 6.358889537523512e-05, - "loss": 0.0088, + "epoch": 0.74, + "learning_rate": 0.0001896706035487435, + "loss": 0.0107, "step": 145790 }, { - "epoch": 1.58, - "learning_rate": 6.357267950963222e-05, - "loss": 0.0098, + "epoch": 0.74, + "learning_rate": 0.00018966303585572948, + "loss": 0.0138, "step": 145800 }, { - "epoch": 1.58, - "learning_rate": 6.355646364402931e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018965546816271546, + "loss": 0.0175, "step": 145810 }, { - "epoch": 1.58, - "learning_rate": 6.35402477784264e-05, - "loss": 0.0096, + "epoch": 0.74, + "learning_rate": 0.00018964790046970147, + "loss": 0.0105, "step": 145820 }, { - "epoch": 1.58, - "learning_rate": 6.352403191282351e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018964033277668745, + "loss": 0.0113, "step": 145830 }, { - "epoch": 1.58, - "learning_rate": 6.35078160472206e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018963276508367343, + "loss": 0.0144, "step": 145840 }, { - "epoch": 1.58, - "learning_rate": 6.34916001816177e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018962519739065944, + "loss": 0.0151, "step": 145850 }, { - "epoch": 1.58, - "learning_rate": 6.347538431601479e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.00018961762969764542, + "loss": 0.0126, "step": 145860 }, { - "epoch": 1.58, - "learning_rate": 6.345916845041188e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.0001896100620046314, + "loss": 0.0119, "step": 145870 }, { - "epoch": 1.58, - "learning_rate": 6.344295258480897e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.00018960249431161741, + "loss": 0.0121, "step": 145880 }, { - "epoch": 1.58, - "learning_rate": 6.342673671920607e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.0001895949266186034, + "loss": 0.0137, "step": 145890 }, { - "epoch": 1.58, - "learning_rate": 6.341052085360316e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018958735892558938, + "loss": 0.0108, "step": 145900 }, { - "epoch": 1.58, - "learning_rate": 6.339430498800025e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.00018957979123257539, + "loss": 0.0146, "step": 145910 }, { - "epoch": 1.58, - "learning_rate": 6.337808912239734e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018957222353956137, + "loss": 0.0137, "step": 145920 }, { - "epoch": 1.58, - "learning_rate": 6.336187325679444e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018956465584654735, + "loss": 0.013, "step": 145930 }, { - "epoch": 1.58, - "learning_rate": 6.334565739119154e-05, - "loss": 0.006, + "epoch": 0.74, + "learning_rate": 0.00018955708815353333, + "loss": 0.013, "step": 145940 }, { - "epoch": 1.58, - "learning_rate": 6.332944152558864e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018954952046051934, + "loss": 0.0113, "step": 145950 }, { - "epoch": 1.58, - "learning_rate": 6.331322565998573e-05, - "loss": 0.0107, + "epoch": 0.74, + "learning_rate": 0.00018954195276750532, + "loss": 0.0143, "step": 145960 }, { - "epoch": 1.58, - "learning_rate": 6.329700979438282e-05, - "loss": 0.0057, + "epoch": 0.74, + "learning_rate": 0.0001895343850744913, + "loss": 0.0102, "step": 145970 }, { - "epoch": 1.58, - "learning_rate": 6.328079392877991e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.0001895268173814773, + "loss": 0.0118, "step": 145980 }, { - "epoch": 1.58, - "learning_rate": 6.3264578063177e-05, - "loss": 0.0088, + "epoch": 0.74, + "learning_rate": 0.0001895192496884633, + "loss": 0.0121, "step": 145990 }, { - "epoch": 1.58, - "learning_rate": 6.32483621975741e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018951168199544927, + "loss": 0.0157, "step": 146000 }, { - "epoch": 1.58, - "eval_cer": 0.921514774067685, - "eval_loss": 0.006277143489569426, - "eval_runtime": 121.0938, - "eval_samples_per_second": 16.516, - "eval_steps_per_second": 4.129, + "epoch": 0.74, + "eval_cer": 0.9144770486760401, + "eval_loss": 0.009305712766945362, + "eval_runtime": 116.6484, + "eval_samples_per_second": 17.146, + "eval_steps_per_second": 4.286, "step": 146000 }, { - "epoch": 1.58, - "learning_rate": 6.323214633197119e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018950411430243528, + "loss": 0.0103, "step": 146010 }, { - "epoch": 1.58, - "learning_rate": 6.321593046636828e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018949654660942126, + "loss": 0.0162, "step": 146020 }, { - "epoch": 1.58, - "learning_rate": 6.319971460076538e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018948897891640724, + "loss": 0.01, "step": 146030 }, { - "epoch": 1.58, - "learning_rate": 6.318349873516248e-05, - "loss": 0.0089, + "epoch": 0.74, + "learning_rate": 0.00018948141122339325, + "loss": 0.0143, "step": 146040 }, { - "epoch": 1.58, - "learning_rate": 6.316728286955958e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018947384353037923, + "loss": 0.014, "step": 146050 }, { - "epoch": 1.58, - "learning_rate": 6.315106700395667e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018946627583736522, + "loss": 0.0128, "step": 146060 }, { - "epoch": 1.58, - "learning_rate": 6.313485113835376e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.00018945870814435122, + "loss": 0.0133, "step": 146070 }, { - "epoch": 1.58, - "learning_rate": 6.311863527275085e-05, - "loss": 0.0104, + "epoch": 0.74, + "learning_rate": 0.0001894511404513372, + "loss": 0.0132, "step": 146080 }, { - "epoch": 1.58, - "learning_rate": 6.310241940714795e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.0001894435727583232, + "loss": 0.0133, "step": 146090 }, { - "epoch": 1.58, - "learning_rate": 6.308620354154504e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.0001894360050653092, + "loss": 0.0127, "step": 146100 }, { - "epoch": 1.58, - "learning_rate": 6.306998767594213e-05, - "loss": 0.0109, + "epoch": 0.74, + "learning_rate": 0.00018942843737229518, + "loss": 0.0104, "step": 146110 }, { - "epoch": 1.58, - "learning_rate": 6.305377181033923e-05, - "loss": 0.0056, + "epoch": 0.74, + "learning_rate": 0.00018942086967928116, + "loss": 0.0102, "step": 146120 }, { - "epoch": 1.58, - "learning_rate": 6.303755594473632e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018941330198626714, + "loss": 0.0129, "step": 146130 }, { - "epoch": 1.58, - "learning_rate": 6.302134007913341e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018940573429325315, + "loss": 0.0128, "step": 146140 }, { - "epoch": 1.58, - "learning_rate": 6.300512421353052e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018939816660023913, + "loss": 0.0118, "step": 146150 }, { - "epoch": 1.58, - "learning_rate": 6.298890834792761e-05, - "loss": 0.0088, + "epoch": 0.74, + "learning_rate": 0.0001893905989072251, + "loss": 0.0127, "step": 146160 }, { - "epoch": 1.58, - "learning_rate": 6.29726924823247e-05, - "loss": 0.01, + "epoch": 0.74, + "learning_rate": 0.00018938303121421112, + "loss": 0.0113, "step": 146170 }, { - "epoch": 1.58, - "learning_rate": 6.29564766167218e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.0001893754635211971, + "loss": 0.0113, "step": 146180 }, { - "epoch": 1.58, - "learning_rate": 6.294026075111889e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018936789582818308, + "loss": 0.0154, "step": 146190 }, { - "epoch": 1.58, - "learning_rate": 6.292404488551598e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.0001893603281351691, + "loss": 0.0127, "step": 146200 }, { - "epoch": 1.58, - "learning_rate": 6.290782901991307e-05, - "loss": 0.011, + "epoch": 0.74, + "learning_rate": 0.00018935276044215507, + "loss": 0.0134, "step": 146210 }, { - "epoch": 1.58, - "learning_rate": 6.289161315431017e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018934519274914105, + "loss": 0.0145, "step": 146220 }, { - "epoch": 1.58, - "learning_rate": 6.287539728870726e-05, - "loss": 0.0105, + "epoch": 0.74, + "learning_rate": 0.00018933762505612706, + "loss": 0.0145, "step": 146230 }, { - "epoch": 1.58, - "learning_rate": 6.285918142310435e-05, - "loss": 0.0093, + "epoch": 0.74, + "learning_rate": 0.00018933005736311304, + "loss": 0.0116, "step": 146240 }, { - "epoch": 1.58, - "learning_rate": 6.284296555750145e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.00018932248967009903, + "loss": 0.0126, "step": 146250 }, { - "epoch": 1.58, - "learning_rate": 6.282674969189855e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018931492197708503, + "loss": 0.0094, "step": 146260 }, { - "epoch": 1.58, - "learning_rate": 6.281053382629564e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018930735428407102, + "loss": 0.0142, "step": 146270 }, { - "epoch": 1.58, - "learning_rate": 6.279431796069274e-05, - "loss": 0.0101, + "epoch": 0.74, + "learning_rate": 0.000189299786591057, + "loss": 0.0114, "step": 146280 }, { - "epoch": 1.58, - "learning_rate": 6.277810209508983e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.00018929221889804298, + "loss": 0.0165, "step": 146290 }, { - "epoch": 1.58, - "learning_rate": 6.276188622948692e-05, - "loss": 0.0095, + "epoch": 0.74, + "learning_rate": 0.000189284651205029, + "loss": 0.0119, "step": 146300 }, { - "epoch": 1.58, - "learning_rate": 6.274567036388402e-05, - "loss": 0.0088, + "epoch": 0.74, + "learning_rate": 0.00018927708351201497, + "loss": 0.0185, "step": 146310 }, { - "epoch": 1.58, - "learning_rate": 6.272945449828111e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018926951581900095, + "loss": 0.0133, "step": 146320 }, { - "epoch": 1.58, - "learning_rate": 6.27132386326782e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.00018926194812598696, + "loss": 0.0124, "step": 146330 }, { - "epoch": 1.58, - "learning_rate": 6.26970227670753e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018925438043297294, + "loss": 0.01, "step": 146340 }, { - "epoch": 1.58, - "learning_rate": 6.268080690147239e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.00018924681273995892, + "loss": 0.0126, "step": 146350 }, { - "epoch": 1.58, - "learning_rate": 6.266459103586948e-05, - "loss": 0.008, + "epoch": 0.74, + "learning_rate": 0.00018923924504694493, + "loss": 0.0106, "step": 146360 }, { - "epoch": 1.58, - "learning_rate": 6.264837517026659e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.0001892316773539309, + "loss": 0.0127, "step": 146370 }, { - "epoch": 1.58, - "learning_rate": 6.263215930466368e-05, - "loss": 0.0088, + "epoch": 0.74, + "learning_rate": 0.0001892241096609169, + "loss": 0.0116, "step": 146380 }, { - "epoch": 1.58, - "learning_rate": 6.261594343906077e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.0001892165419679029, + "loss": 0.0138, "step": 146390 }, { - "epoch": 1.58, - "learning_rate": 6.259972757345786e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018920897427488888, + "loss": 0.015, "step": 146400 }, { - "epoch": 1.58, - "learning_rate": 6.258351170785497e-05, - "loss": 0.0106, + "epoch": 0.74, + "learning_rate": 0.00018920140658187486, + "loss": 0.0128, "step": 146410 }, { - "epoch": 1.58, - "learning_rate": 6.256729584225206e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018919383888886087, + "loss": 0.0128, "step": 146420 }, { - "epoch": 1.58, - "learning_rate": 6.255107997664916e-05, - "loss": 0.009, + "epoch": 0.74, + "learning_rate": 0.00018918627119584683, + "loss": 0.0137, "step": 146430 }, { - "epoch": 1.58, - "learning_rate": 6.253486411104625e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.0001891787035028328, + "loss": 0.0099, "step": 146440 }, { - "epoch": 1.58, - "learning_rate": 6.251864824544334e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.0001891711358098188, + "loss": 0.0089, "step": 146450 }, { - "epoch": 1.58, - "learning_rate": 6.250243237984043e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.0001891635681168048, + "loss": 0.0142, "step": 146460 }, { - "epoch": 1.58, - "learning_rate": 6.248621651423753e-05, - "loss": 0.012, + "epoch": 0.74, + "learning_rate": 0.00018915600042379078, + "loss": 0.0104, "step": 146470 }, { - "epoch": 1.58, - "learning_rate": 6.247000064863462e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018914843273077676, + "loss": 0.0111, "step": 146480 }, { - "epoch": 1.58, - "learning_rate": 6.245378478303171e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018914086503776277, + "loss": 0.0136, "step": 146490 }, { - "epoch": 1.58, - "learning_rate": 6.24375689174288e-05, - "loss": 0.0095, + "epoch": 0.74, + "learning_rate": 0.00018913329734474875, + "loss": 0.0143, "step": 146500 }, { - "epoch": 1.58, - "learning_rate": 6.24213530518259e-05, - "loss": 0.0061, + "epoch": 0.74, + "learning_rate": 0.00018912572965173473, + "loss": 0.012, "step": 146510 }, { - "epoch": 1.58, - "learning_rate": 6.2405137186223e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018911816195872071, + "loss": 0.0107, "step": 146520 }, { - "epoch": 1.58, - "learning_rate": 6.23889213206201e-05, - "loss": 0.011, + "epoch": 0.74, + "learning_rate": 0.00018911059426570672, + "loss": 0.0107, "step": 146530 }, { - "epoch": 1.58, - "learning_rate": 6.237270545501719e-05, - "loss": 0.0115, + "epoch": 0.74, + "learning_rate": 0.0001891030265726927, + "loss": 0.0127, "step": 146540 }, { - "epoch": 1.58, - "learning_rate": 6.235648958941428e-05, - "loss": 0.011, + "epoch": 0.74, + "learning_rate": 0.00018909545887967869, + "loss": 0.013, "step": 146550 }, { - "epoch": 1.58, - "learning_rate": 6.234027372381137e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.0001890878911866647, + "loss": 0.0143, "step": 146560 }, { - "epoch": 1.58, - "learning_rate": 6.232405785820847e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018908032349365068, + "loss": 0.0135, "step": 146570 }, { - "epoch": 1.58, - "learning_rate": 6.230784199260556e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018907275580063666, + "loss": 0.0128, "step": 146580 }, { - "epoch": 1.58, - "learning_rate": 6.229162612700265e-05, - "loss": 0.0063, + "epoch": 0.74, + "learning_rate": 0.00018906518810762267, + "loss": 0.0124, "step": 146590 }, { - "epoch": 1.58, - "learning_rate": 6.227541026139975e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018905762041460865, + "loss": 0.0144, "step": 146600 }, { - "epoch": 1.58, - "learning_rate": 6.225919439579684e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.00018905005272159463, + "loss": 0.0141, "step": 146610 }, { - "epoch": 1.59, - "learning_rate": 6.224297853019394e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.00018904248502858064, + "loss": 0.0121, "step": 146620 }, { - "epoch": 1.59, - "learning_rate": 6.222676266459104e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018903491733556662, + "loss": 0.0158, "step": 146630 }, { - "epoch": 1.59, - "learning_rate": 6.221054679898813e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.0001890273496425526, + "loss": 0.0117, "step": 146640 }, { - "epoch": 1.59, - "learning_rate": 6.219433093338522e-05, - "loss": 0.0064, + "epoch": 0.74, + "learning_rate": 0.0001890197819495386, + "loss": 0.0097, "step": 146650 }, { - "epoch": 1.59, - "learning_rate": 6.217811506778232e-05, - "loss": 0.0063, + "epoch": 0.74, + "learning_rate": 0.0001890122142565246, + "loss": 0.0161, "step": 146660 }, { - "epoch": 1.59, - "learning_rate": 6.216189920217941e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018900464656351057, + "loss": 0.0094, "step": 146670 }, { - "epoch": 1.59, - "learning_rate": 6.21456833365765e-05, - "loss": 0.0061, + "epoch": 0.74, + "learning_rate": 0.00018899707887049655, + "loss": 0.013, "step": 146680 }, { - "epoch": 1.59, - "learning_rate": 6.21294674709736e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018898951117748256, + "loss": 0.015, "step": 146690 }, { - "epoch": 1.59, - "learning_rate": 6.211325160537069e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018898194348446854, + "loss": 0.0135, "step": 146700 }, { - "epoch": 1.59, - "learning_rate": 6.209703573976778e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018897437579145452, + "loss": 0.0152, "step": 146710 }, { - "epoch": 1.59, - "learning_rate": 6.208081987416487e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018896680809844053, + "loss": 0.0142, "step": 146720 }, { - "epoch": 1.59, - "learning_rate": 6.206460400856198e-05, - "loss": 0.0062, + "epoch": 0.74, + "learning_rate": 0.00018895924040542651, + "loss": 0.014, "step": 146730 }, { - "epoch": 1.59, - "learning_rate": 6.204838814295907e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.0001889516727124125, + "loss": 0.0123, "step": 146740 }, { - "epoch": 1.59, - "learning_rate": 6.203217227735616e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.0001889441050193985, + "loss": 0.0142, "step": 146750 }, { - "epoch": 1.59, - "learning_rate": 6.201595641175326e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018893653732638449, + "loss": 0.0121, "step": 146760 }, { - "epoch": 1.59, - "learning_rate": 6.199974054615035e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018892896963337047, + "loss": 0.0116, "step": 146770 }, { - "epoch": 1.59, - "learning_rate": 6.198352468054744e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.00018892140194035648, + "loss": 0.0117, "step": 146780 }, { - "epoch": 1.59, - "learning_rate": 6.196730881494453e-05, - "loss": 0.0063, + "epoch": 0.74, + "learning_rate": 0.00018891383424734246, + "loss": 0.0113, "step": 146790 }, { - "epoch": 1.59, - "learning_rate": 6.195109294934163e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018890626655432844, + "loss": 0.0107, "step": 146800 }, { - "epoch": 1.59, - "learning_rate": 6.193487708373872e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.00018889869886131445, + "loss": 0.0138, "step": 146810 }, { - "epoch": 1.59, - "learning_rate": 6.191866121813581e-05, - "loss": 0.008, + "epoch": 0.74, + "learning_rate": 0.00018889113116830043, + "loss": 0.013, "step": 146820 }, { - "epoch": 1.59, - "learning_rate": 6.19024453525329e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.0001888835634752864, + "loss": 0.0139, "step": 146830 }, { - "epoch": 1.59, - "learning_rate": 6.188622948693001e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.0001888759957822724, + "loss": 0.0129, "step": 146840 }, { - "epoch": 1.59, - "learning_rate": 6.18700136213271e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.0001888684280892584, + "loss": 0.0121, "step": 146850 }, { - "epoch": 1.59, - "learning_rate": 6.18537977557242e-05, - "loss": 0.0124, + "epoch": 0.74, + "learning_rate": 0.00018886086039624438, + "loss": 0.0145, "step": 146860 }, { - "epoch": 1.59, - "learning_rate": 6.183758189012129e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018885329270323036, + "loss": 0.0144, "step": 146870 }, { - "epoch": 1.59, - "learning_rate": 6.182136602451838e-05, - "loss": 0.01, + "epoch": 0.74, + "learning_rate": 0.00018884572501021637, + "loss": 0.0156, "step": 146880 }, { - "epoch": 1.59, - "learning_rate": 6.180515015891548e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018883815731720235, + "loss": 0.0133, "step": 146890 }, { - "epoch": 1.59, - "learning_rate": 6.178893429331257e-05, - "loss": 0.008, + "epoch": 0.74, + "learning_rate": 0.00018883058962418833, + "loss": 0.0132, "step": 146900 }, { - "epoch": 1.59, - "learning_rate": 6.177271842770966e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018882302193117434, + "loss": 0.0141, "step": 146910 }, { - "epoch": 1.59, - "learning_rate": 6.175650256210675e-05, - "loss": 0.006, + "epoch": 0.74, + "learning_rate": 0.00018881545423816032, + "loss": 0.0138, "step": 146920 }, { - "epoch": 1.59, - "learning_rate": 6.174028669650385e-05, - "loss": 0.0062, + "epoch": 0.74, + "learning_rate": 0.0001888078865451463, + "loss": 0.0111, "step": 146930 }, { - "epoch": 1.59, - "learning_rate": 6.172407083090094e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018880031885213231, + "loss": 0.0111, "step": 146940 }, { - "epoch": 1.59, - "learning_rate": 6.170785496529805e-05, - "loss": 0.0065, + "epoch": 0.74, + "learning_rate": 0.0001887927511591183, + "loss": 0.0135, "step": 146950 }, { - "epoch": 1.59, - "learning_rate": 6.169163909969514e-05, - "loss": 0.008, + "epoch": 0.74, + "learning_rate": 0.00018878518346610428, + "loss": 0.0141, "step": 146960 }, { - "epoch": 1.59, - "learning_rate": 6.167542323409223e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018877761577309029, + "loss": 0.0126, "step": 146970 }, { - "epoch": 1.59, - "learning_rate": 6.165920736848932e-05, - "loss": 0.0064, + "epoch": 0.74, + "learning_rate": 0.00018877004808007627, + "loss": 0.0121, "step": 146980 }, { - "epoch": 1.59, - "learning_rate": 6.164299150288642e-05, - "loss": 0.0063, + "epoch": 0.74, + "learning_rate": 0.00018876248038706225, + "loss": 0.0122, "step": 146990 }, { - "epoch": 1.59, - "learning_rate": 6.162677563728351e-05, - "loss": 0.0091, + "epoch": 0.74, + "learning_rate": 0.00018875491269404826, + "loss": 0.0125, "step": 147000 }, { - "epoch": 1.59, - "eval_cer": 0.9215234600972488, - "eval_loss": 0.006228927057236433, - "eval_runtime": 121.1059, - "eval_samples_per_second": 16.514, - "eval_steps_per_second": 4.129, + "epoch": 0.74, + "eval_cer": 0.914457640753532, + "eval_loss": 0.009390231221914291, + "eval_runtime": 115.7292, + "eval_samples_per_second": 17.282, + "eval_steps_per_second": 4.32, "step": 147000 }, { - "epoch": 1.59, - "learning_rate": 6.16105597716806e-05, - "loss": 0.0088, + "epoch": 0.74, + "learning_rate": 0.00018874734500103424, + "loss": 0.0168, "step": 147010 }, { - "epoch": 1.59, - "learning_rate": 6.15943439060777e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018873977730802022, + "loss": 0.0153, "step": 147020 }, { - "epoch": 1.59, - "learning_rate": 6.157812804047479e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.0001887322096150062, + "loss": 0.0142, "step": 147030 }, { - "epoch": 1.59, - "learning_rate": 6.156191217487188e-05, - "loss": 0.0063, + "epoch": 0.74, + "learning_rate": 0.0001887246419219922, + "loss": 0.0138, "step": 147040 }, { - "epoch": 1.59, - "learning_rate": 6.154569630926899e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.0001887170742289782, + "loss": 0.0144, "step": 147050 }, { - "epoch": 1.59, - "learning_rate": 6.152948044366608e-05, - "loss": 0.0062, + "epoch": 0.74, + "learning_rate": 0.00018870950653596417, + "loss": 0.0118, "step": 147060 }, { - "epoch": 1.59, - "learning_rate": 6.151326457806317e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018870193884295018, + "loss": 0.0128, "step": 147070 }, { - "epoch": 1.59, - "learning_rate": 6.149704871246026e-05, - "loss": 0.0093, + "epoch": 0.74, + "learning_rate": 0.00018869437114993616, + "loss": 0.0133, "step": 147080 }, { - "epoch": 1.59, - "learning_rate": 6.148083284685736e-05, - "loss": 0.0057, + "epoch": 0.74, + "learning_rate": 0.00018868680345692214, + "loss": 0.0148, "step": 147090 }, { - "epoch": 1.59, - "learning_rate": 6.146461698125446e-05, - "loss": 0.005, + "epoch": 0.74, + "learning_rate": 0.00018867923576390815, + "loss": 0.013, "step": 147100 }, { - "epoch": 1.59, - "learning_rate": 6.144840111565156e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018867166807089413, + "loss": 0.0122, "step": 147110 }, { - "epoch": 1.59, - "learning_rate": 6.143218525004865e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018866410037788012, + "loss": 0.0137, "step": 147120 }, { - "epoch": 1.59, - "learning_rate": 6.141596938444574e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018865653268486612, + "loss": 0.0127, "step": 147130 }, { - "epoch": 1.59, - "learning_rate": 6.139975351884283e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.0001886489649918521, + "loss": 0.0151, "step": 147140 }, { - "epoch": 1.59, - "learning_rate": 6.138353765323993e-05, - "loss": 0.0065, + "epoch": 0.74, + "learning_rate": 0.0001886413972988381, + "loss": 0.0145, "step": 147150 }, { - "epoch": 1.59, - "learning_rate": 6.136732178763702e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.0001886338296058241, + "loss": 0.0142, "step": 147160 }, { - "epoch": 1.59, - "learning_rate": 6.135110592203411e-05, - "loss": 0.0055, + "epoch": 0.74, + "learning_rate": 0.00018862626191281008, + "loss": 0.0187, "step": 147170 }, { - "epoch": 1.59, - "learning_rate": 6.13348900564312e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018861869421979606, + "loss": 0.0136, "step": 147180 }, { - "epoch": 1.59, - "learning_rate": 6.13186741908283e-05, - "loss": 0.0106, + "epoch": 0.74, + "learning_rate": 0.00018861112652678204, + "loss": 0.0119, "step": 147190 }, { - "epoch": 1.59, - "learning_rate": 6.13024583252254e-05, - "loss": 0.0089, + "epoch": 0.74, + "learning_rate": 0.00018860355883376805, + "loss": 0.0126, "step": 147200 }, { - "epoch": 1.59, - "learning_rate": 6.12862424596225e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018859599114075403, + "loss": 0.0126, "step": 147210 }, { - "epoch": 1.59, - "learning_rate": 6.127002659401959e-05, - "loss": 0.0097, + "epoch": 0.74, + "learning_rate": 0.00018858842344774, + "loss": 0.0144, "step": 147220 }, { - "epoch": 1.59, - "learning_rate": 6.125381072841668e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018858085575472602, + "loss": 0.0143, "step": 147230 }, { - "epoch": 1.59, - "learning_rate": 6.123759486281378e-05, - "loss": 0.0057, + "epoch": 0.74, + "learning_rate": 0.000188573288061712, + "loss": 0.0139, "step": 147240 }, { - "epoch": 1.59, - "learning_rate": 6.122137899721087e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018856572036869798, + "loss": 0.0123, "step": 147250 }, { - "epoch": 1.59, - "learning_rate": 6.120516313160796e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.000188558152675684, + "loss": 0.0161, "step": 147260 }, { - "epoch": 1.59, - "learning_rate": 6.118894726600505e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018855058498266997, + "loss": 0.0156, "step": 147270 }, { - "epoch": 1.59, - "learning_rate": 6.117273140040215e-05, - "loss": 0.0059, + "epoch": 0.74, + "learning_rate": 0.00018854301728965595, + "loss": 0.0119, "step": 147280 }, { - "epoch": 1.59, - "learning_rate": 6.115651553479924e-05, - "loss": 0.0065, + "epoch": 0.74, + "learning_rate": 0.00018853544959664196, + "loss": 0.0136, "step": 147290 }, { - "epoch": 1.59, - "learning_rate": 6.114029966919633e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018852788190362794, + "loss": 0.0152, "step": 147300 }, { - "epoch": 1.59, - "learning_rate": 6.112408380359344e-05, - "loss": 0.0063, + "epoch": 0.74, + "learning_rate": 0.00018852031421061393, + "loss": 0.0135, "step": 147310 }, { - "epoch": 1.59, - "learning_rate": 6.110786793799053e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018851274651759993, + "loss": 0.0117, "step": 147320 }, { - "epoch": 1.59, - "learning_rate": 6.109165207238762e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018850517882458592, + "loss": 0.0136, "step": 147330 }, { - "epoch": 1.59, - "learning_rate": 6.107543620678472e-05, - "loss": 0.0088, + "epoch": 0.74, + "learning_rate": 0.0001884976111315719, + "loss": 0.0143, "step": 147340 }, { - "epoch": 1.59, - "learning_rate": 6.105922034118181e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.00018849004343855788, + "loss": 0.0097, "step": 147350 }, { - "epoch": 1.59, - "learning_rate": 6.10430044755789e-05, - "loss": 0.0099, + "epoch": 0.74, + "learning_rate": 0.0001884824757455439, + "loss": 0.0157, "step": 147360 }, { - "epoch": 1.59, - "learning_rate": 6.1026788609975995e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018847490805252987, + "loss": 0.0125, "step": 147370 }, { - "epoch": 1.59, - "learning_rate": 6.101057274437309e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018846734035951585, + "loss": 0.0113, "step": 147380 }, { - "epoch": 1.59, - "learning_rate": 6.099435687877019e-05, - "loss": 0.009, + "epoch": 0.74, + "learning_rate": 0.00018845977266650186, + "loss": 0.0133, "step": 147390 }, { - "epoch": 1.59, - "learning_rate": 6.097814101316728e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018845220497348784, + "loss": 0.0119, "step": 147400 }, { - "epoch": 1.59, - "learning_rate": 6.096192514756437e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018844463728047382, + "loss": 0.0108, "step": 147410 }, { - "epoch": 1.59, - "learning_rate": 6.0945709281961465e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018843706958745983, + "loss": 0.0169, "step": 147420 }, { - "epoch": 1.59, - "learning_rate": 6.092949341635856e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.0001884295018944458, + "loss": 0.0117, "step": 147430 }, { - "epoch": 1.59, - "learning_rate": 6.091327755075565e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.0001884219342014318, + "loss": 0.0177, "step": 147440 }, { - "epoch": 1.59, - "learning_rate": 6.089706168515275e-05, - "loss": 0.009, + "epoch": 0.74, + "learning_rate": 0.0001884143665084178, + "loss": 0.0168, "step": 147450 }, { - "epoch": 1.59, - "learning_rate": 6.088084581954984e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018840679881540378, + "loss": 0.0136, "step": 147460 }, { - "epoch": 1.59, - "learning_rate": 6.0864629953946936e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018839923112238976, + "loss": 0.0131, "step": 147470 }, { - "epoch": 1.59, - "learning_rate": 6.084841408834403e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018839166342937577, + "loss": 0.0133, "step": 147480 }, { - "epoch": 1.59, - "learning_rate": 6.083219822274112e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018838409573636175, + "loss": 0.0148, "step": 147490 }, { - "epoch": 1.59, - "learning_rate": 6.081598235713822e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018837652804334774, + "loss": 0.0119, "step": 147500 }, { - "epoch": 1.59, - "learning_rate": 6.0799766491535314e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018836896035033374, + "loss": 0.0116, "step": 147510 }, { - "epoch": 1.59, - "learning_rate": 6.0783550625932406e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018836139265731973, + "loss": 0.011, "step": 147520 }, { - "epoch": 1.59, - "learning_rate": 6.07673347603295e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.0001883538249643057, + "loss": 0.0143, "step": 147530 }, { - "epoch": 1.59, - "learning_rate": 6.075111889472659e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.0001883462572712917, + "loss": 0.0133, "step": 147540 }, { - "epoch": 1.6, - "learning_rate": 6.073490302912369e-05, - "loss": 0.009, + "epoch": 0.74, + "learning_rate": 0.0001883386895782777, + "loss": 0.0136, "step": 147550 }, { - "epoch": 1.6, - "learning_rate": 6.0718687163520784e-05, - "loss": 0.008, + "epoch": 0.74, + "learning_rate": 0.00018833112188526368, + "loss": 0.0161, "step": 147560 }, { - "epoch": 1.6, - "learning_rate": 6.070247129791788e-05, - "loss": 0.0052, + "epoch": 0.74, + "learning_rate": 0.00018832355419224966, + "loss": 0.0123, "step": 147570 }, { - "epoch": 1.6, - "learning_rate": 6.068625543231497e-05, - "loss": 0.0063, + "epoch": 0.74, + "learning_rate": 0.00018831598649923567, + "loss": 0.0163, "step": 147580 }, { - "epoch": 1.6, - "learning_rate": 6.067003956671206e-05, - "loss": 0.0095, + "epoch": 0.74, + "learning_rate": 0.00018830841880622165, + "loss": 0.0165, "step": 147590 }, { - "epoch": 1.6, - "learning_rate": 6.0653823701109155e-05, - "loss": 0.0064, + "epoch": 0.74, + "learning_rate": 0.00018830085111320763, + "loss": 0.0138, "step": 147600 }, { - "epoch": 1.6, - "learning_rate": 6.0637607835506255e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018829328342019364, + "loss": 0.0126, "step": 147610 }, { - "epoch": 1.6, - "learning_rate": 6.062139196990335e-05, - "loss": 0.0061, + "epoch": 0.74, + "learning_rate": 0.00018828571572717962, + "loss": 0.0133, "step": 147620 }, { - "epoch": 1.6, - "learning_rate": 6.060517610430044e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.0001882781480341656, + "loss": 0.0129, "step": 147630 }, { - "epoch": 1.6, - "learning_rate": 6.058896023869753e-05, - "loss": 0.0052, + "epoch": 0.74, + "learning_rate": 0.0001882705803411516, + "loss": 0.014, "step": 147640 }, { - "epoch": 1.6, - "learning_rate": 6.0572744373094626e-05, - "loss": 0.0089, + "epoch": 0.74, + "learning_rate": 0.0001882630126481376, + "loss": 0.0203, "step": 147650 }, { - "epoch": 1.6, - "learning_rate": 6.0556528507491725e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018825544495512357, + "loss": 0.0125, "step": 147660 }, { - "epoch": 1.6, - "learning_rate": 6.054031264188882e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.00018824787726210958, + "loss": 0.0102, "step": 147670 }, { - "epoch": 1.6, - "learning_rate": 6.052409677628591e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.00018824030956909556, + "loss": 0.0194, "step": 147680 }, { - "epoch": 1.6, - "learning_rate": 6.0507880910683003e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018823274187608152, + "loss": 0.0132, "step": 147690 }, { - "epoch": 1.6, - "learning_rate": 6.0491665045080096e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.0001882251741830675, + "loss": 0.0143, "step": 147700 }, { - "epoch": 1.6, - "learning_rate": 6.047544917947719e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.0001882176064900535, + "loss": 0.0124, "step": 147710 }, { - "epoch": 1.6, - "learning_rate": 6.045923331387429e-05, - "loss": 0.0064, + "epoch": 0.75, + "learning_rate": 0.0001882100387970395, + "loss": 0.0128, "step": 147720 }, { - "epoch": 1.6, - "learning_rate": 6.044301744827138e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018820247110402547, + "loss": 0.0116, "step": 147730 }, { - "epoch": 1.6, - "learning_rate": 6.0426801582668474e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018819490341101145, + "loss": 0.0126, "step": 147740 }, { - "epoch": 1.6, - "learning_rate": 6.041058571706557e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018818733571799746, + "loss": 0.0118, "step": 147750 }, { - "epoch": 1.6, - "learning_rate": 6.039436985146266e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018817976802498344, + "loss": 0.0131, "step": 147760 }, { - "epoch": 1.6, - "learning_rate": 6.037815398585976e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018817220033196942, + "loss": 0.0151, "step": 147770 }, { - "epoch": 1.6, - "learning_rate": 6.036193812025685e-05, - "loss": 0.0088, + "epoch": 0.75, + "learning_rate": 0.00018816463263895543, + "loss": 0.0143, "step": 147780 }, { - "epoch": 1.6, - "learning_rate": 6.0345722254653944e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018815706494594141, + "loss": 0.0139, "step": 147790 }, { - "epoch": 1.6, - "learning_rate": 6.032950638905104e-05, - "loss": 0.0082, + "epoch": 0.75, + "learning_rate": 0.0001881494972529274, + "loss": 0.0103, "step": 147800 }, { - "epoch": 1.6, - "learning_rate": 6.031329052344813e-05, - "loss": 0.0108, + "epoch": 0.75, + "learning_rate": 0.0001881419295599134, + "loss": 0.0167, "step": 147810 }, { - "epoch": 1.6, - "learning_rate": 6.0297074657845236e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018813436186689939, + "loss": 0.0122, "step": 147820 }, { - "epoch": 1.6, - "learning_rate": 6.028085879224233e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018812679417388537, + "loss": 0.011, "step": 147830 }, { - "epoch": 1.6, - "learning_rate": 6.026464292663942e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.00018811922648087138, + "loss": 0.0152, "step": 147840 }, { - "epoch": 1.6, - "learning_rate": 6.0248427061036514e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018811165878785736, + "loss": 0.0138, "step": 147850 }, { - "epoch": 1.6, - "learning_rate": 6.0232211195433614e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018810409109484334, + "loss": 0.0142, "step": 147860 }, { - "epoch": 1.6, - "learning_rate": 6.021599532983071e-05, - "loss": 0.0083, + "epoch": 0.75, + "learning_rate": 0.00018809652340182935, + "loss": 0.0131, "step": 147870 }, { - "epoch": 1.6, - "learning_rate": 6.01997794642278e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.00018808895570881533, + "loss": 0.0126, "step": 147880 }, { - "epoch": 1.6, - "learning_rate": 6.018356359862489e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.0001880813880158013, + "loss": 0.0138, "step": 147890 }, { - "epoch": 1.6, - "learning_rate": 6.0167347733021985e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018807382032278732, + "loss": 0.0108, "step": 147900 }, { - "epoch": 1.6, - "learning_rate": 6.015113186741908e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.0001880662526297733, + "loss": 0.0136, "step": 147910 }, { - "epoch": 1.6, - "learning_rate": 6.013491600181618e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018805868493675928, + "loss": 0.0121, "step": 147920 }, { - "epoch": 1.6, - "learning_rate": 6.011870013621327e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.00018805111724374526, + "loss": 0.0116, "step": 147930 }, { - "epoch": 1.6, - "learning_rate": 6.010248427061036e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.00018804354955073127, + "loss": 0.0122, "step": 147940 }, { - "epoch": 1.6, - "learning_rate": 6.0086268405007455e-05, - "loss": 0.0089, + "epoch": 0.75, + "learning_rate": 0.00018803598185771725, + "loss": 0.0095, "step": 147950 }, { - "epoch": 1.6, - "learning_rate": 6.007005253940455e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018802841416470323, + "loss": 0.0169, "step": 147960 }, { - "epoch": 1.6, - "learning_rate": 6.005383667380165e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018802084647168924, + "loss": 0.0119, "step": 147970 }, { - "epoch": 1.6, - "learning_rate": 6.003762080819874e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018801327877867522, + "loss": 0.0121, "step": 147980 }, { - "epoch": 1.6, - "learning_rate": 6.002140494259583e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.0001880057110856612, + "loss": 0.0152, "step": 147990 }, { - "epoch": 1.6, - "learning_rate": 6.0005189076992926e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.00018799814339264721, + "loss": 0.0136, "step": 148000 }, { - "epoch": 1.6, - "eval_cer": 0.9215364891415945, - "eval_loss": 0.006136965937912464, - "eval_runtime": 121.1416, - "eval_samples_per_second": 16.51, - "eval_steps_per_second": 4.127, + "epoch": 0.75, + "eval_cer": 0.9144741374876638, + "eval_loss": 0.009097721427679062, + "eval_runtime": 116.6762, + "eval_samples_per_second": 17.141, + "eval_steps_per_second": 4.285, "step": 148000 }, { - "epoch": 1.6, - "learning_rate": 5.998897321139002e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.0001879905756996332, + "loss": 0.016, "step": 148010 }, { - "epoch": 1.6, - "learning_rate": 5.997275734578711e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.00018798300800661918, + "loss": 0.0138, "step": 148020 }, { - "epoch": 1.6, - "learning_rate": 5.995654148018421e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018797544031360519, + "loss": 0.0145, "step": 148030 }, { - "epoch": 1.6, - "learning_rate": 5.9940325614581304e-05, - "loss": 0.0059, + "epoch": 0.75, + "learning_rate": 0.00018796787262059117, + "loss": 0.0128, "step": 148040 }, { - "epoch": 1.6, - "learning_rate": 5.9924109748978396e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018796030492757715, + "loss": 0.0167, "step": 148050 }, { - "epoch": 1.6, - "learning_rate": 5.990789388337549e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018795273723456316, + "loss": 0.0175, "step": 148060 }, { - "epoch": 1.6, - "learning_rate": 5.989167801777258e-05, - "loss": 0.0102, + "epoch": 0.75, + "learning_rate": 0.00018794516954154914, + "loss": 0.0136, "step": 148070 }, { - "epoch": 1.6, - "learning_rate": 5.987546215216968e-05, - "loss": 0.0062, + "epoch": 0.75, + "learning_rate": 0.00018793760184853512, + "loss": 0.0129, "step": 148080 }, { - "epoch": 1.6, - "learning_rate": 5.9859246286566774e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.0001879300341555211, + "loss": 0.0146, "step": 148090 }, { - "epoch": 1.6, - "learning_rate": 5.984303042096387e-05, - "loss": 0.0055, + "epoch": 0.75, + "learning_rate": 0.0001879224664625071, + "loss": 0.0162, "step": 148100 }, { - "epoch": 1.6, - "learning_rate": 5.982681455536096e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.0001879148987694931, + "loss": 0.0122, "step": 148110 }, { - "epoch": 1.6, - "learning_rate": 5.981059868975805e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.00018790733107647907, + "loss": 0.0128, "step": 148120 }, { - "epoch": 1.6, - "learning_rate": 5.979438282415515e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.00018789976338346508, + "loss": 0.0124, "step": 148130 }, { - "epoch": 1.6, - "learning_rate": 5.9778166958552245e-05, - "loss": 0.0202, + "epoch": 0.75, + "learning_rate": 0.00018789219569045106, + "loss": 0.0112, "step": 148140 }, { - "epoch": 1.6, - "learning_rate": 5.976195109294934e-05, - "loss": 0.01, + "epoch": 0.75, + "learning_rate": 0.00018788462799743704, + "loss": 0.0116, "step": 148150 }, { - "epoch": 1.6, - "learning_rate": 5.974573522734643e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018787706030442305, + "loss": 0.0113, "step": 148160 }, { - "epoch": 1.6, - "learning_rate": 5.972951936174352e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018786949261140903, + "loss": 0.0106, "step": 148170 }, { - "epoch": 1.6, - "learning_rate": 5.9713303496140616e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018786192491839502, + "loss": 0.012, "step": 148180 }, { - "epoch": 1.6, - "learning_rate": 5.9697087630537715e-05, - "loss": 0.0095, + "epoch": 0.75, + "learning_rate": 0.00018785435722538102, + "loss": 0.013, "step": 148190 }, { - "epoch": 1.6, - "learning_rate": 5.968087176493481e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.000187846789532367, + "loss": 0.0164, "step": 148200 }, { - "epoch": 1.6, - "learning_rate": 5.96646558993319e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.000187839221839353, + "loss": 0.011, "step": 148210 }, { - "epoch": 1.6, - "learning_rate": 5.964844003372899e-05, - "loss": 0.0064, + "epoch": 0.75, + "learning_rate": 0.000187831654146339, + "loss": 0.017, "step": 148220 }, { - "epoch": 1.6, - "learning_rate": 5.9632224168126086e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018782408645332498, + "loss": 0.015, "step": 148230 }, { - "epoch": 1.6, - "learning_rate": 5.9616008302523186e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018781651876031096, + "loss": 0.0115, "step": 148240 }, { - "epoch": 1.6, - "learning_rate": 5.959979243692028e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.00018780895106729694, + "loss": 0.0114, "step": 148250 }, { - "epoch": 1.6, - "learning_rate": 5.958357657131737e-05, - "loss": 0.0105, + "epoch": 0.75, + "learning_rate": 0.00018780138337428295, + "loss": 0.0139, "step": 148260 }, { - "epoch": 1.6, - "learning_rate": 5.9567360705714464e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018779381568126893, + "loss": 0.0115, "step": 148270 }, { - "epoch": 1.6, - "learning_rate": 5.9551144840111557e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.0001877862479882549, + "loss": 0.0128, "step": 148280 }, { - "epoch": 1.6, - "learning_rate": 5.9534928974508656e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.00018777868029524092, + "loss": 0.0121, "step": 148290 }, { - "epoch": 1.6, - "learning_rate": 5.951871310890575e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.0001877711126022269, + "loss": 0.0134, "step": 148300 }, { - "epoch": 1.6, - "learning_rate": 5.950249724330284e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018776354490921288, + "loss": 0.0091, "step": 148310 }, { - "epoch": 1.6, - "learning_rate": 5.9486281377699934e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.0001877559772161989, + "loss": 0.0105, "step": 148320 }, { - "epoch": 1.6, - "learning_rate": 5.947006551209703e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.00018774840952318487, + "loss": 0.0131, "step": 148330 }, { - "epoch": 1.6, - "learning_rate": 5.945384964649412e-05, - "loss": 0.0059, + "epoch": 0.75, + "learning_rate": 0.00018774084183017085, + "loss": 0.0114, "step": 148340 }, { - "epoch": 1.6, - "learning_rate": 5.943763378089122e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018773327413715686, + "loss": 0.0142, "step": 148350 }, { - "epoch": 1.6, - "learning_rate": 5.942141791528831e-05, - "loss": 0.0105, + "epoch": 0.75, + "learning_rate": 0.00018772570644414284, + "loss": 0.012, "step": 148360 }, { - "epoch": 1.6, - "learning_rate": 5.9405202049685405e-05, - "loss": 0.0059, + "epoch": 0.75, + "learning_rate": 0.00018771813875112883, + "loss": 0.0122, "step": 148370 }, { - "epoch": 1.6, - "learning_rate": 5.93889861840825e-05, - "loss": 0.0083, + "epoch": 0.75, + "learning_rate": 0.00018771057105811483, + "loss": 0.0123, "step": 148380 }, { - "epoch": 1.6, - "learning_rate": 5.937277031847959e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.00018770300336510082, + "loss": 0.0134, "step": 148390 }, { - "epoch": 1.6, - "learning_rate": 5.935655445287669e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.0001876954356720868, + "loss": 0.0158, "step": 148400 }, { - "epoch": 1.6, - "learning_rate": 5.934033858727378e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.0001876878679790728, + "loss": 0.0137, "step": 148410 }, { - "epoch": 1.6, - "learning_rate": 5.9324122721670875e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.0001876803002860588, + "loss": 0.0114, "step": 148420 }, { - "epoch": 1.6, - "learning_rate": 5.930790685606797e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.00018767273259304477, + "loss": 0.0125, "step": 148430 }, { - "epoch": 1.6, - "learning_rate": 5.929169099046506e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018766516490003075, + "loss": 0.0134, "step": 148440 }, { - "epoch": 1.6, - "learning_rate": 5.9275475124862154e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018765759720701676, + "loss": 0.0123, "step": 148450 }, { - "epoch": 1.6, - "learning_rate": 5.925925925925925e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018765002951400274, + "loss": 0.0112, "step": 148460 }, { - "epoch": 1.61, - "learning_rate": 5.9243043393656346e-05, - "loss": 0.0096, + "epoch": 0.75, + "learning_rate": 0.00018764246182098872, + "loss": 0.0111, "step": 148470 }, { - "epoch": 1.61, - "learning_rate": 5.922682752805344e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018763489412797473, + "loss": 0.012, "step": 148480 }, { - "epoch": 1.61, - "learning_rate": 5.921061166245053e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.0001876273264349607, + "loss": 0.0116, "step": 148490 }, { - "epoch": 1.61, - "learning_rate": 5.9194395796847624e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.0001876197587419467, + "loss": 0.0145, "step": 148500 }, { - "epoch": 1.61, - "learning_rate": 5.9178179931244724e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.0001876121910489327, + "loss": 0.0133, "step": 148510 }, { - "epoch": 1.61, - "learning_rate": 5.9161964065641816e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.00018760462335591868, + "loss": 0.011, "step": 148520 }, { - "epoch": 1.61, - "learning_rate": 5.914574820003891e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018759705566290466, + "loss": 0.0161, "step": 148530 }, { - "epoch": 1.61, - "learning_rate": 5.912953233443601e-05, - "loss": 0.0095, + "epoch": 0.75, + "learning_rate": 0.00018758948796989067, + "loss": 0.0134, "step": 148540 }, { - "epoch": 1.61, - "learning_rate": 5.911331646883311e-05, - "loss": 0.0083, + "epoch": 0.75, + "learning_rate": 0.00018758192027687665, + "loss": 0.0102, "step": 148550 }, { - "epoch": 1.61, - "learning_rate": 5.90971006032302e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018757435258386264, + "loss": 0.0115, "step": 148560 }, { - "epoch": 1.61, - "learning_rate": 5.9080884737627294e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.00018756678489084864, + "loss": 0.0123, "step": 148570 }, { - "epoch": 1.61, - "learning_rate": 5.9064668872024386e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018755921719783463, + "loss": 0.0123, "step": 148580 }, { - "epoch": 1.61, - "learning_rate": 5.904845300642148e-05, - "loss": 0.0102, + "epoch": 0.75, + "learning_rate": 0.0001875516495048206, + "loss": 0.0108, "step": 148590 }, { - "epoch": 1.61, - "learning_rate": 5.903223714081857e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.0001875440818118066, + "loss": 0.0125, "step": 148600 }, { - "epoch": 1.61, - "learning_rate": 5.901602127521567e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.0001875365141187926, + "loss": 0.0115, "step": 148610 }, { - "epoch": 1.61, - "learning_rate": 5.8999805409612764e-05, - "loss": 0.0084, + "epoch": 0.75, + "learning_rate": 0.00018752894642577858, + "loss": 0.0128, "step": 148620 }, { - "epoch": 1.61, - "learning_rate": 5.898358954400986e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018752137873276456, + "loss": 0.0118, "step": 148630 }, { - "epoch": 1.61, - "learning_rate": 5.896737367840695e-05, - "loss": 0.0094, + "epoch": 0.75, + "learning_rate": 0.00018751381103975057, + "loss": 0.0169, "step": 148640 }, { - "epoch": 1.61, - "learning_rate": 5.895115781280404e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018750624334673655, + "loss": 0.014, "step": 148650 }, { - "epoch": 1.61, - "learning_rate": 5.893494194720114e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.00018749867565372253, + "loss": 0.0177, "step": 148660 }, { - "epoch": 1.61, - "learning_rate": 5.8918726081598235e-05, - "loss": 0.006, + "epoch": 0.75, + "learning_rate": 0.00018749110796070854, + "loss": 0.0156, "step": 148670 }, { - "epoch": 1.61, - "learning_rate": 5.890251021599533e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018748354026769452, + "loss": 0.015, "step": 148680 }, { - "epoch": 1.61, - "learning_rate": 5.888629435039242e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.0001874759725746805, + "loss": 0.0136, "step": 148690 }, { - "epoch": 1.61, - "learning_rate": 5.887007848478951e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.0001874684048816665, + "loss": 0.0124, "step": 148700 }, { - "epoch": 1.61, - "learning_rate": 5.885386261918661e-05, - "loss": 0.0059, + "epoch": 0.75, + "learning_rate": 0.0001874608371886525, + "loss": 0.0119, "step": 148710 }, { - "epoch": 1.61, - "learning_rate": 5.8837646753583705e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018745326949563847, + "loss": 0.0102, "step": 148720 }, { - "epoch": 1.61, - "learning_rate": 5.88214308879808e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.00018744570180262448, + "loss": 0.0105, "step": 148730 }, { - "epoch": 1.61, - "learning_rate": 5.880521502237789e-05, - "loss": 0.0104, + "epoch": 0.75, + "learning_rate": 0.00018743813410961046, + "loss": 0.0094, "step": 148740 }, { - "epoch": 1.61, - "learning_rate": 5.878899915677498e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018743056641659645, + "loss": 0.0146, "step": 148750 }, { - "epoch": 1.61, - "learning_rate": 5.8772783291172076e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018742299872358243, + "loss": 0.011, "step": 148760 }, { - "epoch": 1.61, - "learning_rate": 5.8756567425569176e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018741543103056844, + "loss": 0.0125, "step": 148770 }, { - "epoch": 1.61, - "learning_rate": 5.874035155996627e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018740786333755442, + "loss": 0.0189, "step": 148780 }, { - "epoch": 1.61, - "learning_rate": 5.872413569436336e-05, - "loss": 0.011, + "epoch": 0.75, + "learning_rate": 0.0001874002956445404, + "loss": 0.0137, "step": 148790 }, { - "epoch": 1.61, - "learning_rate": 5.8707919828760454e-05, - "loss": 0.0082, + "epoch": 0.75, + "learning_rate": 0.0001873927279515264, + "loss": 0.0113, "step": 148800 }, { - "epoch": 1.61, - "learning_rate": 5.8691703963157547e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.0001873851602585124, + "loss": 0.013, "step": 148810 }, { - "epoch": 1.61, - "learning_rate": 5.8675488097554646e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018737759256549837, + "loss": 0.0116, "step": 148820 }, { - "epoch": 1.61, - "learning_rate": 5.865927223195174e-05, - "loss": 0.0056, + "epoch": 0.75, + "learning_rate": 0.00018737002487248438, + "loss": 0.0098, "step": 148830 }, { - "epoch": 1.61, - "learning_rate": 5.864305636634883e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018736245717947036, + "loss": 0.0136, "step": 148840 }, { - "epoch": 1.61, - "learning_rate": 5.8626840500745924e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018735488948645634, + "loss": 0.0115, "step": 148850 }, { - "epoch": 1.61, - "learning_rate": 5.861062463514302e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018734732179344235, + "loss": 0.012, "step": 148860 }, { - "epoch": 1.61, - "learning_rate": 5.8594408769540117e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018733975410042833, + "loss": 0.0108, "step": 148870 }, { - "epoch": 1.61, - "learning_rate": 5.857819290393721e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.0001873321864074143, + "loss": 0.0124, "step": 148880 }, { - "epoch": 1.61, - "learning_rate": 5.85619770383343e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018732461871440032, + "loss": 0.012, "step": 148890 }, { - "epoch": 1.61, - "learning_rate": 5.8545761172731395e-05, - "loss": 0.0084, + "epoch": 0.75, + "learning_rate": 0.0001873170510213863, + "loss": 0.0123, "step": 148900 }, { - "epoch": 1.61, - "learning_rate": 5.852954530712849e-05, - "loss": 0.0053, + "epoch": 0.75, + "learning_rate": 0.00018730948332837228, + "loss": 0.0141, "step": 148910 }, { - "epoch": 1.61, - "learning_rate": 5.851332944152558e-05, - "loss": 0.0107, + "epoch": 0.75, + "learning_rate": 0.00018730191563535827, + "loss": 0.0228, "step": 148920 }, { - "epoch": 1.61, - "learning_rate": 5.849711357592268e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018729434794234427, + "loss": 0.0132, "step": 148930 }, { - "epoch": 1.61, - "learning_rate": 5.848089771031977e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018728678024933026, + "loss": 0.0147, "step": 148940 }, { - "epoch": 1.61, - "learning_rate": 5.8464681844716865e-05, - "loss": 0.0091, + "epoch": 0.75, + "learning_rate": 0.0001872792125563162, + "loss": 0.0122, "step": 148950 }, { - "epoch": 1.61, - "learning_rate": 5.844846597911396e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018727164486330222, + "loss": 0.0163, "step": 148960 }, { - "epoch": 1.61, - "learning_rate": 5.843225011351105e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.0001872640771702882, + "loss": 0.0108, "step": 148970 }, { - "epoch": 1.61, - "learning_rate": 5.841603424790815e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018725650947727418, + "loss": 0.0169, "step": 148980 }, { - "epoch": 1.61, - "learning_rate": 5.839981838230524e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.00018724894178426016, + "loss": 0.0163, "step": 148990 }, { - "epoch": 1.61, - "learning_rate": 5.8383602516702336e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018724137409124617, + "loss": 0.019, "step": 149000 }, { - "epoch": 1.61, - "eval_cer": 0.9215234600972488, - "eval_loss": 0.006172089837491512, - "eval_runtime": 121.2213, - "eval_samples_per_second": 16.499, - "eval_steps_per_second": 4.125, + "epoch": 0.75, + "eval_cer": 0.9144751078837893, + "eval_loss": 0.009037774056196213, + "eval_runtime": 116.6835, + "eval_samples_per_second": 17.14, + "eval_steps_per_second": 4.285, "step": 149000 }, { - "epoch": 1.61, - "learning_rate": 5.836738665109943e-05, - "loss": 0.009, + "epoch": 0.75, + "learning_rate": 0.00018723380639823215, + "loss": 0.0123, "step": 149010 }, { - "epoch": 1.61, - "learning_rate": 5.835117078549652e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.00018722623870521813, + "loss": 0.013, "step": 149020 }, { - "epoch": 1.61, - "learning_rate": 5.8334954919893614e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018721867101220414, + "loss": 0.0146, "step": 149030 }, { - "epoch": 1.61, - "learning_rate": 5.8318739054290713e-05, - "loss": 0.0056, + "epoch": 0.75, + "learning_rate": 0.00018721110331919012, + "loss": 0.0126, "step": 149040 }, { - "epoch": 1.61, - "learning_rate": 5.8302523188687806e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.0001872035356261761, + "loss": 0.0105, "step": 149050 }, { - "epoch": 1.61, - "learning_rate": 5.82863073230849e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018719596793316211, + "loss": 0.0149, "step": 149060 }, { - "epoch": 1.61, - "learning_rate": 5.827009145748199e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.0001871884002401481, + "loss": 0.0138, "step": 149070 }, { - "epoch": 1.61, - "learning_rate": 5.8253875591879084e-05, - "loss": 0.0088, + "epoch": 0.75, + "learning_rate": 0.00018718083254713408, + "loss": 0.0135, "step": 149080 }, { - "epoch": 1.61, - "learning_rate": 5.8237659726276184e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018717326485412009, + "loss": 0.0127, "step": 149090 }, { - "epoch": 1.61, - "learning_rate": 5.822144386067328e-05, - "loss": 0.0117, + "epoch": 0.75, + "learning_rate": 0.00018716569716110607, + "loss": 0.0153, "step": 149100 }, { - "epoch": 1.61, - "learning_rate": 5.820522799507037e-05, - "loss": 0.0091, + "epoch": 0.75, + "learning_rate": 0.00018715812946809205, + "loss": 0.0154, "step": 149110 }, { - "epoch": 1.61, - "learning_rate": 5.818901212946746e-05, - "loss": 0.0083, + "epoch": 0.75, + "learning_rate": 0.00018715056177507806, + "loss": 0.0151, "step": 149120 }, { - "epoch": 1.61, - "learning_rate": 5.8172796263864555e-05, - "loss": 0.008, + "epoch": 0.75, + "learning_rate": 0.00018714299408206404, + "loss": 0.0149, "step": 149130 }, { - "epoch": 1.61, - "learning_rate": 5.8156580398261654e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018713542638905002, + "loss": 0.0113, "step": 149140 }, { - "epoch": 1.61, - "learning_rate": 5.814036453265875e-05, - "loss": 0.0096, + "epoch": 0.75, + "learning_rate": 0.000187127858696036, + "loss": 0.0185, "step": 149150 }, { - "epoch": 1.61, - "learning_rate": 5.812414866705584e-05, - "loss": 0.0094, + "epoch": 0.75, + "learning_rate": 0.000187120291003022, + "loss": 0.0144, "step": 149160 }, { - "epoch": 1.61, - "learning_rate": 5.810793280145293e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.000187112723310008, + "loss": 0.0124, "step": 149170 }, { - "epoch": 1.61, - "learning_rate": 5.8091716935850025e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.00018710515561699397, + "loss": 0.0121, "step": 149180 }, { - "epoch": 1.61, - "learning_rate": 5.807550107024712e-05, - "loss": 0.0059, + "epoch": 0.75, + "learning_rate": 0.00018709758792397998, + "loss": 0.0129, "step": 149190 }, { - "epoch": 1.61, - "learning_rate": 5.805928520464422e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018709002023096596, + "loss": 0.0101, "step": 149200 }, { - "epoch": 1.61, - "learning_rate": 5.804306933904131e-05, - "loss": 0.0113, + "epoch": 0.75, + "learning_rate": 0.00018708245253795194, + "loss": 0.0137, "step": 149210 }, { - "epoch": 1.61, - "learning_rate": 5.80268534734384e-05, - "loss": 0.0097, + "epoch": 0.75, + "learning_rate": 0.00018707488484493795, + "loss": 0.0132, "step": 149220 }, { - "epoch": 1.61, - "learning_rate": 5.8010637607835496e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.00018706731715192393, + "loss": 0.0107, "step": 149230 }, { - "epoch": 1.61, - "learning_rate": 5.799442174223259e-05, - "loss": 0.0089, + "epoch": 0.75, + "learning_rate": 0.00018705974945890992, + "loss": 0.0129, "step": 149240 }, { - "epoch": 1.61, - "learning_rate": 5.797820587662969e-05, - "loss": 0.006, + "epoch": 0.75, + "learning_rate": 0.00018705218176589592, + "loss": 0.0107, "step": 149250 }, { - "epoch": 1.61, - "learning_rate": 5.796199001102679e-05, - "loss": 0.0105, + "epoch": 0.75, + "learning_rate": 0.0001870446140728819, + "loss": 0.0149, "step": 149260 }, { - "epoch": 1.61, - "learning_rate": 5.794577414542388e-05, - "loss": 0.0062, + "epoch": 0.75, + "learning_rate": 0.0001870370463798679, + "loss": 0.011, "step": 149270 }, { - "epoch": 1.61, - "learning_rate": 5.792955827982097e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.0001870294786868539, + "loss": 0.012, "step": 149280 }, { - "epoch": 1.61, - "learning_rate": 5.791334241421807e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018702191099383988, + "loss": 0.0133, "step": 149290 }, { - "epoch": 1.61, - "learning_rate": 5.7897126548615165e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018701434330082586, + "loss": 0.0115, "step": 149300 }, { - "epoch": 1.61, - "learning_rate": 5.788091068301226e-05, - "loss": 0.0091, + "epoch": 0.75, + "learning_rate": 0.00018700677560781184, + "loss": 0.0155, "step": 149310 }, { - "epoch": 1.61, - "learning_rate": 5.786469481740935e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018699920791479785, + "loss": 0.0124, "step": 149320 }, { - "epoch": 1.61, - "learning_rate": 5.7848478951806444e-05, - "loss": 0.0094, + "epoch": 0.75, + "learning_rate": 0.00018699164022178383, + "loss": 0.0129, "step": 149330 }, { - "epoch": 1.61, - "learning_rate": 5.7832263086203536e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.0001869840725287698, + "loss": 0.012, "step": 149340 }, { - "epoch": 1.61, - "learning_rate": 5.7816047220600636e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018697650483575582, + "loss": 0.0114, "step": 149350 }, { - "epoch": 1.61, - "learning_rate": 5.779983135499773e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.0001869689371427418, + "loss": 0.0147, "step": 149360 }, { - "epoch": 1.61, - "learning_rate": 5.778361548939482e-05, - "loss": 0.0089, + "epoch": 0.75, + "learning_rate": 0.00018696136944972778, + "loss": 0.0151, "step": 149370 }, { - "epoch": 1.61, - "learning_rate": 5.7767399623791914e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.0001869538017567138, + "loss": 0.015, "step": 149380 }, { - "epoch": 1.61, - "learning_rate": 5.775118375818901e-05, - "loss": 0.0045, + "epoch": 0.75, + "learning_rate": 0.00018694623406369977, + "loss": 0.0155, "step": 149390 }, { - "epoch": 1.62, - "learning_rate": 5.7734967892586106e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018693866637068575, + "loss": 0.0161, "step": 149400 }, { - "epoch": 1.62, - "learning_rate": 5.77187520269832e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.00018693109867767176, + "loss": 0.0122, "step": 149410 }, { - "epoch": 1.62, - "learning_rate": 5.770253616138029e-05, - "loss": 0.006, + "epoch": 0.75, + "learning_rate": 0.00018692353098465774, + "loss": 0.0132, "step": 149420 }, { - "epoch": 1.62, - "learning_rate": 5.7686320295777385e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018691596329164373, + "loss": 0.0129, "step": 149430 }, { - "epoch": 1.62, - "learning_rate": 5.767010443017448e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.00018690839559862973, + "loss": 0.018, "step": 149440 }, { - "epoch": 1.62, - "learning_rate": 5.765388856457158e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018690082790561572, + "loss": 0.0137, "step": 149450 }, { - "epoch": 1.62, - "learning_rate": 5.763767269896867e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.0001868932602126017, + "loss": 0.0142, "step": 149460 }, { - "epoch": 1.62, - "learning_rate": 5.762145683336576e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.0001868856925195877, + "loss": 0.0145, "step": 149470 }, { - "epoch": 1.62, - "learning_rate": 5.7605240967762855e-05, - "loss": 0.0097, + "epoch": 0.75, + "learning_rate": 0.0001868781248265737, + "loss": 0.0095, "step": 149480 }, { - "epoch": 1.62, - "learning_rate": 5.758902510215995e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018687055713355967, + "loss": 0.0127, "step": 149490 }, { - "epoch": 1.62, - "learning_rate": 5.757280923655704e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.00018686298944054565, + "loss": 0.0162, "step": 149500 }, { - "epoch": 1.62, - "learning_rate": 5.755659337095414e-05, - "loss": 0.0089, + "epoch": 0.75, + "learning_rate": 0.00018685542174753166, + "loss": 0.0174, "step": 149510 }, { - "epoch": 1.62, - "learning_rate": 5.754037750535123e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018684785405451764, + "loss": 0.0115, "step": 149520 }, { - "epoch": 1.62, - "learning_rate": 5.7524161639748326e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018684028636150362, + "loss": 0.0126, "step": 149530 }, { - "epoch": 1.62, - "learning_rate": 5.750794577414542e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.00018683271866848963, + "loss": 0.0129, "step": 149540 }, { - "epoch": 1.62, - "learning_rate": 5.749172990854251e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.0001868251509754756, + "loss": 0.0121, "step": 149550 }, { - "epoch": 1.62, - "learning_rate": 5.747551404293961e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.0001868175832824616, + "loss": 0.0121, "step": 149560 }, { - "epoch": 1.62, - "learning_rate": 5.7459298177336703e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.0001868100155894476, + "loss": 0.0166, "step": 149570 }, { - "epoch": 1.62, - "learning_rate": 5.7443082311733796e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018680244789643358, + "loss": 0.0095, "step": 149580 }, { - "epoch": 1.62, - "learning_rate": 5.742686644613089e-05, - "loss": 0.0106, + "epoch": 0.75, + "learning_rate": 0.00018679488020341956, + "loss": 0.0134, "step": 149590 }, { - "epoch": 1.62, - "learning_rate": 5.741065058052798e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018678731251040557, + "loss": 0.0108, "step": 149600 }, { - "epoch": 1.62, - "learning_rate": 5.7394434714925074e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.00018677974481739155, + "loss": 0.0167, "step": 149610 }, { - "epoch": 1.62, - "learning_rate": 5.7378218849322174e-05, - "loss": 0.0095, + "epoch": 0.75, + "learning_rate": 0.00018677217712437754, + "loss": 0.0141, "step": 149620 }, { - "epoch": 1.62, - "learning_rate": 5.736200298371927e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018676460943136354, + "loss": 0.0117, "step": 149630 }, { - "epoch": 1.62, - "learning_rate": 5.734578711811636e-05, - "loss": 0.0097, + "epoch": 0.75, + "learning_rate": 0.00018675704173834953, + "loss": 0.0113, "step": 149640 }, { - "epoch": 1.62, - "learning_rate": 5.732957125251345e-05, - "loss": 0.011, + "epoch": 0.76, + "learning_rate": 0.0001867494740453355, + "loss": 0.0172, "step": 149650 }, { - "epoch": 1.62, - "learning_rate": 5.7313355386910545e-05, - "loss": 0.0098, + "epoch": 0.76, + "learning_rate": 0.0001867419063523215, + "loss": 0.0099, "step": 149660 }, { - "epoch": 1.62, - "learning_rate": 5.7297139521307644e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.0001867343386593075, + "loss": 0.0109, "step": 149670 }, { - "epoch": 1.62, - "learning_rate": 5.728092365570474e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018672677096629348, + "loss": 0.0152, "step": 149680 }, { - "epoch": 1.62, - "learning_rate": 5.726470779010183e-05, - "loss": 0.0091, + "epoch": 0.76, + "learning_rate": 0.00018671920327327946, + "loss": 0.0152, "step": 149690 }, { - "epoch": 1.62, - "learning_rate": 5.724849192449892e-05, - "loss": 0.0108, + "epoch": 0.76, + "learning_rate": 0.00018671163558026547, + "loss": 0.0116, "step": 149700 }, { - "epoch": 1.62, - "learning_rate": 5.7232276058896015e-05, - "loss": 0.0108, + "epoch": 0.76, + "learning_rate": 0.00018670406788725145, + "loss": 0.0138, "step": 149710 }, { - "epoch": 1.62, - "learning_rate": 5.7216060193293115e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018669650019423743, + "loss": 0.0166, "step": 149720 }, { - "epoch": 1.62, - "learning_rate": 5.719984432769021e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.00018668893250122344, + "loss": 0.0128, "step": 149730 }, { - "epoch": 1.62, - "learning_rate": 5.71836284620873e-05, - "loss": 0.0084, + "epoch": 0.76, + "learning_rate": 0.00018668136480820942, + "loss": 0.0136, "step": 149740 }, { - "epoch": 1.62, - "learning_rate": 5.716741259648439e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.0001866737971151954, + "loss": 0.0126, "step": 149750 }, { - "epoch": 1.62, - "learning_rate": 5.7151196730881486e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.0001866662294221814, + "loss": 0.0147, "step": 149760 }, { - "epoch": 1.62, - "learning_rate": 5.713498086527858e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.0001866586617291674, + "loss": 0.0118, "step": 149770 }, { - "epoch": 1.62, - "learning_rate": 5.711876499967568e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018665109403615337, + "loss": 0.0116, "step": 149780 }, { - "epoch": 1.62, - "learning_rate": 5.710254913407277e-05, - "loss": 0.0089, + "epoch": 0.76, + "learning_rate": 0.00018664352634313938, + "loss": 0.0117, "step": 149790 }, { - "epoch": 1.62, - "learning_rate": 5.7086333268469864e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018663595865012536, + "loss": 0.0152, "step": 149800 }, { - "epoch": 1.62, - "learning_rate": 5.7070117402866956e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018662839095711135, + "loss": 0.0135, "step": 149810 }, { - "epoch": 1.62, - "learning_rate": 5.705390153726405e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018662082326409733, + "loss": 0.0131, "step": 149820 }, { - "epoch": 1.62, - "learning_rate": 5.703768567166115e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.00018661325557108334, + "loss": 0.0165, "step": 149830 }, { - "epoch": 1.62, - "learning_rate": 5.702146980605824e-05, - "loss": 0.009, + "epoch": 0.76, + "learning_rate": 0.00018660568787806932, + "loss": 0.0147, "step": 149840 }, { - "epoch": 1.62, - "learning_rate": 5.7005253940455334e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.0001865981201850553, + "loss": 0.0125, "step": 149850 }, { - "epoch": 1.62, - "learning_rate": 5.698903807485243e-05, - "loss": 0.0125, + "epoch": 0.76, + "learning_rate": 0.0001865905524920413, + "loss": 0.0152, "step": 149860 }, { - "epoch": 1.62, - "learning_rate": 5.697282220924952e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.0001865829847990273, + "loss": 0.0146, "step": 149870 }, { - "epoch": 1.62, - "learning_rate": 5.695660634364662e-05, - "loss": 0.009, + "epoch": 0.76, + "learning_rate": 0.00018657541710601327, + "loss": 0.0148, "step": 149880 }, { - "epoch": 1.62, - "learning_rate": 5.694039047804371e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018656784941299928, + "loss": 0.0123, "step": 149890 }, { - "epoch": 1.62, - "learning_rate": 5.6924174612440805e-05, - "loss": 0.009, + "epoch": 0.76, + "learning_rate": 0.00018656028171998526, + "loss": 0.0121, "step": 149900 }, { - "epoch": 1.62, - "learning_rate": 5.69079587468379e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018655271402697124, + "loss": 0.0144, "step": 149910 }, { - "epoch": 1.62, - "learning_rate": 5.689174288123499e-05, - "loss": 0.0091, + "epoch": 0.76, + "learning_rate": 0.00018654514633395725, + "loss": 0.0161, "step": 149920 }, { - "epoch": 1.62, - "learning_rate": 5.687552701563208e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.00018653757864094323, + "loss": 0.0126, "step": 149930 }, { - "epoch": 1.62, - "learning_rate": 5.685931115002918e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.0001865300109479292, + "loss": 0.0218, "step": 149940 }, { - "epoch": 1.62, - "learning_rate": 5.6843095284426275e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018652244325491522, + "loss": 0.0143, "step": 149950 }, { - "epoch": 1.62, - "learning_rate": 5.682687941882337e-05, - "loss": 0.0093, + "epoch": 0.76, + "learning_rate": 0.0001865148755619012, + "loss": 0.0144, "step": 149960 }, { - "epoch": 1.62, - "learning_rate": 5.681066355322046e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018650730786888718, + "loss": 0.0104, "step": 149970 }, { - "epoch": 1.62, - "learning_rate": 5.679444768761757e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.0001864997401758732, + "loss": 0.0141, "step": 149980 }, { - "epoch": 1.62, - "learning_rate": 5.677823182201466e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018649217248285917, + "loss": 0.014, "step": 149990 }, { - "epoch": 1.62, - "learning_rate": 5.676201595641175e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018648460478984516, + "loss": 0.012, "step": 150000 }, { - "epoch": 1.62, - "eval_cer": 0.9215086938469904, - "eval_loss": 0.006060704588890076, - "eval_runtime": 121.178, - "eval_samples_per_second": 16.505, - "eval_steps_per_second": 4.126, + "epoch": 0.76, + "eval_cer": 0.9144857822411687, + "eval_loss": 0.008926572278141975, + "eval_runtime": 116.0551, + "eval_samples_per_second": 17.233, + "eval_steps_per_second": 4.308, "step": 150000 }, { - "epoch": 1.62, - "learning_rate": 5.6745800090808845e-05, - "loss": 0.0092, + "epoch": 0.76, + "learning_rate": 0.00018647703709683114, + "loss": 0.0139, "step": 150010 }, { - "epoch": 1.62, - "learning_rate": 5.672958422520594e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018646946940381715, + "loss": 0.0121, "step": 150020 }, { - "epoch": 1.62, - "learning_rate": 5.671336835960304e-05, - "loss": 0.0049, + "epoch": 0.76, + "learning_rate": 0.00018646190171080313, + "loss": 0.0115, "step": 150030 }, { - "epoch": 1.62, - "learning_rate": 5.669715249400013e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.0001864543340177891, + "loss": 0.0109, "step": 150040 }, { - "epoch": 1.62, - "learning_rate": 5.668093662839722e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018644676632477512, + "loss": 0.0137, "step": 150050 }, { - "epoch": 1.62, - "learning_rate": 5.6664720762794316e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.0001864391986317611, + "loss": 0.0137, "step": 150060 }, { - "epoch": 1.62, - "learning_rate": 5.664850489719141e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018643163093874708, + "loss": 0.015, "step": 150070 }, { - "epoch": 1.62, - "learning_rate": 5.66322890315885e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.0001864240632457331, + "loss": 0.0114, "step": 150080 }, { - "epoch": 1.62, - "learning_rate": 5.66160731659856e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.00018641649555271907, + "loss": 0.0102, "step": 150090 }, { - "epoch": 1.62, - "learning_rate": 5.659985730038269e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018640892785970505, + "loss": 0.0133, "step": 150100 }, { - "epoch": 1.62, - "learning_rate": 5.6583641434779786e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.00018640136016669106, + "loss": 0.0132, "step": 150110 }, { - "epoch": 1.62, - "learning_rate": 5.656742556917688e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.00018639379247367704, + "loss": 0.012, "step": 150120 }, { - "epoch": 1.62, - "learning_rate": 5.655120970357397e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.00018638622478066302, + "loss": 0.0124, "step": 150130 }, { - "epoch": 1.62, - "learning_rate": 5.653499383797107e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.00018637865708764903, + "loss": 0.0113, "step": 150140 }, { - "epoch": 1.62, - "learning_rate": 5.6518777972368164e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.000186371089394635, + "loss": 0.0131, "step": 150150 }, { - "epoch": 1.62, - "learning_rate": 5.650256210676526e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.000186363521701621, + "loss": 0.0122, "step": 150160 }, { - "epoch": 1.62, - "learning_rate": 5.648634624116235e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018635595400860698, + "loss": 0.0127, "step": 150170 }, { - "epoch": 1.62, - "learning_rate": 5.647013037555944e-05, - "loss": 0.0114, + "epoch": 0.76, + "learning_rate": 0.00018634838631559298, + "loss": 0.0116, "step": 150180 }, { - "epoch": 1.62, - "learning_rate": 5.6453914509956535e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018634081862257897, + "loss": 0.0137, "step": 150190 }, { - "epoch": 1.62, - "learning_rate": 5.6437698644353634e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.00018633325092956492, + "loss": 0.0133, "step": 150200 }, { - "epoch": 1.62, - "learning_rate": 5.642148277875073e-05, - "loss": 0.0116, + "epoch": 0.76, + "learning_rate": 0.0001863256832365509, + "loss": 0.0131, "step": 150210 }, { - "epoch": 1.62, - "learning_rate": 5.640526691314782e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.0001863181155435369, + "loss": 0.0157, "step": 150220 }, { - "epoch": 1.62, - "learning_rate": 5.638905104754491e-05, - "loss": 0.0082, + "epoch": 0.76, + "learning_rate": 0.0001863105478505229, + "loss": 0.0153, "step": 150230 }, { - "epoch": 1.62, - "learning_rate": 5.6372835181942005e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.00018630298015750887, + "loss": 0.0136, "step": 150240 }, { - "epoch": 1.62, - "learning_rate": 5.6356619316339105e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018629541246449488, + "loss": 0.0134, "step": 150250 }, { - "epoch": 1.62, - "learning_rate": 5.63404034507362e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.00018628784477148086, + "loss": 0.0107, "step": 150260 }, { - "epoch": 1.62, - "learning_rate": 5.632418758513329e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018628027707846684, + "loss": 0.0121, "step": 150270 }, { - "epoch": 1.62, - "learning_rate": 5.630797171953038e-05, - "loss": 0.0086, + "epoch": 0.76, + "learning_rate": 0.00018627270938545285, + "loss": 0.0164, "step": 150280 }, { - "epoch": 1.62, - "learning_rate": 5.6291755853927476e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018626514169243883, + "loss": 0.0144, "step": 150290 }, { - "epoch": 1.62, - "learning_rate": 5.6275539988324575e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.00018625757399942482, + "loss": 0.0094, "step": 150300 }, { - "epoch": 1.62, - "learning_rate": 5.625932412272167e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.00018625000630641082, + "loss": 0.014, "step": 150310 }, { - "epoch": 1.63, - "learning_rate": 5.624310825711876e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.0001862424386133968, + "loss": 0.0117, "step": 150320 }, { - "epoch": 1.63, - "learning_rate": 5.6226892391515854e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.0001862348709203828, + "loss": 0.0151, "step": 150330 }, { - "epoch": 1.63, - "learning_rate": 5.6210676525912946e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.0001862273032273688, + "loss": 0.0137, "step": 150340 }, { - "epoch": 1.63, - "learning_rate": 5.619446066031004e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018621973553435478, + "loss": 0.0163, "step": 150350 }, { - "epoch": 1.63, - "learning_rate": 5.617824479470714e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.00018621216784134076, + "loss": 0.0098, "step": 150360 }, { - "epoch": 1.63, - "learning_rate": 5.616202892910423e-05, - "loss": 0.0091, + "epoch": 0.76, + "learning_rate": 0.00018620460014832677, + "loss": 0.0141, "step": 150370 }, { - "epoch": 1.63, - "learning_rate": 5.6145813063501324e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.00018619703245531275, + "loss": 0.0116, "step": 150380 }, { - "epoch": 1.63, - "learning_rate": 5.612959719789842e-05, - "loss": 0.0082, + "epoch": 0.76, + "learning_rate": 0.00018618946476229873, + "loss": 0.0127, "step": 150390 }, { - "epoch": 1.63, - "learning_rate": 5.611338133229551e-05, - "loss": 0.0086, + "epoch": 0.76, + "learning_rate": 0.0001861818970692847, + "loss": 0.0108, "step": 150400 }, { - "epoch": 1.63, - "learning_rate": 5.609716546669261e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018617432937627072, + "loss": 0.0158, "step": 150410 }, { - "epoch": 1.63, - "learning_rate": 5.60809496010897e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.0001861667616832567, + "loss": 0.0146, "step": 150420 }, { - "epoch": 1.63, - "learning_rate": 5.6064733735486795e-05, - "loss": 0.0084, + "epoch": 0.76, + "learning_rate": 0.00018615919399024268, + "loss": 0.0151, "step": 150430 }, { - "epoch": 1.63, - "learning_rate": 5.604851786988389e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.0001861516262972287, + "loss": 0.0123, "step": 150440 }, { - "epoch": 1.63, - "learning_rate": 5.603230200428098e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018614405860421467, + "loss": 0.0136, "step": 150450 }, { - "epoch": 1.63, - "learning_rate": 5.601608613867808e-05, - "loss": 0.0052, + "epoch": 0.76, + "learning_rate": 0.00018613649091120066, + "loss": 0.0167, "step": 150460 }, { - "epoch": 1.63, - "learning_rate": 5.599987027307517e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.00018612892321818666, + "loss": 0.0133, "step": 150470 }, { - "epoch": 1.63, - "learning_rate": 5.5983654407472265e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.00018612135552517264, + "loss": 0.0115, "step": 150480 }, { - "epoch": 1.63, - "learning_rate": 5.596743854186936e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018611378783215863, + "loss": 0.0131, "step": 150490 }, { - "epoch": 1.63, - "learning_rate": 5.595122267626645e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018610622013914463, + "loss": 0.0169, "step": 150500 }, { - "epoch": 1.63, - "learning_rate": 5.593500681066354e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018609865244613062, + "loss": 0.014, "step": 150510 }, { - "epoch": 1.63, - "learning_rate": 5.591879094506064e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.0001860910847531166, + "loss": 0.0155, "step": 150520 }, { - "epoch": 1.63, - "learning_rate": 5.5902575079457736e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.0001860835170601026, + "loss": 0.0136, "step": 150530 }, { - "epoch": 1.63, - "learning_rate": 5.588635921385483e-05, - "loss": 0.0081, + "epoch": 0.76, + "learning_rate": 0.0001860759493670886, + "loss": 0.0115, "step": 150540 }, { - "epoch": 1.63, - "learning_rate": 5.587014334825192e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.00018606838167407457, + "loss": 0.0092, "step": 150550 }, { - "epoch": 1.63, - "learning_rate": 5.5853927482649014e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018606081398106055, + "loss": 0.0118, "step": 150560 }, { - "epoch": 1.63, - "learning_rate": 5.583771161704611e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018605324628804656, + "loss": 0.0131, "step": 150570 }, { - "epoch": 1.63, - "learning_rate": 5.5821495751443206e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.00018604567859503254, + "loss": 0.0131, "step": 150580 }, { - "epoch": 1.63, - "learning_rate": 5.58052798858403e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018603811090201852, + "loss": 0.0128, "step": 150590 }, { - "epoch": 1.63, - "learning_rate": 5.578906402023739e-05, - "loss": 0.0092, + "epoch": 0.76, + "learning_rate": 0.00018603054320900453, + "loss": 0.0138, "step": 150600 }, { - "epoch": 1.63, - "learning_rate": 5.5772848154634484e-05, - "loss": 0.0081, + "epoch": 0.76, + "learning_rate": 0.0001860229755159905, + "loss": 0.0117, "step": 150610 }, { - "epoch": 1.63, - "learning_rate": 5.575663228903158e-05, - "loss": 0.0045, + "epoch": 0.76, + "learning_rate": 0.0001860154078229765, + "loss": 0.0149, "step": 150620 }, { - "epoch": 1.63, - "learning_rate": 5.5740416423428677e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.0001860078401299625, + "loss": 0.0148, "step": 150630 }, { - "epoch": 1.63, - "learning_rate": 5.572420055782577e-05, - "loss": 0.0107, + "epoch": 0.76, + "learning_rate": 0.00018600027243694848, + "loss": 0.0143, "step": 150640 }, { - "epoch": 1.63, - "learning_rate": 5.570798469222286e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.00018599270474393447, + "loss": 0.0151, "step": 150650 }, { - "epoch": 1.63, - "learning_rate": 5.5691768826619955e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018598513705092047, + "loss": 0.0116, "step": 150660 }, { - "epoch": 1.63, - "learning_rate": 5.567555296101705e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018597756935790646, + "loss": 0.0146, "step": 150670 }, { - "epoch": 1.63, - "learning_rate": 5.565933709541415e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.00018597000166489244, + "loss": 0.0112, "step": 150680 }, { - "epoch": 1.63, - "learning_rate": 5.564312122981124e-05, - "loss": 0.0092, + "epoch": 0.76, + "learning_rate": 0.00018596243397187845, + "loss": 0.0105, "step": 150690 }, { - "epoch": 1.63, - "learning_rate": 5.562690536420834e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.00018595486627886443, + "loss": 0.0139, "step": 150700 }, { - "epoch": 1.63, - "learning_rate": 5.561068949860543e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.0001859472985858504, + "loss": 0.0105, "step": 150710 }, { - "epoch": 1.63, - "learning_rate": 5.559447363300253e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.0001859397308928364, + "loss": 0.0125, "step": 150720 }, { - "epoch": 1.63, - "learning_rate": 5.5578257767399624e-05, - "loss": 0.0074, + "epoch": 0.76, + "learning_rate": 0.0001859321631998224, + "loss": 0.012, "step": 150730 }, { - "epoch": 1.63, - "learning_rate": 5.556204190179672e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.00018592459550680838, + "loss": 0.0114, "step": 150740 }, { - "epoch": 1.63, - "learning_rate": 5.554582603619381e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.00018591702781379436, + "loss": 0.0129, "step": 150750 }, { - "epoch": 1.63, - "learning_rate": 5.55296101705909e-05, - "loss": 0.0125, + "epoch": 0.76, + "learning_rate": 0.00018590946012078037, + "loss": 0.0112, "step": 150760 }, { - "epoch": 1.63, - "learning_rate": 5.5513394304987995e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018590189242776635, + "loss": 0.0135, "step": 150770 }, { - "epoch": 1.63, - "learning_rate": 5.5497178439385095e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018589432473475233, + "loss": 0.0138, "step": 150780 }, { - "epoch": 1.63, - "learning_rate": 5.548096257378219e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018588675704173834, + "loss": 0.0158, "step": 150790 }, { - "epoch": 1.63, - "learning_rate": 5.546474670817928e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018587918934872432, + "loss": 0.0143, "step": 150800 }, { - "epoch": 1.63, - "learning_rate": 5.544853084257637e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.0001858716216557103, + "loss": 0.0139, "step": 150810 }, { - "epoch": 1.63, - "learning_rate": 5.5432314976973466e-05, - "loss": 0.0097, + "epoch": 0.76, + "learning_rate": 0.0001858640539626963, + "loss": 0.0118, "step": 150820 }, { - "epoch": 1.63, - "learning_rate": 5.5416099111370565e-05, - "loss": 0.0052, + "epoch": 0.76, + "learning_rate": 0.0001858564862696823, + "loss": 0.0112, "step": 150830 }, { - "epoch": 1.63, - "learning_rate": 5.539988324576766e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.00018584891857666828, + "loss": 0.0104, "step": 150840 }, { - "epoch": 1.63, - "learning_rate": 5.538366738016475e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018584135088365428, + "loss": 0.0118, "step": 150850 }, { - "epoch": 1.63, - "learning_rate": 5.5367451514561844e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.00018583378319064027, + "loss": 0.0122, "step": 150860 }, { - "epoch": 1.63, - "learning_rate": 5.5351235648958936e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018582621549762625, + "loss": 0.0142, "step": 150870 }, { - "epoch": 1.63, - "learning_rate": 5.5335019783356036e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018581864780461226, + "loss": 0.0119, "step": 150880 }, { - "epoch": 1.63, - "learning_rate": 5.531880391775313e-05, - "loss": 0.0056, + "epoch": 0.76, + "learning_rate": 0.00018581108011159824, + "loss": 0.0122, "step": 150890 }, { - "epoch": 1.63, - "learning_rate": 5.530258805215022e-05, - "loss": 0.0091, + "epoch": 0.76, + "learning_rate": 0.00018580351241858422, + "loss": 0.0147, "step": 150900 }, { - "epoch": 1.63, - "learning_rate": 5.5286372186547314e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.0001857959447255702, + "loss": 0.0147, "step": 150910 }, { - "epoch": 1.63, - "learning_rate": 5.527015632094441e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.0001857883770325562, + "loss": 0.0139, "step": 150920 }, { - "epoch": 1.63, - "learning_rate": 5.52539404553415e-05, - "loss": 0.0084, + "epoch": 0.76, + "learning_rate": 0.0001857808093395422, + "loss": 0.0158, "step": 150930 }, { - "epoch": 1.63, - "learning_rate": 5.52377245897386e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018577324164652817, + "loss": 0.0113, "step": 150940 }, { - "epoch": 1.63, - "learning_rate": 5.522150872413569e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018576567395351418, + "loss": 0.0117, "step": 150950 }, { - "epoch": 1.63, - "learning_rate": 5.5205292858532785e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.00018575810626050016, + "loss": 0.0124, "step": 150960 }, { - "epoch": 1.63, - "learning_rate": 5.518907699292988e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018575053856748614, + "loss": 0.0141, "step": 150970 }, { - "epoch": 1.63, - "learning_rate": 5.517286112732697e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018574297087447215, + "loss": 0.0149, "step": 150980 }, { - "epoch": 1.63, - "learning_rate": 5.515664526172407e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018573540318145813, + "loss": 0.0116, "step": 150990 }, { - "epoch": 1.63, - "learning_rate": 5.514042939612116e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.00018572783548844411, + "loss": 0.0146, "step": 151000 }, { - "epoch": 1.63, - "eval_cer": 0.9215286717149871, - "eval_loss": 0.0059387171640992165, - "eval_runtime": 121.2054, - "eval_samples_per_second": 16.501, - "eval_steps_per_second": 4.125, + "epoch": 0.76, + "eval_cer": 0.9144760782799146, + "eval_loss": 0.00918071623891592, + "eval_runtime": 116.7205, + "eval_samples_per_second": 17.135, + "eval_steps_per_second": 4.284, "step": 151000 }, { - "epoch": 1.63, - "learning_rate": 5.5124213530518255e-05, - "loss": 0.0106, + "epoch": 0.76, + "learning_rate": 0.00018572026779543012, + "loss": 0.0125, "step": 151010 }, { - "epoch": 1.63, - "learning_rate": 5.510799766491535e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.0001857127001024161, + "loss": 0.0133, "step": 151020 }, { - "epoch": 1.63, - "learning_rate": 5.509178179931244e-05, - "loss": 0.0057, + "epoch": 0.76, + "learning_rate": 0.00018570513240940209, + "loss": 0.0129, "step": 151030 }, { - "epoch": 1.63, - "learning_rate": 5.507556593370954e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.0001856975647163881, + "loss": 0.0122, "step": 151040 }, { - "epoch": 1.63, - "learning_rate": 5.505935006810663e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.00018568999702337408, + "loss": 0.0135, "step": 151050 }, { - "epoch": 1.63, - "learning_rate": 5.5043134202503726e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018568242933036006, + "loss": 0.0141, "step": 151060 }, { - "epoch": 1.63, - "learning_rate": 5.502691833690082e-05, - "loss": 0.009, + "epoch": 0.76, + "learning_rate": 0.00018567486163734604, + "loss": 0.0118, "step": 151070 }, { - "epoch": 1.63, - "learning_rate": 5.501070247129791e-05, - "loss": 0.0056, + "epoch": 0.76, + "learning_rate": 0.00018566729394433205, + "loss": 0.0113, "step": 151080 }, { - "epoch": 1.63, - "learning_rate": 5.4994486605695004e-05, - "loss": 0.0074, + "epoch": 0.76, + "learning_rate": 0.00018565972625131803, + "loss": 0.015, "step": 151090 }, { - "epoch": 1.63, - "learning_rate": 5.49782707400921e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.000185652158558304, + "loss": 0.0135, "step": 151100 }, { - "epoch": 1.63, - "learning_rate": 5.4962054874489196e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018564459086529002, + "loss": 0.0149, "step": 151110 }, { - "epoch": 1.63, - "learning_rate": 5.494583900888629e-05, - "loss": 0.0086, + "epoch": 0.76, + "learning_rate": 0.000185637023172276, + "loss": 0.0118, "step": 151120 }, { - "epoch": 1.63, - "learning_rate": 5.492962314328338e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018562945547926198, + "loss": 0.013, "step": 151130 }, { - "epoch": 1.63, - "learning_rate": 5.4913407277680474e-05, - "loss": 0.0096, + "epoch": 0.76, + "learning_rate": 0.000185621887786248, + "loss": 0.0111, "step": 151140 }, { - "epoch": 1.63, - "learning_rate": 5.4897191412077574e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018561432009323397, + "loss": 0.0139, "step": 151150 }, { - "epoch": 1.63, - "learning_rate": 5.4880975546474666e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018560675240021995, + "loss": 0.0121, "step": 151160 }, { - "epoch": 1.63, - "learning_rate": 5.486475968087176e-05, - "loss": 0.0058, + "epoch": 0.76, + "learning_rate": 0.00018559918470720596, + "loss": 0.0114, "step": 151170 }, { - "epoch": 1.63, - "learning_rate": 5.484854381526885e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.00018559161701419194, + "loss": 0.0111, "step": 151180 }, { - "epoch": 1.63, - "learning_rate": 5.4832327949665945e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.00018558404932117792, + "loss": 0.0192, "step": 151190 }, { - "epoch": 1.63, - "learning_rate": 5.481611208406304e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018557648162816393, + "loss": 0.0119, "step": 151200 }, { - "epoch": 1.63, - "learning_rate": 5.479989621846014e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018556891393514991, + "loss": 0.0108, "step": 151210 }, { - "epoch": 1.63, - "learning_rate": 5.478368035285723e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.0001855613462421359, + "loss": 0.0114, "step": 151220 }, { - "epoch": 1.63, - "learning_rate": 5.476746448725432e-05, - "loss": 0.0086, + "epoch": 0.76, + "learning_rate": 0.00018555377854912188, + "loss": 0.0104, "step": 151230 }, { - "epoch": 1.63, - "learning_rate": 5.4751248621651415e-05, - "loss": 0.0082, + "epoch": 0.76, + "learning_rate": 0.00018554621085610789, + "loss": 0.0143, "step": 151240 }, { - "epoch": 1.64, - "learning_rate": 5.473503275604851e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.00018553864316309387, + "loss": 0.0122, "step": 151250 }, { - "epoch": 1.64, - "learning_rate": 5.471881689044561e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018553107547007985, + "loss": 0.0103, "step": 151260 }, { - "epoch": 1.64, - "learning_rate": 5.47026010248427e-05, - "loss": 0.0119, + "epoch": 0.76, + "learning_rate": 0.00018552350777706586, + "loss": 0.0133, "step": 151270 }, { - "epoch": 1.64, - "learning_rate": 5.468638515923979e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.00018551594008405184, + "loss": 0.0112, "step": 151280 }, { - "epoch": 1.64, - "learning_rate": 5.4670169293636886e-05, - "loss": 0.0097, + "epoch": 0.76, + "learning_rate": 0.00018550837239103782, + "loss": 0.0123, "step": 151290 }, { - "epoch": 1.64, - "learning_rate": 5.465395342803398e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018550080469802383, + "loss": 0.0121, "step": 151300 }, { - "epoch": 1.64, - "learning_rate": 5.463773756243108e-05, - "loss": 0.0055, + "epoch": 0.76, + "learning_rate": 0.0001854932370050098, + "loss": 0.0125, "step": 151310 }, { - "epoch": 1.64, - "learning_rate": 5.462152169682817e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.0001854856693119958, + "loss": 0.0135, "step": 151320 }, { - "epoch": 1.64, - "learning_rate": 5.4605305831225263e-05, - "loss": 0.0082, + "epoch": 0.76, + "learning_rate": 0.0001854781016189818, + "loss": 0.0115, "step": 151330 }, { - "epoch": 1.64, - "learning_rate": 5.4589089965622356e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.00018547053392596778, + "loss": 0.0086, "step": 151340 }, { - "epoch": 1.64, - "learning_rate": 5.457287410001945e-05, - "loss": 0.0058, + "epoch": 0.76, + "learning_rate": 0.00018546296623295376, + "loss": 0.0119, "step": 151350 }, { - "epoch": 1.64, - "learning_rate": 5.455665823441654e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018545539853993977, + "loss": 0.0117, "step": 151360 }, { - "epoch": 1.64, - "learning_rate": 5.454044236881364e-05, - "loss": 0.0104, + "epoch": 0.76, + "learning_rate": 0.00018544783084692575, + "loss": 0.0129, "step": 151370 }, { - "epoch": 1.64, - "learning_rate": 5.4524226503210734e-05, - "loss": 0.0083, + "epoch": 0.76, + "learning_rate": 0.00018544026315391173, + "loss": 0.0141, "step": 151380 }, { - "epoch": 1.64, - "learning_rate": 5.450801063760783e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.00018543269546089774, + "loss": 0.0139, "step": 151390 }, { - "epoch": 1.64, - "learning_rate": 5.449179477200492e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.00018542512776788372, + "loss": 0.0141, "step": 151400 }, { - "epoch": 1.64, - "learning_rate": 5.447557890640201e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.0001854175600748697, + "loss": 0.0112, "step": 151410 }, { - "epoch": 1.64, - "learning_rate": 5.445936304079912e-05, - "loss": 0.0084, + "epoch": 0.76, + "learning_rate": 0.0001854099923818557, + "loss": 0.014, "step": 151420 }, { - "epoch": 1.64, - "learning_rate": 5.444314717519621e-05, - "loss": 0.0089, + "epoch": 0.76, + "learning_rate": 0.0001854024246888417, + "loss": 0.0133, "step": 151430 }, { - "epoch": 1.64, - "learning_rate": 5.4426931309593304e-05, - "loss": 0.0074, + "epoch": 0.76, + "learning_rate": 0.00018539485699582768, + "loss": 0.0128, "step": 151440 }, { - "epoch": 1.64, - "learning_rate": 5.44107154439904e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018538728930281366, + "loss": 0.0111, "step": 151450 }, { - "epoch": 1.64, - "learning_rate": 5.4394499578387496e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.0001853797216097996, + "loss": 0.0141, "step": 151460 }, { - "epoch": 1.64, - "learning_rate": 5.437828371278459e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018537215391678562, + "loss": 0.0125, "step": 151470 }, { - "epoch": 1.64, - "learning_rate": 5.436206784718168e-05, - "loss": 0.0086, + "epoch": 0.76, + "learning_rate": 0.0001853645862237716, + "loss": 0.0131, "step": 151480 }, { - "epoch": 1.64, - "learning_rate": 5.4345851981578774e-05, - "loss": 0.0049, + "epoch": 0.76, + "learning_rate": 0.00018535701853075758, + "loss": 0.0144, "step": 151490 }, { - "epoch": 1.64, - "learning_rate": 5.432963611597587e-05, - "loss": 0.0054, + "epoch": 0.76, + "learning_rate": 0.0001853494508377436, + "loss": 0.0118, "step": 151500 }, { - "epoch": 1.64, - "learning_rate": 5.431342025037296e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.00018534188314472957, + "loss": 0.0126, "step": 151510 }, { - "epoch": 1.64, - "learning_rate": 5.429720438477006e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.00018533431545171556, + "loss": 0.0117, "step": 151520 }, { - "epoch": 1.64, - "learning_rate": 5.428098851916715e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018532674775870156, + "loss": 0.0142, "step": 151530 }, { - "epoch": 1.64, - "learning_rate": 5.4264772653564245e-05, - "loss": 0.0051, + "epoch": 0.76, + "learning_rate": 0.00018531918006568755, + "loss": 0.0144, "step": 151540 }, { - "epoch": 1.64, - "learning_rate": 5.424855678796134e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.00018531161237267353, + "loss": 0.0117, "step": 151550 }, { - "epoch": 1.64, - "learning_rate": 5.423234092235843e-05, - "loss": 0.0082, + "epoch": 0.76, + "learning_rate": 0.00018530404467965954, + "loss": 0.0178, "step": 151560 }, { - "epoch": 1.64, - "learning_rate": 5.421612505675553e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.00018529647698664552, + "loss": 0.0133, "step": 151570 }, { - "epoch": 1.64, - "learning_rate": 5.419990919115262e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.0001852889092936315, + "loss": 0.0144, "step": 151580 }, { - "epoch": 1.64, - "learning_rate": 5.4183693325549715e-05, - "loss": 0.0074, + "epoch": 0.76, + "learning_rate": 0.0001852813416006175, + "loss": 0.0131, "step": 151590 }, { - "epoch": 1.64, - "learning_rate": 5.416747745994681e-05, - "loss": 0.0041, + "epoch": 0.76, + "learning_rate": 0.0001852737739076035, + "loss": 0.0136, "step": 151600 }, { - "epoch": 1.64, - "learning_rate": 5.41512615943439e-05, - "loss": 0.0083, + "epoch": 0.76, + "learning_rate": 0.00018526620621458947, + "loss": 0.0125, "step": 151610 }, { - "epoch": 1.64, - "learning_rate": 5.4135045728741e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018525863852157545, + "loss": 0.0122, "step": 151620 }, { - "epoch": 1.64, - "learning_rate": 5.411882986313809e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.00018525107082856146, + "loss": 0.0166, "step": 151630 }, { - "epoch": 1.64, - "learning_rate": 5.4102613997535186e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018524350313554744, + "loss": 0.0127, "step": 151640 }, { - "epoch": 1.64, - "learning_rate": 5.408639813193228e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.00018523593544253342, + "loss": 0.012, "step": 151650 }, { - "epoch": 1.64, - "learning_rate": 5.407018226632937e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018522836774951943, + "loss": 0.0187, "step": 151660 }, { - "epoch": 1.64, - "learning_rate": 5.4053966400726464e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.0001852208000565054, + "loss": 0.0119, "step": 151670 }, { - "epoch": 1.64, - "learning_rate": 5.4037750535123564e-05, - "loss": 0.0096, + "epoch": 0.77, + "learning_rate": 0.0001852132323634914, + "loss": 0.0146, "step": 151680 }, { - "epoch": 1.64, - "learning_rate": 5.4021534669520656e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.0001852056646704774, + "loss": 0.0126, "step": 151690 }, { - "epoch": 1.64, - "learning_rate": 5.400531880391775e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.00018519809697746338, + "loss": 0.0128, "step": 151700 }, { - "epoch": 1.64, - "learning_rate": 5.398910293831484e-05, - "loss": 0.0089, + "epoch": 0.77, + "learning_rate": 0.00018519052928444937, + "loss": 0.0125, "step": 151710 }, { - "epoch": 1.64, - "learning_rate": 5.3972887072711935e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018518296159143537, + "loss": 0.0139, "step": 151720 }, { - "epoch": 1.64, - "learning_rate": 5.3956671207109034e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018517539389842136, + "loss": 0.0112, "step": 151730 }, { - "epoch": 1.64, - "learning_rate": 5.394045534150613e-05, - "loss": 0.0056, + "epoch": 0.77, + "learning_rate": 0.00018516782620540734, + "loss": 0.0099, "step": 151740 }, { - "epoch": 1.64, - "learning_rate": 5.392423947590322e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018516025851239335, + "loss": 0.0105, "step": 151750 }, { - "epoch": 1.64, - "learning_rate": 5.390802361030031e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018515269081937933, + "loss": 0.0139, "step": 151760 }, { - "epoch": 1.64, - "learning_rate": 5.3891807744697405e-05, - "loss": 0.0091, + "epoch": 0.77, + "learning_rate": 0.0001851451231263653, + "loss": 0.0109, "step": 151770 }, { - "epoch": 1.64, - "learning_rate": 5.38755918790945e-05, - "loss": 0.009, + "epoch": 0.77, + "learning_rate": 0.00018513755543335132, + "loss": 0.0135, "step": 151780 }, { - "epoch": 1.64, - "learning_rate": 5.38593760134916e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.0001851299877403373, + "loss": 0.0145, "step": 151790 }, { - "epoch": 1.64, - "learning_rate": 5.384316014788869e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018512242004732328, + "loss": 0.0136, "step": 151800 }, { - "epoch": 1.64, - "learning_rate": 5.382694428228578e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.00018511485235430926, + "loss": 0.018, "step": 151810 }, { - "epoch": 1.64, - "learning_rate": 5.3810728416682876e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018510728466129527, + "loss": 0.0134, "step": 151820 }, { - "epoch": 1.64, - "learning_rate": 5.379451255107997e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018509971696828125, + "loss": 0.0104, "step": 151830 }, { - "epoch": 1.64, - "learning_rate": 5.377829668547707e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018509214927526723, + "loss": 0.0141, "step": 151840 }, { - "epoch": 1.64, - "learning_rate": 5.376208081987416e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018508458158225324, + "loss": 0.0125, "step": 151850 }, { - "epoch": 1.64, - "learning_rate": 5.3745864954271253e-05, - "loss": 0.0121, + "epoch": 0.77, + "learning_rate": 0.00018507701388923922, + "loss": 0.0154, "step": 151860 }, { - "epoch": 1.64, - "learning_rate": 5.3729649088668346e-05, - "loss": 0.0094, + "epoch": 0.77, + "learning_rate": 0.0001850694461962252, + "loss": 0.0109, "step": 151870 }, { - "epoch": 1.64, - "learning_rate": 5.371343322306544e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.0001850618785032112, + "loss": 0.0108, "step": 151880 }, { - "epoch": 1.64, - "learning_rate": 5.369721735746254e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.0001850543108101972, + "loss": 0.0131, "step": 151890 }, { - "epoch": 1.64, - "learning_rate": 5.368100149185963e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018504674311718318, + "loss": 0.0095, "step": 151900 }, { - "epoch": 1.64, - "learning_rate": 5.3664785626256724e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018503917542416918, + "loss": 0.0151, "step": 151910 }, { - "epoch": 1.64, - "learning_rate": 5.364856976065382e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.00018503160773115517, + "loss": 0.0112, "step": 151920 }, { - "epoch": 1.64, - "learning_rate": 5.363235389505091e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.00018502404003814115, + "loss": 0.0126, "step": 151930 }, { - "epoch": 1.64, - "learning_rate": 5.3616138029448e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018501647234512716, + "loss": 0.0124, "step": 151940 }, { - "epoch": 1.64, - "learning_rate": 5.35999221638451e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018500890465211314, + "loss": 0.0118, "step": 151950 }, { - "epoch": 1.64, - "learning_rate": 5.3583706298242194e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.00018500133695909912, + "loss": 0.0133, "step": 151960 }, { - "epoch": 1.64, - "learning_rate": 5.356749043263929e-05, - "loss": 0.0104, + "epoch": 0.77, + "learning_rate": 0.0001849937692660851, + "loss": 0.0117, "step": 151970 }, { - "epoch": 1.64, - "learning_rate": 5.355127456703638e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.0001849862015730711, + "loss": 0.0124, "step": 151980 }, { - "epoch": 1.64, - "learning_rate": 5.353505870143347e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.0001849786338800571, + "loss": 0.0122, "step": 151990 }, { - "epoch": 1.64, - "learning_rate": 5.351884283583057e-05, - "loss": 0.0086, + "epoch": 0.77, + "learning_rate": 0.00018497106618704307, + "loss": 0.0119, "step": 152000 }, { - "epoch": 1.64, - "eval_cer": 0.9215173798765541, - "eval_loss": 0.005879946518689394, - "eval_runtime": 121.1735, - "eval_samples_per_second": 16.505, - "eval_steps_per_second": 4.126, + "epoch": 0.77, + "eval_cer": 0.914467344714786, + "eval_loss": 0.00894253607839346, + "eval_runtime": 116.687, + "eval_samples_per_second": 17.14, + "eval_steps_per_second": 4.285, "step": 152000 }, { - "epoch": 1.64, - "learning_rate": 5.3502626970227665e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018496349849402908, + "loss": 0.0124, "step": 152010 }, { - "epoch": 1.64, - "learning_rate": 5.348641110462476e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018495593080101506, + "loss": 0.0146, "step": 152020 }, { - "epoch": 1.64, - "learning_rate": 5.347019523902185e-05, - "loss": 0.0079, + "epoch": 0.77, + "learning_rate": 0.00018494836310800104, + "loss": 0.0107, "step": 152030 }, { - "epoch": 1.64, - "learning_rate": 5.345397937341894e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018494079541498705, + "loss": 0.014, "step": 152040 }, { - "epoch": 1.64, - "learning_rate": 5.343776350781604e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.00018493322772197303, + "loss": 0.0096, "step": 152050 }, { - "epoch": 1.64, - "learning_rate": 5.3421547642213135e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018492566002895901, + "loss": 0.0149, "step": 152060 }, { - "epoch": 1.64, - "learning_rate": 5.340533177661023e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018491809233594502, + "loss": 0.0156, "step": 152070 }, { - "epoch": 1.64, - "learning_rate": 5.338911591100732e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.000184910524642931, + "loss": 0.0122, "step": 152080 }, { - "epoch": 1.64, - "learning_rate": 5.3372900045404414e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018490295694991699, + "loss": 0.0115, "step": 152090 }, { - "epoch": 1.64, - "learning_rate": 5.3356684179801506e-05, - "loss": 0.0086, + "epoch": 0.77, + "learning_rate": 0.000184895389256903, + "loss": 0.0144, "step": 152100 }, { - "epoch": 1.64, - "learning_rate": 5.3340468314198606e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.00018488782156388898, + "loss": 0.0134, "step": 152110 }, { - "epoch": 1.64, - "learning_rate": 5.33242524485957e-05, - "loss": 0.0057, + "epoch": 0.77, + "learning_rate": 0.00018488025387087496, + "loss": 0.0129, "step": 152120 }, { - "epoch": 1.64, - "learning_rate": 5.330803658299279e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018487268617786094, + "loss": 0.0152, "step": 152130 }, { - "epoch": 1.64, - "learning_rate": 5.329182071738989e-05, - "loss": 0.0087, + "epoch": 0.77, + "learning_rate": 0.00018486511848484695, + "loss": 0.0098, "step": 152140 }, { - "epoch": 1.64, - "learning_rate": 5.327560485178699e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.00018485755079183293, + "loss": 0.0128, "step": 152150 }, { - "epoch": 1.64, - "learning_rate": 5.325938898618408e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.0001848499830988189, + "loss": 0.0131, "step": 152160 }, { - "epoch": 1.65, - "learning_rate": 5.3243173120581176e-05, - "loss": 0.0057, + "epoch": 0.77, + "learning_rate": 0.00018484241540580492, + "loss": 0.0136, "step": 152170 }, { - "epoch": 1.65, - "learning_rate": 5.322695725497827e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.0001848348477127909, + "loss": 0.0114, "step": 152180 }, { - "epoch": 1.65, - "learning_rate": 5.321074138937536e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018482728001977688, + "loss": 0.0113, "step": 152190 }, { - "epoch": 1.65, - "learning_rate": 5.319452552377246e-05, - "loss": 0.0095, + "epoch": 0.77, + "learning_rate": 0.0001848197123267629, + "loss": 0.0161, "step": 152200 }, { - "epoch": 1.65, - "learning_rate": 5.3178309658169554e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.00018481214463374887, + "loss": 0.0161, "step": 152210 }, { - "epoch": 1.65, - "learning_rate": 5.3162093792566646e-05, - "loss": 0.0059, + "epoch": 0.77, + "learning_rate": 0.00018480457694073485, + "loss": 0.0136, "step": 152220 }, { - "epoch": 1.65, - "learning_rate": 5.314587792696374e-05, - "loss": 0.0058, + "epoch": 0.77, + "learning_rate": 0.00018479700924772086, + "loss": 0.0108, "step": 152230 }, { - "epoch": 1.65, - "learning_rate": 5.312966206136083e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.00018478944155470684, + "loss": 0.0123, "step": 152240 }, { - "epoch": 1.65, - "learning_rate": 5.3113446195757925e-05, - "loss": 0.009, + "epoch": 0.77, + "learning_rate": 0.00018478187386169282, + "loss": 0.0108, "step": 152250 }, { - "epoch": 1.65, - "learning_rate": 5.3097230330155024e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018477430616867883, + "loss": 0.0125, "step": 152260 }, { - "epoch": 1.65, - "learning_rate": 5.308101446455212e-05, - "loss": 0.0055, + "epoch": 0.77, + "learning_rate": 0.00018476673847566481, + "loss": 0.012, "step": 152270 }, { - "epoch": 1.65, - "learning_rate": 5.306479859894921e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.0001847591707826508, + "loss": 0.0111, "step": 152280 }, { - "epoch": 1.65, - "learning_rate": 5.30485827333463e-05, - "loss": 0.0088, + "epoch": 0.77, + "learning_rate": 0.0001847516030896368, + "loss": 0.0152, "step": 152290 }, { - "epoch": 1.65, - "learning_rate": 5.3032366867743395e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018474403539662279, + "loss": 0.0117, "step": 152300 }, { - "epoch": 1.65, - "learning_rate": 5.3016151002140495e-05, - "loss": 0.0086, + "epoch": 0.77, + "learning_rate": 0.00018473646770360877, + "loss": 0.0133, "step": 152310 }, { - "epoch": 1.65, - "learning_rate": 5.299993513653759e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.00018472890001059475, + "loss": 0.0144, "step": 152320 }, { - "epoch": 1.65, - "learning_rate": 5.298371927093468e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.00018472133231758076, + "loss": 0.0119, "step": 152330 }, { - "epoch": 1.65, - "learning_rate": 5.296750340533177e-05, - "loss": 0.0104, + "epoch": 0.77, + "learning_rate": 0.00018471376462456674, + "loss": 0.0142, "step": 152340 }, { - "epoch": 1.65, - "learning_rate": 5.2951287539728866e-05, - "loss": 0.0096, + "epoch": 0.77, + "learning_rate": 0.00018470619693155272, + "loss": 0.0156, "step": 152350 }, { - "epoch": 1.65, - "learning_rate": 5.2935071674125965e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018469862923853873, + "loss": 0.0131, "step": 152360 }, { - "epoch": 1.65, - "learning_rate": 5.291885580852306e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.0001846910615455247, + "loss": 0.0107, "step": 152370 }, { - "epoch": 1.65, - "learning_rate": 5.290263994292015e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.0001846834938525107, + "loss": 0.0103, "step": 152380 }, { - "epoch": 1.65, - "learning_rate": 5.288642407731724e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.0001846759261594967, + "loss": 0.0149, "step": 152390 }, { - "epoch": 1.65, - "learning_rate": 5.2870208211714336e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018466835846648268, + "loss": 0.0123, "step": 152400 }, { - "epoch": 1.65, - "learning_rate": 5.285399234611143e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.00018466079077346866, + "loss": 0.0113, "step": 152410 }, { - "epoch": 1.65, - "learning_rate": 5.283777648050853e-05, - "loss": 0.0087, + "epoch": 0.77, + "learning_rate": 0.00018465322308045467, + "loss": 0.0129, "step": 152420 }, { - "epoch": 1.65, - "learning_rate": 5.282156061490562e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018464565538744065, + "loss": 0.0164, "step": 152430 }, { - "epoch": 1.65, - "learning_rate": 5.2805344749302714e-05, - "loss": 0.0089, + "epoch": 0.77, + "learning_rate": 0.00018463808769442663, + "loss": 0.0129, "step": 152440 }, { - "epoch": 1.65, - "learning_rate": 5.2789128883699807e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018463052000141264, + "loss": 0.014, "step": 152450 }, { - "epoch": 1.65, - "learning_rate": 5.27729130180969e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.00018462295230839862, + "loss": 0.0125, "step": 152460 }, { - "epoch": 1.65, - "learning_rate": 5.2756697152494e-05, - "loss": 0.0088, + "epoch": 0.77, + "learning_rate": 0.0001846153846153846, + "loss": 0.0141, "step": 152470 }, { - "epoch": 1.65, - "learning_rate": 5.274048128689109e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.0001846078169223706, + "loss": 0.0139, "step": 152480 }, { - "epoch": 1.65, - "learning_rate": 5.2724265421288184e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.0001846002492293566, + "loss": 0.0225, "step": 152490 }, { - "epoch": 1.65, - "learning_rate": 5.270804955568528e-05, - "loss": 0.009, + "epoch": 0.77, + "learning_rate": 0.00018459268153634258, + "loss": 0.0156, "step": 152500 }, { - "epoch": 1.65, - "learning_rate": 5.269183369008237e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018458511384332856, + "loss": 0.0118, "step": 152510 }, { - "epoch": 1.65, - "learning_rate": 5.267561782447946e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018457754615031457, + "loss": 0.0132, "step": 152520 }, { - "epoch": 1.65, - "learning_rate": 5.265940195887656e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.00018456997845730055, + "loss": 0.0178, "step": 152530 }, { - "epoch": 1.65, - "learning_rate": 5.2643186093273655e-05, - "loss": 0.009, + "epoch": 0.77, + "learning_rate": 0.00018456241076428653, + "loss": 0.0088, "step": 152540 }, { - "epoch": 1.65, - "learning_rate": 5.262697022767075e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018455484307127254, + "loss": 0.0104, "step": 152550 }, { - "epoch": 1.65, - "learning_rate": 5.261075436206784e-05, - "loss": 0.0101, + "epoch": 0.77, + "learning_rate": 0.00018454727537825852, + "loss": 0.0112, "step": 152560 }, { - "epoch": 1.65, - "learning_rate": 5.259453849646493e-05, - "loss": 0.0093, + "epoch": 0.77, + "learning_rate": 0.0001845397076852445, + "loss": 0.0143, "step": 152570 }, { - "epoch": 1.65, - "learning_rate": 5.257832263086203e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.0001845321399922305, + "loss": 0.0126, "step": 152580 }, { - "epoch": 1.65, - "learning_rate": 5.2562106765259125e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.0001845245722992165, + "loss": 0.0107, "step": 152590 }, { - "epoch": 1.65, - "learning_rate": 5.254589089965622e-05, - "loss": 0.0084, + "epoch": 0.77, + "learning_rate": 0.00018451700460620247, + "loss": 0.0125, "step": 152600 }, { - "epoch": 1.65, - "learning_rate": 5.252967503405331e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.00018450943691318848, + "loss": 0.0116, "step": 152610 }, { - "epoch": 1.65, - "learning_rate": 5.2513459168450404e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018450186922017446, + "loss": 0.0143, "step": 152620 }, { - "epoch": 1.65, - "learning_rate": 5.24972433028475e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.00018449430152716044, + "loss": 0.0144, "step": 152630 }, { - "epoch": 1.65, - "learning_rate": 5.2481027437244596e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018448673383414643, + "loss": 0.0101, "step": 152640 }, { - "epoch": 1.65, - "learning_rate": 5.246481157164169e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.00018447916614113243, + "loss": 0.0143, "step": 152650 }, { - "epoch": 1.65, - "learning_rate": 5.244859570603878e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.00018447159844811842, + "loss": 0.0116, "step": 152660 }, { - "epoch": 1.65, - "learning_rate": 5.2432379840435874e-05, - "loss": 0.0089, + "epoch": 0.77, + "learning_rate": 0.0001844640307551044, + "loss": 0.0124, "step": 152670 }, { - "epoch": 1.65, - "learning_rate": 5.241616397483297e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.0001844564630620904, + "loss": 0.0126, "step": 152680 }, { - "epoch": 1.65, - "learning_rate": 5.2399948109230066e-05, - "loss": 0.0094, + "epoch": 0.77, + "learning_rate": 0.0001844488953690764, + "loss": 0.0152, "step": 152690 }, { - "epoch": 1.65, - "learning_rate": 5.238373224362716e-05, - "loss": 0.0086, + "epoch": 0.77, + "learning_rate": 0.00018444132767606237, + "loss": 0.0134, "step": 152700 }, { - "epoch": 1.65, - "learning_rate": 5.236751637802425e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.00018443375998304838, + "loss": 0.01, "step": 152710 }, { - "epoch": 1.65, - "learning_rate": 5.2351300512421345e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018442619229003433, + "loss": 0.0135, "step": 152720 }, { - "epoch": 1.65, - "learning_rate": 5.233508464681844e-05, - "loss": 0.0108, + "epoch": 0.77, + "learning_rate": 0.0001844186245970203, + "loss": 0.0117, "step": 152730 }, { - "epoch": 1.65, - "learning_rate": 5.231886878121554e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.0001844110569040063, + "loss": 0.0171, "step": 152740 }, { - "epoch": 1.65, - "learning_rate": 5.230265291561263e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.0001844034892109923, + "loss": 0.012, "step": 152750 }, { - "epoch": 1.65, - "learning_rate": 5.228643705000972e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.00018439592151797828, + "loss": 0.0111, "step": 152760 }, { - "epoch": 1.65, - "learning_rate": 5.2270221184406815e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018438835382496427, + "loss": 0.0111, "step": 152770 }, { - "epoch": 1.65, - "learning_rate": 5.225400531880391e-05, - "loss": 0.0096, + "epoch": 0.77, + "learning_rate": 0.00018438078613195027, + "loss": 0.0114, "step": 152780 }, { - "epoch": 1.65, - "learning_rate": 5.2237789453201e-05, - "loss": 0.01, + "epoch": 0.77, + "learning_rate": 0.00018437321843893626, + "loss": 0.0123, "step": 152790 }, { - "epoch": 1.65, - "learning_rate": 5.22215735875981e-05, - "loss": 0.009, + "epoch": 0.77, + "learning_rate": 0.00018436565074592224, + "loss": 0.0127, "step": 152800 }, { - "epoch": 1.65, - "learning_rate": 5.220535772199519e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018435808305290825, + "loss": 0.0121, "step": 152810 }, { - "epoch": 1.65, - "learning_rate": 5.2189141856392286e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018435051535989423, + "loss": 0.0137, "step": 152820 }, { - "epoch": 1.65, - "learning_rate": 5.217292599078938e-05, - "loss": 0.0093, + "epoch": 0.77, + "learning_rate": 0.0001843429476668802, + "loss": 0.0105, "step": 152830 }, { - "epoch": 1.65, - "learning_rate": 5.215671012518647e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018433537997386622, + "loss": 0.0113, "step": 152840 }, { - "epoch": 1.65, - "learning_rate": 5.214049425958357e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.0001843278122808522, + "loss": 0.0186, "step": 152850 }, { - "epoch": 1.65, - "learning_rate": 5.212427839398067e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018432024458783818, + "loss": 0.0117, "step": 152860 }, { - "epoch": 1.65, - "learning_rate": 5.210806252837776e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018431267689482416, + "loss": 0.0124, "step": 152870 }, { - "epoch": 1.65, - "learning_rate": 5.2091846662774856e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.00018430510920181017, + "loss": 0.0127, "step": 152880 }, { - "epoch": 1.65, - "learning_rate": 5.2075630797171955e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018429754150879615, + "loss": 0.0141, "step": 152890 }, { - "epoch": 1.65, - "learning_rate": 5.205941493156905e-05, - "loss": 0.0048, + "epoch": 0.77, + "learning_rate": 0.00018428997381578213, + "loss": 0.0143, "step": 152900 }, { - "epoch": 1.65, - "learning_rate": 5.204319906596614e-05, - "loss": 0.0046, + "epoch": 0.77, + "learning_rate": 0.00018428240612276814, + "loss": 0.0147, "step": 152910 }, { - "epoch": 1.65, - "learning_rate": 5.202698320036323e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018427483842975412, + "loss": 0.0119, "step": 152920 }, { - "epoch": 1.65, - "learning_rate": 5.2010767334760326e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.0001842672707367401, + "loss": 0.0155, "step": 152930 }, { - "epoch": 1.65, - "learning_rate": 5.1994551469157426e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.0001842597030437261, + "loss": 0.0131, "step": 152940 }, { - "epoch": 1.65, - "learning_rate": 5.197833560355452e-05, - "loss": 0.0084, + "epoch": 0.77, + "learning_rate": 0.0001842521353507121, + "loss": 0.0135, "step": 152950 }, { - "epoch": 1.65, - "learning_rate": 5.196211973795161e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018424456765769808, + "loss": 0.011, "step": 152960 }, { - "epoch": 1.65, - "learning_rate": 5.1945903872348704e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.00018423699996468408, + "loss": 0.0125, "step": 152970 }, { - "epoch": 1.65, - "learning_rate": 5.1929688006745797e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018422943227167007, + "loss": 0.0144, "step": 152980 }, { - "epoch": 1.65, - "learning_rate": 5.191347214114289e-05, - "loss": 0.0059, + "epoch": 0.77, + "learning_rate": 0.00018422186457865605, + "loss": 0.0123, "step": 152990 }, { - "epoch": 1.65, - "learning_rate": 5.189725627553999e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018421429688564206, + "loss": 0.0142, "step": 153000 }, { - "epoch": 1.65, - "eval_cer": 0.9215121682588159, - "eval_loss": 0.005926909390836954, - "eval_runtime": 121.2098, - "eval_samples_per_second": 16.5, - "eval_steps_per_second": 4.125, + "epoch": 0.77, + "eval_cer": 0.9144702559031622, + "eval_loss": 0.008783689700067043, + "eval_runtime": 116.6617, + "eval_samples_per_second": 17.144, + "eval_steps_per_second": 4.286, "step": 153000 }, { - "epoch": 1.65, - "learning_rate": 5.188104040993708e-05, - "loss": 0.0058, + "epoch": 0.77, + "learning_rate": 0.00018420672919262804, + "loss": 0.0109, "step": 153010 }, { - "epoch": 1.65, - "learning_rate": 5.1864824544334174e-05, - "loss": 0.0089, + "epoch": 0.77, + "learning_rate": 0.00018419916149961402, + "loss": 0.0154, "step": 153020 }, { - "epoch": 1.65, - "learning_rate": 5.184860867873127e-05, - "loss": 0.0054, + "epoch": 0.77, + "learning_rate": 0.0001841915938066, + "loss": 0.0121, "step": 153030 }, { - "epoch": 1.65, - "learning_rate": 5.183239281312836e-05, - "loss": 0.0085, + "epoch": 0.77, + "learning_rate": 0.000184184026113586, + "loss": 0.0115, "step": 153040 }, { - "epoch": 1.65, - "learning_rate": 5.181617694752546e-05, - "loss": 0.0052, + "epoch": 0.77, + "learning_rate": 0.000184176458420572, + "loss": 0.0118, "step": 153050 }, { - "epoch": 1.65, - "learning_rate": 5.179996108192255e-05, - "loss": 0.0091, + "epoch": 0.77, + "learning_rate": 0.00018416889072755797, + "loss": 0.0121, "step": 153060 }, { - "epoch": 1.65, - "learning_rate": 5.1783745216319645e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.00018416132303454398, + "loss": 0.0127, "step": 153070 }, { - "epoch": 1.65, - "learning_rate": 5.176752935071674e-05, - "loss": 0.0049, + "epoch": 0.77, + "learning_rate": 0.00018415375534152996, + "loss": 0.0151, "step": 153080 }, { - "epoch": 1.65, - "learning_rate": 5.175131348511383e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018414618764851594, + "loss": 0.0142, "step": 153090 }, { - "epoch": 1.66, - "learning_rate": 5.173509761951092e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018413861995550195, + "loss": 0.0153, "step": 153100 }, { - "epoch": 1.66, - "learning_rate": 5.171888175390802e-05, - "loss": 0.0091, + "epoch": 0.77, + "learning_rate": 0.00018413105226248793, + "loss": 0.0132, "step": 153110 }, { - "epoch": 1.66, - "learning_rate": 5.1702665888305115e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018412348456947391, + "loss": 0.012, "step": 153120 }, { - "epoch": 1.66, - "learning_rate": 5.168645002270221e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.00018411591687645992, + "loss": 0.0117, "step": 153130 }, { - "epoch": 1.66, - "learning_rate": 5.16702341570993e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.0001841083491834459, + "loss": 0.0112, "step": 153140 }, { - "epoch": 1.66, - "learning_rate": 5.1654018291496393e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018410078149043189, + "loss": 0.0183, "step": 153150 }, { - "epoch": 1.66, - "learning_rate": 5.163780242589349e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.0001840932137974179, + "loss": 0.0155, "step": 153160 }, { - "epoch": 1.66, - "learning_rate": 5.1621586560290586e-05, - "loss": 0.0085, + "epoch": 0.77, + "learning_rate": 0.00018408564610440388, + "loss": 0.016, "step": 153170 }, { - "epoch": 1.66, - "learning_rate": 5.160537069468768e-05, - "loss": 0.0095, + "epoch": 0.77, + "learning_rate": 0.00018407807841138986, + "loss": 0.0132, "step": 153180 }, { - "epoch": 1.66, - "learning_rate": 5.158915482908477e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018407051071837584, + "loss": 0.0181, "step": 153190 }, { - "epoch": 1.66, - "learning_rate": 5.1572938963481864e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.00018406294302536185, + "loss": 0.0173, "step": 153200 }, { - "epoch": 1.66, - "learning_rate": 5.1556723097878963e-05, - "loss": 0.0079, + "epoch": 0.77, + "learning_rate": 0.00018405537533234783, + "loss": 0.018, "step": 153210 }, { - "epoch": 1.66, - "learning_rate": 5.1540507232276056e-05, - "loss": 0.0099, + "epoch": 0.77, + "learning_rate": 0.0001840478076393338, + "loss": 0.0161, "step": 153220 }, { - "epoch": 1.66, - "learning_rate": 5.152429136667315e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.00018404023994631982, + "loss": 0.0144, "step": 153230 }, { - "epoch": 1.66, - "learning_rate": 5.150807550107024e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.0001840326722533058, + "loss": 0.015, "step": 153240 }, { - "epoch": 1.66, - "learning_rate": 5.1491859635467334e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.00018402510456029178, + "loss": 0.0151, "step": 153250 }, { - "epoch": 1.66, - "learning_rate": 5.147564376986443e-05, - "loss": 0.0093, + "epoch": 0.77, + "learning_rate": 0.0001840175368672778, + "loss": 0.0126, "step": 153260 }, { - "epoch": 1.66, - "learning_rate": 5.145942790426153e-05, - "loss": 0.0056, + "epoch": 0.77, + "learning_rate": 0.00018400996917426377, + "loss": 0.0133, "step": 153270 }, { - "epoch": 1.66, - "learning_rate": 5.144321203865862e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018400240148124975, + "loss": 0.0149, "step": 153280 }, { - "epoch": 1.66, - "learning_rate": 5.142699617305571e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018399483378823576, + "loss": 0.0156, "step": 153290 }, { - "epoch": 1.66, - "learning_rate": 5.1410780307452805e-05, - "loss": 0.0108, + "epoch": 0.77, + "learning_rate": 0.00018398726609522174, + "loss": 0.0117, "step": 153300 }, { - "epoch": 1.66, - "learning_rate": 5.13945644418499e-05, - "loss": 0.012, + "epoch": 0.77, + "learning_rate": 0.00018397969840220772, + "loss": 0.0125, "step": 153310 }, { - "epoch": 1.66, - "learning_rate": 5.1378348576247e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.00018397213070919373, + "loss": 0.0121, "step": 153320 }, { - "epoch": 1.66, - "learning_rate": 5.136213271064409e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018396456301617971, + "loss": 0.0136, "step": 153330 }, { - "epoch": 1.66, - "learning_rate": 5.134591684504118e-05, - "loss": 0.0092, + "epoch": 0.77, + "learning_rate": 0.0001839569953231657, + "loss": 0.0131, "step": 153340 }, { - "epoch": 1.66, - "learning_rate": 5.1329700979438275e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.0001839494276301517, + "loss": 0.012, "step": 153350 }, { - "epoch": 1.66, - "learning_rate": 5.131348511383537e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018394185993713769, + "loss": 0.0146, "step": 153360 }, { - "epoch": 1.66, - "learning_rate": 5.129726924823246e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018393429224412367, + "loss": 0.0115, "step": 153370 }, { - "epoch": 1.66, - "learning_rate": 5.128105338262956e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.00018392672455110965, + "loss": 0.0106, "step": 153380 }, { - "epoch": 1.66, - "learning_rate": 5.126483751702665e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018391915685809566, + "loss": 0.0102, "step": 153390 }, { - "epoch": 1.66, - "learning_rate": 5.1248621651423746e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018391158916508164, + "loss": 0.0142, "step": 153400 }, { - "epoch": 1.66, - "learning_rate": 5.123240578582084e-05, - "loss": 0.0053, + "epoch": 0.77, + "learning_rate": 0.00018390402147206762, + "loss": 0.0135, "step": 153410 }, { - "epoch": 1.66, - "learning_rate": 5.121618992021793e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.00018389645377905363, + "loss": 0.0128, "step": 153420 }, { - "epoch": 1.66, - "learning_rate": 5.119997405461503e-05, - "loss": 0.0085, + "epoch": 0.77, + "learning_rate": 0.0001838888860860396, + "loss": 0.0129, "step": 153430 }, { - "epoch": 1.66, - "learning_rate": 5.1183758189012124e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.0001838813183930256, + "loss": 0.0138, "step": 153440 }, { - "epoch": 1.66, - "learning_rate": 5.1167542323409216e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.0001838737507000116, + "loss": 0.0145, "step": 153450 }, { - "epoch": 1.66, - "learning_rate": 5.115132645780631e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018386618300699758, + "loss": 0.0112, "step": 153460 }, { - "epoch": 1.66, - "learning_rate": 5.11351105922034e-05, - "loss": 0.0058, + "epoch": 0.77, + "learning_rate": 0.00018385861531398356, + "loss": 0.0088, "step": 153470 }, { - "epoch": 1.66, - "learning_rate": 5.11188947266005e-05, - "loss": 0.0051, + "epoch": 0.77, + "learning_rate": 0.00018385104762096957, + "loss": 0.0178, "step": 153480 }, { - "epoch": 1.66, - "learning_rate": 5.1102678860997594e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.00018384347992795555, + "loss": 0.017, "step": 153490 }, { - "epoch": 1.66, - "learning_rate": 5.108646299539469e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.00018383591223494153, + "loss": 0.012, "step": 153500 }, { - "epoch": 1.66, - "learning_rate": 5.107024712979178e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.00018382834454192754, + "loss": 0.0136, "step": 153510 }, { - "epoch": 1.66, - "learning_rate": 5.105403126418887e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018382077684891352, + "loss": 0.0135, "step": 153520 }, { - "epoch": 1.66, - "learning_rate": 5.1037815398585965e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.0001838132091558995, + "loss": 0.0123, "step": 153530 }, { - "epoch": 1.66, - "learning_rate": 5.1021599532983065e-05, - "loss": 0.0079, + "epoch": 0.77, + "learning_rate": 0.0001838056414628855, + "loss": 0.0118, "step": 153540 }, { - "epoch": 1.66, - "learning_rate": 5.100538366738016e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.0001837980737698715, + "loss": 0.0128, "step": 153550 }, { - "epoch": 1.66, - "learning_rate": 5.098916780177725e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018379050607685748, + "loss": 0.0107, "step": 153560 }, { - "epoch": 1.66, - "learning_rate": 5.097295193617434e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.00018378293838384346, + "loss": 0.0158, "step": 153570 }, { - "epoch": 1.66, - "learning_rate": 5.095673607057145e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018377537069082947, + "loss": 0.0121, "step": 153580 }, { - "epoch": 1.66, - "learning_rate": 5.094052020496854e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018376780299781545, + "loss": 0.0098, "step": 153590 }, { - "epoch": 1.66, - "learning_rate": 5.0924304339365635e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.00018376023530480143, + "loss": 0.0156, "step": 153600 }, { - "epoch": 1.66, - "learning_rate": 5.090808847376273e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018375266761178744, + "loss": 0.0129, "step": 153610 }, { - "epoch": 1.66, - "learning_rate": 5.089187260815982e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.00018374509991877342, + "loss": 0.0095, "step": 153620 }, { - "epoch": 1.66, - "learning_rate": 5.087565674255692e-05, - "loss": 0.0065, + "epoch": 0.78, + "learning_rate": 0.0001837375322257594, + "loss": 0.0139, "step": 153630 }, { - "epoch": 1.66, - "learning_rate": 5.085944087695401e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.0001837299645327454, + "loss": 0.0128, "step": 153640 }, { - "epoch": 1.66, - "learning_rate": 5.0843225011351105e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.0001837223968397314, + "loss": 0.0146, "step": 153650 }, { - "epoch": 1.66, - "learning_rate": 5.08270091457482e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.00018371482914671737, + "loss": 0.0122, "step": 153660 }, { - "epoch": 1.66, - "learning_rate": 5.081079328014529e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018370726145370338, + "loss": 0.0142, "step": 153670 }, { - "epoch": 1.66, - "learning_rate": 5.0794577414542383e-05, - "loss": 0.0095, + "epoch": 0.78, + "learning_rate": 0.00018369969376068936, + "loss": 0.0119, "step": 153680 }, { - "epoch": 1.66, - "learning_rate": 5.077836154893948e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.00018369212606767534, + "loss": 0.0089, "step": 153690 }, { - "epoch": 1.66, - "learning_rate": 5.0762145683336576e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018368455837466133, + "loss": 0.011, "step": 153700 }, { - "epoch": 1.66, - "learning_rate": 5.074592981773367e-05, - "loss": 0.0077, + "epoch": 0.78, + "learning_rate": 0.00018367699068164733, + "loss": 0.0145, "step": 153710 }, { - "epoch": 1.66, - "learning_rate": 5.072971395213076e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.00018366942298863332, + "loss": 0.0122, "step": 153720 }, { - "epoch": 1.66, - "learning_rate": 5.0713498086527854e-05, - "loss": 0.0082, + "epoch": 0.78, + "learning_rate": 0.0001836618552956193, + "loss": 0.0124, "step": 153730 }, { - "epoch": 1.66, - "learning_rate": 5.0697282220924953e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.0001836542876026053, + "loss": 0.0126, "step": 153740 }, { - "epoch": 1.66, - "learning_rate": 5.0681066355322046e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.0001836467199095913, + "loss": 0.0112, "step": 153750 }, { - "epoch": 1.66, - "learning_rate": 5.066485048971914e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.00018363915221657727, + "loss": 0.0137, "step": 153760 }, { - "epoch": 1.66, - "learning_rate": 5.064863462411623e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.00018363158452356328, + "loss": 0.011, "step": 153770 }, { - "epoch": 1.66, - "learning_rate": 5.0632418758513324e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018362401683054926, + "loss": 0.0143, "step": 153780 }, { - "epoch": 1.66, - "learning_rate": 5.0616202892910424e-05, - "loss": 0.0095, + "epoch": 0.78, + "learning_rate": 0.00018361644913753524, + "loss": 0.0137, "step": 153790 }, { - "epoch": 1.66, - "learning_rate": 5.059998702730752e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.00018360888144452125, + "loss": 0.0131, "step": 153800 }, { - "epoch": 1.66, - "learning_rate": 5.058377116170461e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.00018360131375150723, + "loss": 0.0101, "step": 153810 }, { - "epoch": 1.66, - "learning_rate": 5.05675552961017e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.0001835937460584932, + "loss": 0.0145, "step": 153820 }, { - "epoch": 1.66, - "learning_rate": 5.0551339430498795e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018358617836547922, + "loss": 0.0116, "step": 153830 }, { - "epoch": 1.66, - "learning_rate": 5.053512356489589e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.0001835786106724652, + "loss": 0.0104, "step": 153840 }, { - "epoch": 1.66, - "learning_rate": 5.051890769929299e-05, - "loss": 0.0061, + "epoch": 0.78, + "learning_rate": 0.00018357104297945118, + "loss": 0.0114, "step": 153850 }, { - "epoch": 1.66, - "learning_rate": 5.050269183369008e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.0001835634752864372, + "loss": 0.0122, "step": 153860 }, { - "epoch": 1.66, - "learning_rate": 5.048647596808717e-05, - "loss": 0.009, + "epoch": 0.78, + "learning_rate": 0.00018355590759342317, + "loss": 0.0109, "step": 153870 }, { - "epoch": 1.66, - "learning_rate": 5.0470260102484265e-05, - "loss": 0.0092, + "epoch": 0.78, + "learning_rate": 0.00018354833990040915, + "loss": 0.0132, "step": 153880 }, { - "epoch": 1.66, - "learning_rate": 5.045404423688136e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.00018354077220739514, + "loss": 0.0143, "step": 153890 }, { - "epoch": 1.66, - "learning_rate": 5.043782837127846e-05, - "loss": 0.0077, + "epoch": 0.78, + "learning_rate": 0.00018353320451438114, + "loss": 0.0126, "step": 153900 }, { - "epoch": 1.66, - "learning_rate": 5.042161250567555e-05, - "loss": 0.0095, + "epoch": 0.78, + "learning_rate": 0.00018352563682136713, + "loss": 0.0112, "step": 153910 }, { - "epoch": 1.66, - "learning_rate": 5.040539664007264e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.0001835180691283531, + "loss": 0.01, "step": 153920 }, { - "epoch": 1.66, - "learning_rate": 5.0389180774469736e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018351050143533912, + "loss": 0.0111, "step": 153930 }, { - "epoch": 1.66, - "learning_rate": 5.037296490886683e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.0001835029337423251, + "loss": 0.0125, "step": 153940 }, { - "epoch": 1.66, - "learning_rate": 5.035674904326393e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.00018349536604931108, + "loss": 0.0126, "step": 153950 }, { - "epoch": 1.66, - "learning_rate": 5.034053317766102e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.0001834877983562971, + "loss": 0.0158, "step": 153960 }, { - "epoch": 1.66, - "learning_rate": 5.0324317312058114e-05, - "loss": 0.0097, + "epoch": 0.78, + "learning_rate": 0.00018348023066328304, + "loss": 0.0129, "step": 153970 }, { - "epoch": 1.66, - "learning_rate": 5.0308101446455206e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018347266297026902, + "loss": 0.0126, "step": 153980 }, { - "epoch": 1.66, - "learning_rate": 5.02918855808523e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.000183465095277255, + "loss": 0.0096, "step": 153990 }, { - "epoch": 1.66, - "learning_rate": 5.027566971524939e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.000183457527584241, + "loss": 0.0128, "step": 154000 }, { - "epoch": 1.66, - "eval_cer": 0.9215251973031615, - "eval_loss": 0.005830066278576851, - "eval_runtime": 121.2077, - "eval_samples_per_second": 16.501, - "eval_steps_per_second": 4.125, + "epoch": 0.78, + "eval_cer": 0.9144789894682909, + "eval_loss": 0.008818663656711578, + "eval_runtime": 116.7061, + "eval_samples_per_second": 17.137, + "eval_steps_per_second": 4.284, "step": 154000 }, { - "epoch": 1.66, - "learning_rate": 5.025945384964649e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.000183449959891227, + "loss": 0.011, "step": 154010 }, { - "epoch": 1.67, - "learning_rate": 5.0243237984043584e-05, - "loss": 0.0093, + "epoch": 0.78, + "learning_rate": 0.00018344239219821298, + "loss": 0.0127, "step": 154020 }, { - "epoch": 1.67, - "learning_rate": 5.022702211844068e-05, - "loss": 0.0053, + "epoch": 0.78, + "learning_rate": 0.00018343482450519898, + "loss": 0.0111, "step": 154030 }, { - "epoch": 1.67, - "learning_rate": 5.021080625283777e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018342725681218497, + "loss": 0.0127, "step": 154040 }, { - "epoch": 1.67, - "learning_rate": 5.019459038723486e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018341968911917095, + "loss": 0.0114, "step": 154050 }, { - "epoch": 1.67, - "learning_rate": 5.017837452163196e-05, - "loss": 0.0091, + "epoch": 0.78, + "learning_rate": 0.00018341212142615696, + "loss": 0.0101, "step": 154060 }, { - "epoch": 1.67, - "learning_rate": 5.0162158656029055e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.00018340455373314294, + "loss": 0.0143, "step": 154070 }, { - "epoch": 1.67, - "learning_rate": 5.014594279042615e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.00018339698604012892, + "loss": 0.013, "step": 154080 }, { - "epoch": 1.67, - "learning_rate": 5.012972692482324e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.0001833894183471149, + "loss": 0.0121, "step": 154090 }, { - "epoch": 1.67, - "learning_rate": 5.011351105922033e-05, - "loss": 0.0091, + "epoch": 0.78, + "learning_rate": 0.0001833818506541009, + "loss": 0.0158, "step": 154100 }, { - "epoch": 1.67, - "learning_rate": 5.0097295193617426e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.0001833742829610869, + "loss": 0.013, "step": 154110 }, { - "epoch": 1.67, - "learning_rate": 5.0081079328014525e-05, - "loss": 0.01, + "epoch": 0.78, + "learning_rate": 0.00018336671526807287, + "loss": 0.0161, "step": 154120 }, { - "epoch": 1.67, - "learning_rate": 5.006486346241162e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.00018335914757505888, + "loss": 0.0153, "step": 154130 }, { - "epoch": 1.67, - "learning_rate": 5.004864759680871e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018335157988204486, + "loss": 0.0163, "step": 154140 }, { - "epoch": 1.67, - "learning_rate": 5.00324317312058e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.00018334401218903084, + "loss": 0.014, "step": 154150 }, { - "epoch": 1.67, - "learning_rate": 5.0016215865602896e-05, - "loss": 0.0114, + "epoch": 0.78, + "learning_rate": 0.00018333644449601685, + "loss": 0.011, "step": 154160 }, { - "epoch": 1.67, - "learning_rate": 4.9999999999999996e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018332887680300283, + "loss": 0.0134, "step": 154170 }, { - "epoch": 1.67, - "learning_rate": 4.998378413439709e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018332130910998881, + "loss": 0.0101, "step": 154180 }, { - "epoch": 1.67, - "learning_rate": 4.996756826879418e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018331374141697482, + "loss": 0.014, "step": 154190 }, { - "epoch": 1.67, - "learning_rate": 4.9951352403191274e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.0001833061737239608, + "loss": 0.0103, "step": 154200 }, { - "epoch": 1.67, - "learning_rate": 4.9935136537588367e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.00018329860603094679, + "loss": 0.0127, "step": 154210 }, { - "epoch": 1.67, - "learning_rate": 4.9918920671985466e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.0001832910383379328, + "loss": 0.0098, "step": 154220 }, { - "epoch": 1.67, - "learning_rate": 4.990270480638256e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.00018328347064491878, + "loss": 0.0135, "step": 154230 }, { - "epoch": 1.67, - "learning_rate": 4.988648894077965e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018327590295190476, + "loss": 0.012, "step": 154240 }, { - "epoch": 1.67, - "learning_rate": 4.9870273075176744e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018326833525889077, + "loss": 0.0125, "step": 154250 }, { - "epoch": 1.67, - "learning_rate": 4.985405720957384e-05, - "loss": 0.0092, + "epoch": 0.78, + "learning_rate": 0.00018326076756587675, + "loss": 0.0116, "step": 154260 }, { - "epoch": 1.67, - "learning_rate": 4.983784134397093e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.00018325319987286273, + "loss": 0.0137, "step": 154270 }, { - "epoch": 1.67, - "learning_rate": 4.982162547836803e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.0001832456321798487, + "loss": 0.0114, "step": 154280 }, { - "epoch": 1.67, - "learning_rate": 4.980540961276513e-05, - "loss": 0.0089, + "epoch": 0.78, + "learning_rate": 0.00018323806448683472, + "loss": 0.0127, "step": 154290 }, { - "epoch": 1.67, - "learning_rate": 4.978919374716222e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.0001832304967938207, + "loss": 0.0126, "step": 154300 }, { - "epoch": 1.67, - "learning_rate": 4.9772977881559314e-05, - "loss": 0.009, + "epoch": 0.78, + "learning_rate": 0.00018322292910080668, + "loss": 0.0166, "step": 154310 }, { - "epoch": 1.67, - "learning_rate": 4.9756762015956414e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.0001832153614077927, + "loss": 0.0135, "step": 154320 }, { - "epoch": 1.67, - "learning_rate": 4.974054615035351e-05, - "loss": 0.0083, + "epoch": 0.78, + "learning_rate": 0.00018320779371477867, + "loss": 0.0116, "step": 154330 }, { - "epoch": 1.67, - "learning_rate": 4.97243302847506e-05, - "loss": 0.0054, + "epoch": 0.78, + "learning_rate": 0.00018320022602176465, + "loss": 0.0122, "step": 154340 }, { - "epoch": 1.67, - "learning_rate": 4.970811441914769e-05, - "loss": 0.0095, + "epoch": 0.78, + "learning_rate": 0.00018319265832875066, + "loss": 0.0115, "step": 154350 }, { - "epoch": 1.67, - "learning_rate": 4.9691898553544785e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.00018318509063573664, + "loss": 0.0096, "step": 154360 }, { - "epoch": 1.67, - "learning_rate": 4.9675682687941884e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.00018317752294272262, + "loss": 0.0114, "step": 154370 }, { - "epoch": 1.67, - "learning_rate": 4.965946682233898e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.00018316995524970863, + "loss": 0.0115, "step": 154380 }, { - "epoch": 1.67, - "learning_rate": 4.964325095673607e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018316238755669461, + "loss": 0.0101, "step": 154390 }, { - "epoch": 1.67, - "learning_rate": 4.962703509113316e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.0001831548198636806, + "loss": 0.0109, "step": 154400 }, { - "epoch": 1.67, - "learning_rate": 4.9610819225530255e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.0001831472521706666, + "loss": 0.0094, "step": 154410 }, { - "epoch": 1.67, - "learning_rate": 4.959460335992735e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.00018313968447765259, + "loss": 0.0119, "step": 154420 }, { - "epoch": 1.67, - "learning_rate": 4.957838749432445e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018313211678463857, + "loss": 0.0128, "step": 154430 }, { - "epoch": 1.67, - "learning_rate": 4.956217162872154e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.00018312454909162455, + "loss": 0.0131, "step": 154440 }, { - "epoch": 1.67, - "learning_rate": 4.954595576311863e-05, - "loss": 0.0087, + "epoch": 0.78, + "learning_rate": 0.00018311698139861056, + "loss": 0.0112, "step": 154450 }, { - "epoch": 1.67, - "learning_rate": 4.9529739897515726e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018310941370559654, + "loss": 0.0107, "step": 154460 }, { - "epoch": 1.67, - "learning_rate": 4.951352403191282e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018310184601258252, + "loss": 0.0141, "step": 154470 }, { - "epoch": 1.67, - "learning_rate": 4.949730816630992e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.00018309427831956853, + "loss": 0.0112, "step": 154480 }, { - "epoch": 1.67, - "learning_rate": 4.948109230070701e-05, - "loss": 0.0095, + "epoch": 0.78, + "learning_rate": 0.0001830867106265545, + "loss": 0.0154, "step": 154490 }, { - "epoch": 1.67, - "learning_rate": 4.9464876435104104e-05, - "loss": 0.0048, + "epoch": 0.78, + "learning_rate": 0.0001830791429335405, + "loss": 0.0103, "step": 154500 }, { - "epoch": 1.67, - "learning_rate": 4.9448660569501196e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.0001830715752405265, + "loss": 0.0175, "step": 154510 }, { - "epoch": 1.67, - "learning_rate": 4.943244470389829e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018306400754751248, + "loss": 0.0152, "step": 154520 }, { - "epoch": 1.67, - "learning_rate": 4.941622883829539e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018305643985449846, + "loss": 0.0131, "step": 154530 }, { - "epoch": 1.67, - "learning_rate": 4.940001297269248e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018304887216148447, + "loss": 0.013, "step": 154540 }, { - "epoch": 1.67, - "learning_rate": 4.9383797107089574e-05, - "loss": 0.0061, + "epoch": 0.78, + "learning_rate": 0.00018304130446847045, + "loss": 0.0145, "step": 154550 }, { - "epoch": 1.67, - "learning_rate": 4.936758124148667e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018303373677545643, + "loss": 0.0134, "step": 154560 }, { - "epoch": 1.67, - "learning_rate": 4.935136537588376e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.00018302616908244244, + "loss": 0.0129, "step": 154570 }, { - "epoch": 1.67, - "learning_rate": 4.933514951028085e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018301860138942842, + "loss": 0.0149, "step": 154580 }, { - "epoch": 1.67, - "learning_rate": 4.931893364467795e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.0001830110336964144, + "loss": 0.0105, "step": 154590 }, { - "epoch": 1.67, - "learning_rate": 4.9302717779075045e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.0001830034660034004, + "loss": 0.0161, "step": 154600 }, { - "epoch": 1.67, - "learning_rate": 4.928650191347214e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.0001829958983103864, + "loss": 0.0127, "step": 154610 }, { - "epoch": 1.67, - "learning_rate": 4.927028604786923e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018298833061737238, + "loss": 0.0137, "step": 154620 }, { - "epoch": 1.67, - "learning_rate": 4.925407018226632e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.00018298076292435836, + "loss": 0.012, "step": 154630 }, { - "epoch": 1.67, - "learning_rate": 4.923785431666342e-05, - "loss": 0.0056, + "epoch": 0.78, + "learning_rate": 0.00018297319523134437, + "loss": 0.0128, "step": 154640 }, { - "epoch": 1.67, - "learning_rate": 4.9221638451060515e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018296562753833035, + "loss": 0.0123, "step": 154650 }, { - "epoch": 1.67, - "learning_rate": 4.920542258545761e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018295805984531633, + "loss": 0.0124, "step": 154660 }, { - "epoch": 1.67, - "learning_rate": 4.91892067198547e-05, - "loss": 0.009, + "epoch": 0.78, + "learning_rate": 0.00018295049215230234, + "loss": 0.0133, "step": 154670 }, { - "epoch": 1.67, - "learning_rate": 4.917299085425179e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.00018294292445928832, + "loss": 0.013, "step": 154680 }, { - "epoch": 1.67, - "learning_rate": 4.9156774988648886e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.0001829353567662743, + "loss": 0.0147, "step": 154690 }, { - "epoch": 1.67, - "learning_rate": 4.9140559123045986e-05, - "loss": 0.01, + "epoch": 0.78, + "learning_rate": 0.0001829277890732603, + "loss": 0.0109, "step": 154700 }, { - "epoch": 1.67, - "learning_rate": 4.912434325744308e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.0001829202213802463, + "loss": 0.0137, "step": 154710 }, { - "epoch": 1.67, - "learning_rate": 4.910812739184017e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.00018291265368723227, + "loss": 0.0109, "step": 154720 }, { - "epoch": 1.67, - "learning_rate": 4.9091911526237264e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018290508599421828, + "loss": 0.0137, "step": 154730 }, { - "epoch": 1.67, - "learning_rate": 4.9075695660634357e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.00018289751830120426, + "loss": 0.0115, "step": 154740 }, { - "epoch": 1.67, - "learning_rate": 4.9059479795031456e-05, - "loss": 0.0085, + "epoch": 0.78, + "learning_rate": 0.00018288995060819024, + "loss": 0.0111, "step": 154750 }, { - "epoch": 1.67, - "learning_rate": 4.904326392942855e-05, - "loss": 0.0061, + "epoch": 0.78, + "learning_rate": 0.00018288238291517625, + "loss": 0.0122, "step": 154760 }, { - "epoch": 1.67, - "learning_rate": 4.902704806382564e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.00018287481522216223, + "loss": 0.011, "step": 154770 }, { - "epoch": 1.67, - "learning_rate": 4.9010832198222734e-05, - "loss": 0.0119, + "epoch": 0.78, + "learning_rate": 0.00018286724752914822, + "loss": 0.0113, "step": 154780 }, { - "epoch": 1.67, - "learning_rate": 4.899461633261983e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.0001828596798361342, + "loss": 0.0159, "step": 154790 }, { - "epoch": 1.67, - "learning_rate": 4.8978400467016927e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.0001828521121431202, + "loss": 0.0114, "step": 154800 }, { - "epoch": 1.67, - "learning_rate": 4.896218460141402e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.0001828445444501062, + "loss": 0.0116, "step": 154810 }, { - "epoch": 1.67, - "learning_rate": 4.894596873581111e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018283697675709217, + "loss": 0.0101, "step": 154820 }, { - "epoch": 1.67, - "learning_rate": 4.8929752870208205e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.00018282940906407818, + "loss": 0.0133, "step": 154830 }, { - "epoch": 1.67, - "learning_rate": 4.89135370046053e-05, - "loss": 0.0061, + "epoch": 0.78, + "learning_rate": 0.00018282184137106416, + "loss": 0.0113, "step": 154840 }, { - "epoch": 1.67, - "learning_rate": 4.889732113900239e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.00018281427367805014, + "loss": 0.013, "step": 154850 }, { - "epoch": 1.67, - "learning_rate": 4.888110527339949e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.00018280670598503615, + "loss": 0.0141, "step": 154860 }, { - "epoch": 1.67, - "learning_rate": 4.886488940779658e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018279913829202213, + "loss": 0.0136, "step": 154870 }, { - "epoch": 1.67, - "learning_rate": 4.8848673542193675e-05, - "loss": 0.0093, + "epoch": 0.78, + "learning_rate": 0.0001827915705990081, + "loss": 0.0107, "step": 154880 }, { - "epoch": 1.67, - "learning_rate": 4.883245767659077e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.00018278400290599412, + "loss": 0.0158, "step": 154890 }, { - "epoch": 1.67, - "learning_rate": 4.881624181098786e-05, - "loss": 0.0052, + "epoch": 0.78, + "learning_rate": 0.0001827764352129801, + "loss": 0.0116, "step": 154900 }, { - "epoch": 1.67, - "learning_rate": 4.880002594538496e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018276886751996608, + "loss": 0.0114, "step": 154910 }, { - "epoch": 1.67, - "learning_rate": 4.878381007978205e-05, - "loss": 0.0085, + "epoch": 0.78, + "learning_rate": 0.0001827612998269521, + "loss": 0.0124, "step": 154920 }, { - "epoch": 1.67, - "learning_rate": 4.8767594214179146e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018275373213393807, + "loss": 0.0138, "step": 154930 }, { - "epoch": 1.67, - "learning_rate": 4.875137834857624e-05, - "loss": 0.0088, + "epoch": 0.78, + "learning_rate": 0.00018274616444092405, + "loss": 0.0102, "step": 154940 }, { - "epoch": 1.68, - "learning_rate": 4.873516248297333e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.00018273859674791004, + "loss": 0.013, "step": 154950 }, { - "epoch": 1.68, - "learning_rate": 4.8718946617370424e-05, - "loss": 0.0051, + "epoch": 0.78, + "learning_rate": 0.00018273102905489604, + "loss": 0.0128, "step": 154960 }, { - "epoch": 1.68, - "learning_rate": 4.8702730751767524e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.00018272346136188203, + "loss": 0.0162, "step": 154970 }, { - "epoch": 1.68, - "learning_rate": 4.8686514886164616e-05, - "loss": 0.0085, + "epoch": 0.78, + "learning_rate": 0.000182715893668868, + "loss": 0.014, "step": 154980 }, { - "epoch": 1.68, - "learning_rate": 4.867029902056171e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018270832597585402, + "loss": 0.0116, "step": 154990 }, { - "epoch": 1.68, - "learning_rate": 4.86540831549588e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018270075828284, + "loss": 0.012, "step": 155000 }, { - "epoch": 1.68, - "eval_cer": 0.9215251973031615, - "eval_loss": 0.005951076280325651, - "eval_runtime": 121.1875, - "eval_samples_per_second": 16.503, - "eval_steps_per_second": 4.126, + "epoch": 0.78, + "eval_cer": 0.9144731670915385, + "eval_loss": 0.009108257479965687, + "eval_runtime": 116.7273, + "eval_samples_per_second": 17.134, + "eval_steps_per_second": 4.283, "step": 155000 }, { - "epoch": 1.68, - "learning_rate": 4.863786728935591e-05, - "loss": 0.0102, + "epoch": 0.78, + "learning_rate": 0.00018269319058982598, + "loss": 0.0115, "step": 155010 }, { - "epoch": 1.68, - "learning_rate": 4.8621651423753e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.000182685622896812, + "loss": 0.0206, "step": 155020 }, { - "epoch": 1.68, - "learning_rate": 4.8605435558150094e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.00018267805520379797, + "loss": 0.0122, "step": 155030 }, { - "epoch": 1.68, - "learning_rate": 4.8589219692547186e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.00018267048751078395, + "loss": 0.0132, "step": 155040 }, { - "epoch": 1.68, - "learning_rate": 4.857300382694428e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018266291981776996, + "loss": 0.0166, "step": 155050 }, { - "epoch": 1.68, - "learning_rate": 4.855678796134138e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018265535212475594, + "loss": 0.0127, "step": 155060 }, { - "epoch": 1.68, - "learning_rate": 4.854057209573847e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018264778443174192, + "loss": 0.0139, "step": 155070 }, { - "epoch": 1.68, - "learning_rate": 4.8524356230135564e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018264021673872793, + "loss": 0.0103, "step": 155080 }, { - "epoch": 1.68, - "learning_rate": 4.850814036453266e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.0001826326490457139, + "loss": 0.0136, "step": 155090 }, { - "epoch": 1.68, - "learning_rate": 4.849192449892975e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.0001826250813526999, + "loss": 0.0147, "step": 155100 }, { - "epoch": 1.68, - "learning_rate": 4.847570863332685e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018261751365968587, + "loss": 0.0111, "step": 155110 }, { - "epoch": 1.68, - "learning_rate": 4.845949276772394e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.00018260994596667188, + "loss": 0.0137, "step": 155120 }, { - "epoch": 1.68, - "learning_rate": 4.8443276902121035e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.00018260237827365786, + "loss": 0.0121, "step": 155130 }, { - "epoch": 1.68, - "learning_rate": 4.842706103651813e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018259481058064385, + "loss": 0.0143, "step": 155140 }, { - "epoch": 1.68, - "learning_rate": 4.841084517091522e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018258724288762985, + "loss": 0.0134, "step": 155150 }, { - "epoch": 1.68, - "learning_rate": 4.839462930531231e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018257967519461584, + "loss": 0.0147, "step": 155160 }, { - "epoch": 1.68, - "learning_rate": 4.837841343970941e-05, - "loss": 0.005, + "epoch": 0.78, + "learning_rate": 0.00018257210750160182, + "loss": 0.0109, "step": 155170 }, { - "epoch": 1.68, - "learning_rate": 4.8362197574106505e-05, - "loss": 0.0083, + "epoch": 0.78, + "learning_rate": 0.00018256453980858783, + "loss": 0.0182, "step": 155180 }, { - "epoch": 1.68, - "learning_rate": 4.83459817085036e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.0001825569721155738, + "loss": 0.0164, "step": 155190 }, { - "epoch": 1.68, - "learning_rate": 4.832976584290069e-05, - "loss": 0.0097, + "epoch": 0.78, + "learning_rate": 0.0001825494044225598, + "loss": 0.017, "step": 155200 }, { - "epoch": 1.68, - "learning_rate": 4.831354997729778e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.0001825418367295458, + "loss": 0.012, "step": 155210 }, { - "epoch": 1.68, - "learning_rate": 4.829733411169488e-05, - "loss": 0.0103, + "epoch": 0.78, + "learning_rate": 0.00018253426903653178, + "loss": 0.015, "step": 155220 }, { - "epoch": 1.68, - "learning_rate": 4.8281118246091976e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.00018252670134351773, + "loss": 0.0128, "step": 155230 }, { - "epoch": 1.68, - "learning_rate": 4.826490238048907e-05, - "loss": 0.0091, + "epoch": 0.78, + "learning_rate": 0.00018251913365050371, + "loss": 0.0164, "step": 155240 }, { - "epoch": 1.68, - "learning_rate": 4.824868651488616e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.00018251156595748972, + "loss": 0.0184, "step": 155250 }, { - "epoch": 1.68, - "learning_rate": 4.8232470649283254e-05, - "loss": 0.0093, + "epoch": 0.78, + "learning_rate": 0.0001825039982644757, + "loss": 0.0144, "step": 155260 }, { - "epoch": 1.68, - "learning_rate": 4.8216254783680346e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018249643057146169, + "loss": 0.0143, "step": 155270 }, { - "epoch": 1.68, - "learning_rate": 4.8200038918077446e-05, - "loss": 0.0057, + "epoch": 0.78, + "learning_rate": 0.0001824888628784477, + "loss": 0.0101, "step": 155280 }, { - "epoch": 1.68, - "learning_rate": 4.818382305247454e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.00018248129518543368, + "loss": 0.0154, "step": 155290 }, { - "epoch": 1.68, - "learning_rate": 4.816760718687163e-05, - "loss": 0.0056, + "epoch": 0.78, + "learning_rate": 0.00018247372749241966, + "loss": 0.0149, "step": 155300 }, { - "epoch": 1.68, - "learning_rate": 4.8151391321268724e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018246615979940567, + "loss": 0.0109, "step": 155310 }, { - "epoch": 1.68, - "learning_rate": 4.813517545566582e-05, - "loss": 0.0104, + "epoch": 0.78, + "learning_rate": 0.00018245859210639165, + "loss": 0.0128, "step": 155320 }, { - "epoch": 1.68, - "learning_rate": 4.8118959590062916e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.00018245102441337763, + "loss": 0.0135, "step": 155330 }, { - "epoch": 1.68, - "learning_rate": 4.810274372446001e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.0001824434567203636, + "loss": 0.014, "step": 155340 }, { - "epoch": 1.68, - "learning_rate": 4.80865278588571e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018243588902734962, + "loss": 0.0136, "step": 155350 }, { - "epoch": 1.68, - "learning_rate": 4.8070311993254195e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.0001824283213343356, + "loss": 0.0132, "step": 155360 }, { - "epoch": 1.68, - "learning_rate": 4.805409612765129e-05, - "loss": 0.0085, + "epoch": 0.78, + "learning_rate": 0.00018242075364132158, + "loss": 0.0132, "step": 155370 }, { - "epoch": 1.68, - "learning_rate": 4.803788026204839e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.0001824131859483076, + "loss": 0.0131, "step": 155380 }, { - "epoch": 1.68, - "learning_rate": 4.802166439644548e-05, - "loss": 0.0088, + "epoch": 0.78, + "learning_rate": 0.00018240561825529357, + "loss": 0.0112, "step": 155390 }, { - "epoch": 1.68, - "learning_rate": 4.800544853084257e-05, - "loss": 0.0053, + "epoch": 0.78, + "learning_rate": 0.00018239805056227955, + "loss": 0.0143, "step": 155400 }, { - "epoch": 1.68, - "learning_rate": 4.7989232665239665e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018239048286926556, + "loss": 0.0127, "step": 155410 }, { - "epoch": 1.68, - "learning_rate": 4.797301679963676e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018238291517625154, + "loss": 0.0128, "step": 155420 }, { - "epoch": 1.68, - "learning_rate": 4.795680093403385e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018237534748323752, + "loss": 0.0122, "step": 155430 }, { - "epoch": 1.68, - "learning_rate": 4.794058506843095e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.00018236777979022353, + "loss": 0.0105, "step": 155440 }, { - "epoch": 1.68, - "learning_rate": 4.792436920282804e-05, - "loss": 0.0101, + "epoch": 0.78, + "learning_rate": 0.00018236021209720951, + "loss": 0.0133, "step": 155450 }, { - "epoch": 1.68, - "learning_rate": 4.7908153337225136e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.0001823526444041955, + "loss": 0.0129, "step": 155460 }, { - "epoch": 1.68, - "learning_rate": 4.789193747162223e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.0001823450767111815, + "loss": 0.0138, "step": 155470 }, { - "epoch": 1.68, - "learning_rate": 4.787572160601932e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018233750901816749, + "loss": 0.0088, "step": 155480 }, { - "epoch": 1.68, - "learning_rate": 4.785950574041642e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.00018232994132515347, + "loss": 0.0127, "step": 155490 }, { - "epoch": 1.68, - "learning_rate": 4.7843289874813513e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.00018232237363213945, + "loss": 0.0125, "step": 155500 }, { - "epoch": 1.68, - "learning_rate": 4.7827074009210606e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018231480593912546, + "loss": 0.0124, "step": 155510 }, { - "epoch": 1.68, - "learning_rate": 4.78108581436077e-05, - "loss": 0.0053, + "epoch": 0.78, + "learning_rate": 0.00018230723824611144, + "loss": 0.0138, "step": 155520 }, { - "epoch": 1.68, - "learning_rate": 4.779464227800479e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018229967055309742, + "loss": 0.0122, "step": 155530 }, { - "epoch": 1.68, - "learning_rate": 4.777842641240189e-05, - "loss": 0.005, + "epoch": 0.78, + "learning_rate": 0.00018229210286008343, + "loss": 0.0136, "step": 155540 }, { - "epoch": 1.68, - "learning_rate": 4.7762210546798984e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.0001822845351670694, + "loss": 0.0114, "step": 155550 }, { - "epoch": 1.68, - "learning_rate": 4.774599468119608e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.0001822769674740554, + "loss": 0.0147, "step": 155560 }, { - "epoch": 1.68, - "learning_rate": 4.772977881559317e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.0001822693997810414, + "loss": 0.0114, "step": 155570 }, { - "epoch": 1.68, - "learning_rate": 4.771356294999026e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.00018226183208802738, + "loss": 0.0108, "step": 155580 }, { - "epoch": 1.68, - "learning_rate": 4.7697347084387355e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018225426439501336, + "loss": 0.0138, "step": 155590 }, { - "epoch": 1.68, - "learning_rate": 4.7681131218784454e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018224669670199937, + "loss": 0.014, "step": 155600 }, { - "epoch": 1.68, - "learning_rate": 4.766491535318155e-05, - "loss": 0.0093, + "epoch": 0.79, + "learning_rate": 0.00018223912900898535, + "loss": 0.0133, "step": 155610 }, { - "epoch": 1.68, - "learning_rate": 4.764869948757864e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.00018223156131597133, + "loss": 0.0132, "step": 155620 }, { - "epoch": 1.68, - "learning_rate": 4.763248362197573e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018222399362295734, + "loss": 0.0134, "step": 155630 }, { - "epoch": 1.68, - "learning_rate": 4.7616267756372825e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018221642592994332, + "loss": 0.0174, "step": 155640 }, { - "epoch": 1.68, - "learning_rate": 4.7600051890769925e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.0001822088582369293, + "loss": 0.013, "step": 155650 }, { - "epoch": 1.68, - "learning_rate": 4.758383602516702e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018220129054391531, + "loss": 0.012, "step": 155660 }, { - "epoch": 1.68, - "learning_rate": 4.756762015956411e-05, - "loss": 0.0085, + "epoch": 0.79, + "learning_rate": 0.0001821937228509013, + "loss": 0.0115, "step": 155670 }, { - "epoch": 1.68, - "learning_rate": 4.75514042939612e-05, - "loss": 0.0085, + "epoch": 0.79, + "learning_rate": 0.00018218615515788728, + "loss": 0.0114, "step": 155680 }, { - "epoch": 1.68, - "learning_rate": 4.7535188428358296e-05, - "loss": 0.009, + "epoch": 0.79, + "learning_rate": 0.00018217858746487326, + "loss": 0.0108, "step": 155690 }, { - "epoch": 1.68, - "learning_rate": 4.751897256275539e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.00018217101977185927, + "loss": 0.0118, "step": 155700 }, { - "epoch": 1.68, - "learning_rate": 4.750275669715249e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.00018216345207884525, + "loss": 0.0119, "step": 155710 }, { - "epoch": 1.68, - "learning_rate": 4.748654083154958e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018215588438583123, + "loss": 0.0112, "step": 155720 }, { - "epoch": 1.68, - "learning_rate": 4.747032496594668e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018214831669281724, + "loss": 0.0102, "step": 155730 }, { - "epoch": 1.68, - "learning_rate": 4.745410910034377e-05, - "loss": 0.0079, + "epoch": 0.79, + "learning_rate": 0.00018214074899980322, + "loss": 0.0129, "step": 155740 }, { - "epoch": 1.68, - "learning_rate": 4.743789323474087e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.0001821331813067892, + "loss": 0.0142, "step": 155750 }, { - "epoch": 1.68, - "learning_rate": 4.7421677369137965e-05, - "loss": 0.0091, + "epoch": 0.79, + "learning_rate": 0.0001821256136137752, + "loss": 0.0108, "step": 155760 }, { - "epoch": 1.68, - "learning_rate": 4.740546150353506e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.0001821180459207612, + "loss": 0.0133, "step": 155770 }, { - "epoch": 1.68, - "learning_rate": 4.738924563793215e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018211047822774717, + "loss": 0.0161, "step": 155780 }, { - "epoch": 1.68, - "learning_rate": 4.7373029772329244e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018210291053473318, + "loss": 0.0138, "step": 155790 }, { - "epoch": 1.68, - "learning_rate": 4.735681390672634e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018209534284171916, + "loss": 0.011, "step": 155800 }, { - "epoch": 1.68, - "learning_rate": 4.7340598041123436e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018208777514870514, + "loss": 0.0129, "step": 155810 }, { - "epoch": 1.68, - "learning_rate": 4.732438217552053e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018208020745569115, + "loss": 0.0124, "step": 155820 }, { - "epoch": 1.68, - "learning_rate": 4.730816630991762e-05, - "loss": 0.009, + "epoch": 0.79, + "learning_rate": 0.00018207263976267713, + "loss": 0.0126, "step": 155830 }, { - "epoch": 1.68, - "learning_rate": 4.7291950444314714e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018206507206966312, + "loss": 0.0143, "step": 155840 }, { - "epoch": 1.68, - "learning_rate": 4.727573457871181e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.0001820575043766491, + "loss": 0.0099, "step": 155850 }, { - "epoch": 1.68, - "learning_rate": 4.7259518713108906e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.0001820499366836351, + "loss": 0.0129, "step": 155860 }, { - "epoch": 1.69, - "learning_rate": 4.7243302847506e-05, - "loss": 0.006, + "epoch": 0.79, + "learning_rate": 0.0001820423689906211, + "loss": 0.0159, "step": 155870 }, { - "epoch": 1.69, - "learning_rate": 4.722708698190309e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018203480129760707, + "loss": 0.0127, "step": 155880 }, { - "epoch": 1.69, - "learning_rate": 4.7210871116300185e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018202723360459308, + "loss": 0.0144, "step": 155890 }, { - "epoch": 1.69, - "learning_rate": 4.719465525069728e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018201966591157906, + "loss": 0.0133, "step": 155900 }, { - "epoch": 1.69, - "learning_rate": 4.717843938509438e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018201209821856504, + "loss": 0.0155, "step": 155910 }, { - "epoch": 1.69, - "learning_rate": 4.716222351949147e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018200453052555105, + "loss": 0.0125, "step": 155920 }, { - "epoch": 1.69, - "learning_rate": 4.714600765388856e-05, - "loss": 0.0054, + "epoch": 0.79, + "learning_rate": 0.00018199696283253703, + "loss": 0.0125, "step": 155930 }, { - "epoch": 1.69, - "learning_rate": 4.7129791788285655e-05, - "loss": 0.0043, + "epoch": 0.79, + "learning_rate": 0.000181989395139523, + "loss": 0.0128, "step": 155940 }, { - "epoch": 1.69, - "learning_rate": 4.711357592268275e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018198182744650902, + "loss": 0.0123, "step": 155950 }, { - "epoch": 1.69, - "learning_rate": 4.709736005707985e-05, - "loss": 0.008, + "epoch": 0.79, + "learning_rate": 0.000181974259753495, + "loss": 0.0128, "step": 155960 }, { - "epoch": 1.69, - "learning_rate": 4.708114419147694e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018196669206048098, + "loss": 0.0139, "step": 155970 }, { - "epoch": 1.69, - "learning_rate": 4.706492832587403e-05, - "loss": 0.008, + "epoch": 0.79, + "learning_rate": 0.000181959124367467, + "loss": 0.0133, "step": 155980 }, { - "epoch": 1.69, - "learning_rate": 4.7048712460271126e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018195155667445297, + "loss": 0.01, "step": 155990 }, { - "epoch": 1.69, - "learning_rate": 4.703249659466822e-05, - "loss": 0.0118, + "epoch": 0.79, + "learning_rate": 0.00018194398898143895, + "loss": 0.013, "step": 156000 }, { - "epoch": 1.69, - "eval_cer": 0.9215477809800273, - "eval_loss": 0.006024594884365797, - "eval_runtime": 121.1774, - "eval_samples_per_second": 16.505, - "eval_steps_per_second": 4.126, + "epoch": 0.79, + "eval_cer": 0.9144838414489178, + "eval_loss": 0.00919434055685997, + "eval_runtime": 116.631, + "eval_samples_per_second": 17.148, + "eval_steps_per_second": 4.287, "step": 156000 }, { - "epoch": 1.69, - "learning_rate": 4.701628072906531e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018193642128842494, + "loss": 0.0116, "step": 156010 }, { - "epoch": 1.69, - "learning_rate": 4.700006486346241e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018192885359541094, + "loss": 0.0135, "step": 156020 }, { - "epoch": 1.69, - "learning_rate": 4.6983848997859503e-05, - "loss": 0.0091, + "epoch": 0.79, + "learning_rate": 0.00018192128590239693, + "loss": 0.0128, "step": 156030 }, { - "epoch": 1.69, - "learning_rate": 4.6967633132256596e-05, - "loss": 0.005, + "epoch": 0.79, + "learning_rate": 0.0001819137182093829, + "loss": 0.0144, "step": 156040 }, { - "epoch": 1.69, - "learning_rate": 4.695141726665369e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018190615051636892, + "loss": 0.0157, "step": 156050 }, { - "epoch": 1.69, - "learning_rate": 4.693520140105078e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.0001818985828233549, + "loss": 0.0149, "step": 156060 }, { - "epoch": 1.69, - "learning_rate": 4.691898553544788e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.00018189101513034088, + "loss": 0.0116, "step": 156070 }, { - "epoch": 1.69, - "learning_rate": 4.6902769669844974e-05, - "loss": 0.0082, + "epoch": 0.79, + "learning_rate": 0.0001818834474373269, + "loss": 0.0124, "step": 156080 }, { - "epoch": 1.69, - "learning_rate": 4.688655380424207e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018187587974431287, + "loss": 0.0116, "step": 156090 }, { - "epoch": 1.69, - "learning_rate": 4.687033793863916e-05, - "loss": 0.0079, + "epoch": 0.79, + "learning_rate": 0.00018186831205129885, + "loss": 0.014, "step": 156100 }, { - "epoch": 1.69, - "learning_rate": 4.685412207303625e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.00018186074435828486, + "loss": 0.0123, "step": 156110 }, { - "epoch": 1.69, - "learning_rate": 4.683790620743335e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.00018185317666527084, + "loss": 0.0124, "step": 156120 }, { - "epoch": 1.69, - "learning_rate": 4.6821690341830444e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018184560897225682, + "loss": 0.0124, "step": 156130 }, { - "epoch": 1.69, - "learning_rate": 4.680547447622754e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018183804127924283, + "loss": 0.0112, "step": 156140 }, { - "epoch": 1.69, - "learning_rate": 4.678925861062463e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.0001818304735862288, + "loss": 0.012, "step": 156150 }, { - "epoch": 1.69, - "learning_rate": 4.677304274502172e-05, - "loss": 0.0079, + "epoch": 0.79, + "learning_rate": 0.0001818229058932148, + "loss": 0.0125, "step": 156160 }, { - "epoch": 1.69, - "learning_rate": 4.6756826879418815e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.0001818153382002008, + "loss": 0.013, "step": 156170 }, { - "epoch": 1.69, - "learning_rate": 4.6740611013815915e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018180777050718678, + "loss": 0.0136, "step": 156180 }, { - "epoch": 1.69, - "learning_rate": 4.672439514821301e-05, - "loss": 0.0085, + "epoch": 0.79, + "learning_rate": 0.00018180020281417276, + "loss": 0.0117, "step": 156190 }, { - "epoch": 1.69, - "learning_rate": 4.67081792826101e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018179263512115875, + "loss": 0.0137, "step": 156200 }, { - "epoch": 1.69, - "learning_rate": 4.669196341700719e-05, - "loss": 0.0054, + "epoch": 0.79, + "learning_rate": 0.00018178506742814475, + "loss": 0.0122, "step": 156210 }, { - "epoch": 1.69, - "learning_rate": 4.6675747551404286e-05, - "loss": 0.0058, + "epoch": 0.79, + "learning_rate": 0.00018177749973513074, + "loss": 0.0134, "step": 156220 }, { - "epoch": 1.69, - "learning_rate": 4.6659531685801385e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018176993204211672, + "loss": 0.0133, "step": 156230 }, { - "epoch": 1.69, - "learning_rate": 4.664331582019848e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.00018176236434910273, + "loss": 0.0091, "step": 156240 }, { - "epoch": 1.69, - "learning_rate": 4.662709995459557e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.0001817547966560887, + "loss": 0.0171, "step": 156250 }, { - "epoch": 1.69, - "learning_rate": 4.6610884088992664e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.0001817472289630747, + "loss": 0.0132, "step": 156260 }, { - "epoch": 1.69, - "learning_rate": 4.6594668223389756e-05, - "loss": 0.0054, + "epoch": 0.79, + "learning_rate": 0.0001817396612700607, + "loss": 0.0129, "step": 156270 }, { - "epoch": 1.69, - "learning_rate": 4.657845235778685e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018173209357704668, + "loss": 0.0103, "step": 156280 }, { - "epoch": 1.69, - "learning_rate": 4.656223649218395e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018172452588403266, + "loss": 0.014, "step": 156290 }, { - "epoch": 1.69, - "learning_rate": 4.654602062658104e-05, - "loss": 0.0085, + "epoch": 0.79, + "learning_rate": 0.00018171695819101867, + "loss": 0.0107, "step": 156300 }, { - "epoch": 1.69, - "learning_rate": 4.6529804760978134e-05, - "loss": 0.0053, + "epoch": 0.79, + "learning_rate": 0.00018170939049800465, + "loss": 0.013, "step": 156310 }, { - "epoch": 1.69, - "learning_rate": 4.651358889537523e-05, - "loss": 0.0051, + "epoch": 0.79, + "learning_rate": 0.00018170182280499063, + "loss": 0.0106, "step": 156320 }, { - "epoch": 1.69, - "learning_rate": 4.649737302977232e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018169425511197664, + "loss": 0.0093, "step": 156330 }, { - "epoch": 1.69, - "learning_rate": 4.648115716416942e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018168668741896262, + "loss": 0.012, "step": 156340 }, { - "epoch": 1.69, - "learning_rate": 4.646494129856651e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.0001816791197259486, + "loss": 0.0085, "step": 156350 }, { - "epoch": 1.69, - "learning_rate": 4.6448725432963605e-05, - "loss": 0.0059, + "epoch": 0.79, + "learning_rate": 0.00018167155203293459, + "loss": 0.0136, "step": 156360 }, { - "epoch": 1.69, - "learning_rate": 4.64325095673607e-05, - "loss": 0.0088, + "epoch": 0.79, + "learning_rate": 0.0001816639843399206, + "loss": 0.0105, "step": 156370 }, { - "epoch": 1.69, - "learning_rate": 4.641629370175779e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018165641664690657, + "loss": 0.0127, "step": 156380 }, { - "epoch": 1.69, - "learning_rate": 4.640007783615489e-05, - "loss": 0.0097, + "epoch": 0.79, + "learning_rate": 0.00018164884895389256, + "loss": 0.011, "step": 156390 }, { - "epoch": 1.69, - "learning_rate": 4.638386197055198e-05, - "loss": 0.0099, + "epoch": 0.79, + "learning_rate": 0.00018164128126087856, + "loss": 0.01, "step": 156400 }, { - "epoch": 1.69, - "learning_rate": 4.6367646104949075e-05, - "loss": 0.0048, + "epoch": 0.79, + "learning_rate": 0.00018163371356786455, + "loss": 0.0115, "step": 156410 }, { - "epoch": 1.69, - "learning_rate": 4.635143023934617e-05, - "loss": 0.0095, + "epoch": 0.79, + "learning_rate": 0.00018162614587485053, + "loss": 0.0155, "step": 156420 }, { - "epoch": 1.69, - "learning_rate": 4.633521437374326e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.00018161857818183654, + "loss": 0.011, "step": 156430 }, { - "epoch": 1.69, - "learning_rate": 4.631899850814035e-05, - "loss": 0.0051, + "epoch": 0.79, + "learning_rate": 0.00018161101048882252, + "loss": 0.0144, "step": 156440 }, { - "epoch": 1.69, - "learning_rate": 4.630278264253746e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.0001816034427958085, + "loss": 0.0128, "step": 156450 }, { - "epoch": 1.69, - "learning_rate": 4.628656677693455e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.0001815958751027945, + "loss": 0.0154, "step": 156460 }, { - "epoch": 1.69, - "learning_rate": 4.6270350911331645e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.0001815883074097805, + "loss": 0.0142, "step": 156470 }, { - "epoch": 1.69, - "learning_rate": 4.625413504572874e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018158073971676647, + "loss": 0.0153, "step": 156480 }, { - "epoch": 1.69, - "learning_rate": 4.623791918012584e-05, - "loss": 0.0106, + "epoch": 0.79, + "learning_rate": 0.00018157317202375243, + "loss": 0.0105, "step": 156490 }, { - "epoch": 1.69, - "learning_rate": 4.622170331452293e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018156560433073843, + "loss": 0.0127, "step": 156500 }, { - "epoch": 1.69, - "learning_rate": 4.620548744892002e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018155803663772442, + "loss": 0.0116, "step": 156510 }, { - "epoch": 1.69, - "learning_rate": 4.6189271583317116e-05, - "loss": 0.0084, + "epoch": 0.79, + "learning_rate": 0.0001815504689447104, + "loss": 0.0123, "step": 156520 }, { - "epoch": 1.69, - "learning_rate": 4.617305571771421e-05, - "loss": 0.0086, + "epoch": 0.79, + "learning_rate": 0.0001815429012516964, + "loss": 0.0115, "step": 156530 }, { - "epoch": 1.69, - "learning_rate": 4.615683985211131e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.0001815353335586824, + "loss": 0.0195, "step": 156540 }, { - "epoch": 1.69, - "learning_rate": 4.61406239865084e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018152776586566837, + "loss": 0.0108, "step": 156550 }, { - "epoch": 1.69, - "learning_rate": 4.612440812090549e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018152019817265438, + "loss": 0.014, "step": 156560 }, { - "epoch": 1.69, - "learning_rate": 4.6108192255302586e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018151263047964036, + "loss": 0.0119, "step": 156570 }, { - "epoch": 1.69, - "learning_rate": 4.609197638969968e-05, - "loss": 0.0056, + "epoch": 0.79, + "learning_rate": 0.00018150506278662634, + "loss": 0.0114, "step": 156580 }, { - "epoch": 1.69, - "learning_rate": 4.607576052409677e-05, - "loss": 0.0089, + "epoch": 0.79, + "learning_rate": 0.00018149749509361232, + "loss": 0.0134, "step": 156590 }, { - "epoch": 1.69, - "learning_rate": 4.605954465849387e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018148992740059833, + "loss": 0.012, "step": 156600 }, { - "epoch": 1.69, - "learning_rate": 4.6043328792890964e-05, - "loss": 0.0096, + "epoch": 0.79, + "learning_rate": 0.0001814823597075843, + "loss": 0.0273, "step": 156610 }, { - "epoch": 1.69, - "learning_rate": 4.6027112927288057e-05, - "loss": 0.009, + "epoch": 0.79, + "learning_rate": 0.0001814747920145703, + "loss": 0.0154, "step": 156620 }, { - "epoch": 1.69, - "learning_rate": 4.601089706168515e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.0001814672243215563, + "loss": 0.0153, "step": 156630 }, { - "epoch": 1.69, - "learning_rate": 4.599468119608224e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.00018145965662854228, + "loss": 0.0129, "step": 156640 }, { - "epoch": 1.69, - "learning_rate": 4.597846533047934e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018145208893552826, + "loss": 0.0135, "step": 156650 }, { - "epoch": 1.69, - "learning_rate": 4.5962249464876434e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018144452124251427, + "loss": 0.0116, "step": 156660 }, { - "epoch": 1.69, - "learning_rate": 4.594603359927353e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018143695354950025, + "loss": 0.0133, "step": 156670 }, { - "epoch": 1.69, - "learning_rate": 4.592981773367062e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018142938585648624, + "loss": 0.0105, "step": 156680 }, { - "epoch": 1.69, - "learning_rate": 4.591360186806771e-05, - "loss": 0.0118, + "epoch": 0.79, + "learning_rate": 0.00018142181816347224, + "loss": 0.0111, "step": 156690 }, { - "epoch": 1.69, - "learning_rate": 4.589738600246481e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018141425047045823, + "loss": 0.0115, "step": 156700 }, { - "epoch": 1.69, - "learning_rate": 4.5881170136861905e-05, - "loss": 0.0092, + "epoch": 0.79, + "learning_rate": 0.0001814066827774442, + "loss": 0.0133, "step": 156710 }, { - "epoch": 1.69, - "learning_rate": 4.5864954271259e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018139911508443022, + "loss": 0.0111, "step": 156720 }, { - "epoch": 1.69, - "learning_rate": 4.584873840565609e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.0001813915473914162, + "loss": 0.0119, "step": 156730 }, { - "epoch": 1.69, - "learning_rate": 4.583252254005318e-05, - "loss": 0.0058, + "epoch": 0.79, + "learning_rate": 0.00018138397969840218, + "loss": 0.0122, "step": 156740 }, { - "epoch": 1.69, - "learning_rate": 4.5816306674450276e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018137641200538816, + "loss": 0.014, "step": 156750 }, { - "epoch": 1.69, - "learning_rate": 4.5800090808847375e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018136884431237417, + "loss": 0.0091, "step": 156760 }, { - "epoch": 1.69, - "learning_rate": 4.578387494324447e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018136127661936015, + "loss": 0.0101, "step": 156770 }, { - "epoch": 1.69, - "learning_rate": 4.576765907764156e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018135370892634613, + "loss": 0.0108, "step": 156780 }, { - "epoch": 1.69, - "learning_rate": 4.5751443212038654e-05, - "loss": 0.0058, + "epoch": 0.79, + "learning_rate": 0.00018134614123333214, + "loss": 0.0159, "step": 156790 }, { - "epoch": 1.7, - "learning_rate": 4.5735227346435746e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018133857354031812, + "loss": 0.0131, "step": 156800 }, { - "epoch": 1.7, - "learning_rate": 4.5719011480832846e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.0001813310058473041, + "loss": 0.011, "step": 156810 }, { - "epoch": 1.7, - "learning_rate": 4.570279561522994e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.0001813234381542901, + "loss": 0.0105, "step": 156820 }, { - "epoch": 1.7, - "learning_rate": 4.568657974962703e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.0001813158704612761, + "loss": 0.0155, "step": 156830 }, { - "epoch": 1.7, - "learning_rate": 4.5670363884024124e-05, - "loss": 0.0054, + "epoch": 0.79, + "learning_rate": 0.00018130830276826207, + "loss": 0.0148, "step": 156840 }, { - "epoch": 1.7, - "learning_rate": 4.565414801842122e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018130073507524808, + "loss": 0.0139, "step": 156850 }, { - "epoch": 1.7, - "learning_rate": 4.563793215281831e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018129316738223406, + "loss": 0.0119, "step": 156860 }, { - "epoch": 1.7, - "learning_rate": 4.562171628721541e-05, - "loss": 0.0105, + "epoch": 0.79, + "learning_rate": 0.00018128559968922005, + "loss": 0.0145, "step": 156870 }, { - "epoch": 1.7, - "learning_rate": 4.56055004216125e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018127803199620605, + "loss": 0.0132, "step": 156880 }, { - "epoch": 1.7, - "learning_rate": 4.5589284556009595e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018127046430319204, + "loss": 0.0132, "step": 156890 }, { - "epoch": 1.7, - "learning_rate": 4.557306869040669e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.00018126289661017802, + "loss": 0.012, "step": 156900 }, { - "epoch": 1.7, - "learning_rate": 4.555685282480378e-05, - "loss": 0.0058, + "epoch": 0.79, + "learning_rate": 0.000181255328917164, + "loss": 0.012, "step": 156910 }, { - "epoch": 1.7, - "learning_rate": 4.554063695920088e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018124776122415, + "loss": 0.0128, "step": 156920 }, { - "epoch": 1.7, - "learning_rate": 4.552442109359797e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.000181240193531136, + "loss": 0.0122, "step": 156930 }, { - "epoch": 1.7, - "learning_rate": 4.5508205227995065e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018123262583812197, + "loss": 0.0125, "step": 156940 }, { - "epoch": 1.7, - "learning_rate": 4.549198936239216e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.00018122505814510798, + "loss": 0.0148, "step": 156950 }, { - "epoch": 1.7, - "learning_rate": 4.547577349678925e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018121749045209396, + "loss": 0.0116, "step": 156960 }, { - "epoch": 1.7, - "learning_rate": 4.545955763118635e-05, - "loss": 0.0052, + "epoch": 0.79, + "learning_rate": 0.00018120992275907994, + "loss": 0.0112, "step": 156970 }, { - "epoch": 1.7, - "learning_rate": 4.544334176558344e-05, - "loss": 0.006, + "epoch": 0.79, + "learning_rate": 0.00018120235506606595, + "loss": 0.0101, "step": 156980 }, { - "epoch": 1.7, - "learning_rate": 4.5427125899980536e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018119478737305193, + "loss": 0.0123, "step": 156990 }, { - "epoch": 1.7, - "learning_rate": 4.541091003437763e-05, - "loss": 0.0058, + "epoch": 0.79, + "learning_rate": 0.0001811872196800379, + "loss": 0.0119, "step": 157000 }, { - "epoch": 1.7, - "eval_cer": 0.9215112996558595, - "eval_loss": 0.005920048803091049, - "eval_runtime": 121.2838, - "eval_samples_per_second": 16.49, - "eval_steps_per_second": 4.123, + "epoch": 0.79, + "eval_cer": 0.9144983973907989, + "eval_loss": 0.009071653708815575, + "eval_runtime": 116.5721, + "eval_samples_per_second": 17.157, + "eval_steps_per_second": 4.289, "step": 157000 }, { - "epoch": 1.7, - "learning_rate": 4.539469416877472e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018117965198702392, + "loss": 0.0129, "step": 157010 }, { - "epoch": 1.7, - "learning_rate": 4.5378478303171814e-05, - "loss": 0.0054, + "epoch": 0.79, + "learning_rate": 0.0001811720842940099, + "loss": 0.0134, "step": 157020 }, { - "epoch": 1.7, - "learning_rate": 4.536226243756891e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018116451660099588, + "loss": 0.0115, "step": 157030 }, { - "epoch": 1.7, - "learning_rate": 4.5346046571966006e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.0001811569489079819, + "loss": 0.015, "step": 157040 }, { - "epoch": 1.7, - "learning_rate": 4.53298307063631e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018114938121496787, + "loss": 0.0136, "step": 157050 }, { - "epoch": 1.7, - "learning_rate": 4.531361484076019e-05, - "loss": 0.0052, + "epoch": 0.79, + "learning_rate": 0.00018114181352195386, + "loss": 0.0166, "step": 157060 }, { - "epoch": 1.7, - "learning_rate": 4.5297398975157284e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018113424582893984, + "loss": 0.0115, "step": 157070 }, { - "epoch": 1.7, - "learning_rate": 4.5281183109554384e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018112667813592585, + "loss": 0.0144, "step": 157080 }, { - "epoch": 1.7, - "learning_rate": 4.5264967243951477e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018111911044291183, + "loss": 0.019, "step": 157090 }, { - "epoch": 1.7, - "learning_rate": 4.524875137834857e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.0001811115427498978, + "loss": 0.0121, "step": 157100 }, { - "epoch": 1.7, - "learning_rate": 4.523253551274566e-05, - "loss": 0.0054, + "epoch": 0.79, + "learning_rate": 0.00018110397505688382, + "loss": 0.0156, "step": 157110 }, { - "epoch": 1.7, - "learning_rate": 4.5216319647142755e-05, - "loss": 0.006, + "epoch": 0.79, + "learning_rate": 0.0001810964073638698, + "loss": 0.014, "step": 157120 }, { - "epoch": 1.7, - "learning_rate": 4.5200103781539854e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018108883967085578, + "loss": 0.0136, "step": 157130 }, { - "epoch": 1.7, - "learning_rate": 4.518388791593695e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.0001810812719778418, + "loss": 0.0128, "step": 157140 }, { - "epoch": 1.7, - "learning_rate": 4.516767205033404e-05, - "loss": 0.009, + "epoch": 0.79, + "learning_rate": 0.00018107370428482777, + "loss": 0.0151, "step": 157150 }, { - "epoch": 1.7, - "learning_rate": 4.515145618473113e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018106613659181375, + "loss": 0.0142, "step": 157160 }, { - "epoch": 1.7, - "learning_rate": 4.513524031912823e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018105856889879976, + "loss": 0.0154, "step": 157170 }, { - "epoch": 1.7, - "learning_rate": 4.511902445352533e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018105100120578574, + "loss": 0.0146, "step": 157180 }, { - "epoch": 1.7, - "learning_rate": 4.5102808587922424e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018104343351277172, + "loss": 0.0104, "step": 157190 }, { - "epoch": 1.7, - "learning_rate": 4.508659272231952e-05, - "loss": 0.0082, + "epoch": 0.79, + "learning_rate": 0.00018103586581975773, + "loss": 0.0094, "step": 157200 }, { - "epoch": 1.7, - "learning_rate": 4.507037685671661e-05, - "loss": 0.008, + "epoch": 0.79, + "learning_rate": 0.0001810282981267437, + "loss": 0.0141, "step": 157210 }, { - "epoch": 1.7, - "learning_rate": 4.50541609911137e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.0001810207304337297, + "loss": 0.0138, "step": 157220 }, { - "epoch": 1.7, - "learning_rate": 4.50379451255108e-05, - "loss": 0.0059, + "epoch": 0.79, + "learning_rate": 0.0001810131627407157, + "loss": 0.0128, "step": 157230 }, { - "epoch": 1.7, - "learning_rate": 4.5021729259907895e-05, - "loss": 0.0082, + "epoch": 0.79, + "learning_rate": 0.00018100559504770168, + "loss": 0.0136, "step": 157240 }, { - "epoch": 1.7, - "learning_rate": 4.500551339430499e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.00018099802735468767, + "loss": 0.0148, "step": 157250 }, { - "epoch": 1.7, - "learning_rate": 4.498929752870208e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018099045966167365, + "loss": 0.0119, "step": 157260 }, { - "epoch": 1.7, - "learning_rate": 4.497308166309917e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018098289196865966, + "loss": 0.0152, "step": 157270 }, { - "epoch": 1.7, - "learning_rate": 4.495686579749627e-05, - "loss": 0.0086, + "epoch": 0.79, + "learning_rate": 0.00018097532427564564, + "loss": 0.0164, "step": 157280 }, { - "epoch": 1.7, - "learning_rate": 4.4940649931893365e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.00018096775658263162, + "loss": 0.0145, "step": 157290 }, { - "epoch": 1.7, - "learning_rate": 4.492443406629046e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.00018096018888961763, + "loss": 0.0142, "step": 157300 }, { - "epoch": 1.7, - "learning_rate": 4.490821820068755e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.0001809526211966036, + "loss": 0.0148, "step": 157310 }, { - "epoch": 1.7, - "learning_rate": 4.4892002335084643e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.0001809450535035896, + "loss": 0.012, "step": 157320 }, { - "epoch": 1.7, - "learning_rate": 4.4875786469481736e-05, - "loss": 0.0084, + "epoch": 0.79, + "learning_rate": 0.0001809374858105756, + "loss": 0.0153, "step": 157330 }, { - "epoch": 1.7, - "learning_rate": 4.4859570603878836e-05, - "loss": 0.0088, + "epoch": 0.79, + "learning_rate": 0.00018092991811756158, + "loss": 0.0122, "step": 157340 }, { - "epoch": 1.7, - "learning_rate": 4.484335473827593e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018092235042454756, + "loss": 0.0111, "step": 157350 }, { - "epoch": 1.7, - "learning_rate": 4.482713887267302e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018091478273153357, + "loss": 0.012, "step": 157360 }, { - "epoch": 1.7, - "learning_rate": 4.4810923007070114e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018090721503851955, + "loss": 0.0133, "step": 157370 }, { - "epoch": 1.7, - "learning_rate": 4.479470714146721e-05, - "loss": 0.0101, + "epoch": 0.79, + "learning_rate": 0.00018089964734550553, + "loss": 0.0125, "step": 157380 }, { - "epoch": 1.7, - "learning_rate": 4.4778491275864306e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018089207965249154, + "loss": 0.0117, "step": 157390 }, { - "epoch": 1.7, - "learning_rate": 4.47622754102614e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018088451195947752, + "loss": 0.0113, "step": 157400 }, { - "epoch": 1.7, - "learning_rate": 4.474605954465849e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.0001808769442664635, + "loss": 0.0109, "step": 157410 }, { - "epoch": 1.7, - "learning_rate": 4.4729843679055584e-05, - "loss": 0.0103, + "epoch": 0.79, + "learning_rate": 0.00018086937657344949, + "loss": 0.0105, "step": 157420 }, { - "epoch": 1.7, - "learning_rate": 4.471362781345268e-05, - "loss": 0.0052, + "epoch": 0.79, + "learning_rate": 0.0001808618088804355, + "loss": 0.0119, "step": 157430 }, { - "epoch": 1.7, - "learning_rate": 4.469741194784977e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018085424118742148, + "loss": 0.0085, "step": 157440 }, { - "epoch": 1.7, - "learning_rate": 4.468119608224687e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018084667349440746, + "loss": 0.0113, "step": 157450 }, { - "epoch": 1.7, - "learning_rate": 4.466498021664396e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018083910580139347, + "loss": 0.0113, "step": 157460 }, { - "epoch": 1.7, - "learning_rate": 4.4648764351041055e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018083153810837945, + "loss": 0.0138, "step": 157470 }, { - "epoch": 1.7, - "learning_rate": 4.463254848543815e-05, - "loss": 0.005, + "epoch": 0.79, + "learning_rate": 0.00018082397041536543, + "loss": 0.011, "step": 157480 }, { - "epoch": 1.7, - "learning_rate": 4.461633261983524e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.00018081640272235144, + "loss": 0.0103, "step": 157490 }, { - "epoch": 1.7, - "learning_rate": 4.460011675423234e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018080883502933742, + "loss": 0.0204, "step": 157500 }, { - "epoch": 1.7, - "learning_rate": 4.458390088862943e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.0001808012673363234, + "loss": 0.0136, "step": 157510 }, { - "epoch": 1.7, - "learning_rate": 4.4567685023026525e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.0001807936996433094, + "loss": 0.0155, "step": 157520 }, { - "epoch": 1.7, - "learning_rate": 4.455146915742362e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.0001807861319502954, + "loss": 0.0137, "step": 157530 }, { - "epoch": 1.7, - "learning_rate": 4.453525329182071e-05, - "loss": 0.0082, + "epoch": 0.79, + "learning_rate": 0.00018077856425728137, + "loss": 0.0102, "step": 157540 }, { - "epoch": 1.7, - "learning_rate": 4.451903742621781e-05, - "loss": 0.0079, + "epoch": 0.79, + "learning_rate": 0.00018077099656426738, + "loss": 0.012, "step": 157550 }, { - "epoch": 1.7, - "learning_rate": 4.45028215606149e-05, - "loss": 0.0046, + "epoch": 0.79, + "learning_rate": 0.00018076342887125336, + "loss": 0.0117, "step": 157560 }, { - "epoch": 1.7, - "learning_rate": 4.4486605695011996e-05, - "loss": 0.0089, + "epoch": 0.79, + "learning_rate": 0.00018075586117823934, + "loss": 0.0141, "step": 157570 }, { - "epoch": 1.7, - "learning_rate": 4.447038982940909e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00018074829348522532, + "loss": 0.0114, "step": 157580 }, { - "epoch": 1.7, - "learning_rate": 4.445417396380618e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.00018074072579221133, + "loss": 0.0129, "step": 157590 }, { - "epoch": 1.7, - "learning_rate": 4.4437958098203274e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00018073315809919731, + "loss": 0.0117, "step": 157600 }, { - "epoch": 1.7, - "learning_rate": 4.4421742232600374e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.0001807255904061833, + "loss": 0.0122, "step": 157610 }, { - "epoch": 1.7, - "learning_rate": 4.4405526366997466e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.0001807180227131693, + "loss": 0.0169, "step": 157620 }, { - "epoch": 1.7, - "learning_rate": 4.438931050139456e-05, - "loss": 0.0081, + "epoch": 0.8, + "learning_rate": 0.00018071045502015529, + "loss": 0.0116, "step": 157630 }, { - "epoch": 1.7, - "learning_rate": 4.437309463579165e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00018070288732714127, + "loss": 0.0102, "step": 157640 }, { - "epoch": 1.7, - "learning_rate": 4.4356878770188745e-05, - "loss": 0.009, + "epoch": 0.8, + "learning_rate": 0.00018069531963412728, + "loss": 0.0117, "step": 157650 }, { - "epoch": 1.7, - "learning_rate": 4.4340662904585844e-05, - "loss": 0.0053, + "epoch": 0.8, + "learning_rate": 0.00018068775194111326, + "loss": 0.0149, "step": 157660 }, { - "epoch": 1.7, - "learning_rate": 4.432444703898294e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00018068018424809924, + "loss": 0.0128, "step": 157670 }, { - "epoch": 1.7, - "learning_rate": 4.430823117338003e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00018067261655508525, + "loss": 0.0141, "step": 157680 }, { - "epoch": 1.7, - "learning_rate": 4.429201530777712e-05, - "loss": 0.0075, + "epoch": 0.8, + "learning_rate": 0.00018066504886207123, + "loss": 0.0116, "step": 157690 }, { - "epoch": 1.7, - "learning_rate": 4.4275799442174215e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.0001806574811690572, + "loss": 0.0113, "step": 157700 }, { - "epoch": 1.7, - "learning_rate": 4.4259583576571315e-05, - "loss": 0.0052, + "epoch": 0.8, + "learning_rate": 0.00018064991347604322, + "loss": 0.0129, "step": 157710 }, { - "epoch": 1.71, - "learning_rate": 4.424336771096841e-05, - "loss": 0.0053, + "epoch": 0.8, + "learning_rate": 0.0001806423457830292, + "loss": 0.0115, "step": 157720 }, { - "epoch": 1.71, - "learning_rate": 4.42271518453655e-05, - "loss": 0.0053, + "epoch": 0.8, + "learning_rate": 0.00018063477809001518, + "loss": 0.0133, "step": 157730 }, { - "epoch": 1.71, - "learning_rate": 4.421093597976259e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00018062721039700114, + "loss": 0.0121, "step": 157740 }, { - "epoch": 1.71, - "learning_rate": 4.4194720114159686e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00018061964270398714, + "loss": 0.0122, "step": 157750 }, { - "epoch": 1.71, - "learning_rate": 4.417850424855678e-05, - "loss": 0.0051, + "epoch": 0.8, + "learning_rate": 0.00018061207501097313, + "loss": 0.0114, "step": 157760 }, { - "epoch": 1.71, - "learning_rate": 4.416228838295388e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.0001806045073179591, + "loss": 0.0107, "step": 157770 }, { - "epoch": 1.71, - "learning_rate": 4.414607251735097e-05, - "loss": 0.0081, + "epoch": 0.8, + "learning_rate": 0.00018059693962494512, + "loss": 0.013, "step": 157780 }, { - "epoch": 1.71, - "learning_rate": 4.4129856651748063e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.0001805893719319311, + "loss": 0.0116, "step": 157790 }, { - "epoch": 1.71, - "learning_rate": 4.4113640786145156e-05, - "loss": 0.005, + "epoch": 0.8, + "learning_rate": 0.00018058180423891708, + "loss": 0.012, "step": 157800 }, { - "epoch": 1.71, - "learning_rate": 4.409742492054225e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00018057423654590306, + "loss": 0.0123, "step": 157810 }, { - "epoch": 1.71, - "learning_rate": 4.408120905493935e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00018056666885288907, + "loss": 0.0151, "step": 157820 }, { - "epoch": 1.71, - "learning_rate": 4.406499318933644e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00018055910115987505, + "loss": 0.0102, "step": 157830 }, { - "epoch": 1.71, - "learning_rate": 4.4048777323733534e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00018055153346686103, + "loss": 0.013, "step": 157840 }, { - "epoch": 1.71, - "learning_rate": 4.403256145813063e-05, - "loss": 0.0048, + "epoch": 0.8, + "learning_rate": 0.00018054396577384704, + "loss": 0.0131, "step": 157850 }, { - "epoch": 1.71, - "learning_rate": 4.401634559252772e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00018053639808083302, + "loss": 0.014, "step": 157860 }, { - "epoch": 1.71, - "learning_rate": 4.400012972692481e-05, - "loss": 0.0105, + "epoch": 0.8, + "learning_rate": 0.000180528830387819, + "loss": 0.0152, "step": 157870 }, { - "epoch": 1.71, - "learning_rate": 4.398391386132191e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.000180521262694805, + "loss": 0.012, "step": 157880 }, { - "epoch": 1.71, - "learning_rate": 4.396769799571901e-05, - "loss": 0.0086, + "epoch": 0.8, + "learning_rate": 0.000180513695001791, + "loss": 0.013, "step": 157890 }, { - "epoch": 1.71, - "learning_rate": 4.3951482130116104e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00018050612730877697, + "loss": 0.0118, "step": 157900 }, { - "epoch": 1.71, - "learning_rate": 4.39352662645132e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.00018049855961576298, + "loss": 0.0138, "step": 157910 }, { - "epoch": 1.71, - "learning_rate": 4.3919050398910296e-05, - "loss": 0.0075, + "epoch": 0.8, + "learning_rate": 0.00018049099192274896, + "loss": 0.0125, "step": 157920 }, { - "epoch": 1.71, - "learning_rate": 4.390283453330739e-05, - "loss": 0.0112, + "epoch": 0.8, + "learning_rate": 0.00018048342422973495, + "loss": 0.0118, "step": 157930 }, { - "epoch": 1.71, - "learning_rate": 4.388661866770448e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00018047585653672095, + "loss": 0.0112, "step": 157940 }, { - "epoch": 1.71, - "learning_rate": 4.3870402802101574e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00018046828884370694, + "loss": 0.0108, "step": 157950 }, { - "epoch": 1.71, - "learning_rate": 4.385418693649867e-05, - "loss": 0.0058, + "epoch": 0.8, + "learning_rate": 0.00018046072115069292, + "loss": 0.01, "step": 157960 }, { - "epoch": 1.71, - "learning_rate": 4.383797107089577e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.0001804531534576789, + "loss": 0.0122, "step": 157970 }, { - "epoch": 1.71, - "learning_rate": 4.382175520529286e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.0001804455857646649, + "loss": 0.0122, "step": 157980 }, { - "epoch": 1.71, - "learning_rate": 4.380553933968995e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.0001804380180716509, + "loss": 0.0087, "step": 157990 }, { - "epoch": 1.71, - "learning_rate": 4.3789323474087045e-05, - "loss": 0.0093, + "epoch": 0.8, + "learning_rate": 0.00018043045037863687, + "loss": 0.0117, "step": 158000 }, { - "epoch": 1.71, - "eval_cer": 0.921521722891336, - "eval_loss": 0.005824473220854998, - "eval_runtime": 121.2769, - "eval_samples_per_second": 16.491, - "eval_steps_per_second": 4.123, + "epoch": 0.8, + "eval_cer": 0.914447936792278, + "eval_loss": 0.008715854957699776, + "eval_runtime": 116.7633, + "eval_samples_per_second": 17.129, + "eval_steps_per_second": 4.282, "step": 158000 }, { - "epoch": 1.71, - "learning_rate": 4.377310760848414e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00018042288268562288, + "loss": 0.0173, "step": 158010 }, { - "epoch": 1.71, - "learning_rate": 4.375689174288123e-05, - "loss": 0.0083, + "epoch": 0.8, + "learning_rate": 0.00018041531499260886, + "loss": 0.0147, "step": 158020 }, { - "epoch": 1.71, - "learning_rate": 4.374067587727833e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.00018040774729959484, + "loss": 0.0137, "step": 158030 }, { - "epoch": 1.71, - "learning_rate": 4.372446001167542e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00018040017960658085, + "loss": 0.0125, "step": 158040 }, { - "epoch": 1.71, - "learning_rate": 4.3708244146072515e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.00018039261191356683, + "loss": 0.0133, "step": 158050 }, { - "epoch": 1.71, - "learning_rate": 4.369202828046961e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.0001803850442205528, + "loss": 0.0181, "step": 158060 }, { - "epoch": 1.71, - "learning_rate": 4.36758124148667e-05, - "loss": 0.0085, + "epoch": 0.8, + "learning_rate": 0.00018037747652753882, + "loss": 0.0132, "step": 158070 }, { - "epoch": 1.71, - "learning_rate": 4.36595965492638e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.0001803699088345248, + "loss": 0.0106, "step": 158080 }, { - "epoch": 1.71, - "learning_rate": 4.364338068366089e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00018036234114151078, + "loss": 0.011, "step": 158090 }, { - "epoch": 1.71, - "learning_rate": 4.3627164818057986e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.0001803547734484968, + "loss": 0.013, "step": 158100 }, { - "epoch": 1.71, - "learning_rate": 4.361094895245508e-05, - "loss": 0.0075, + "epoch": 0.8, + "learning_rate": 0.00018034720575548277, + "loss": 0.0116, "step": 158110 }, { - "epoch": 1.71, - "learning_rate": 4.359473308685217e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00018033963806246876, + "loss": 0.0122, "step": 158120 }, { - "epoch": 1.71, - "learning_rate": 4.357851722124927e-05, - "loss": 0.0088, + "epoch": 0.8, + "learning_rate": 0.00018033207036945476, + "loss": 0.0159, "step": 158130 }, { - "epoch": 1.71, - "learning_rate": 4.3562301355646364e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00018032450267644075, + "loss": 0.0092, "step": 158140 }, { - "epoch": 1.71, - "learning_rate": 4.3546085490043456e-05, - "loss": 0.0055, + "epoch": 0.8, + "learning_rate": 0.00018031693498342673, + "loss": 0.0128, "step": 158150 }, { - "epoch": 1.71, - "learning_rate": 4.352986962444055e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.0001803093672904127, + "loss": 0.0155, "step": 158160 }, { - "epoch": 1.71, - "learning_rate": 4.351365375883764e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00018030179959739872, + "loss": 0.0114, "step": 158170 }, { - "epoch": 1.71, - "learning_rate": 4.3497437893234735e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.0001802942319043847, + "loss": 0.0131, "step": 158180 }, { - "epoch": 1.71, - "learning_rate": 4.3481222027631834e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00018028666421137068, + "loss": 0.0101, "step": 158190 }, { - "epoch": 1.71, - "learning_rate": 4.346500616202893e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.0001802790965183567, + "loss": 0.0129, "step": 158200 }, { - "epoch": 1.71, - "learning_rate": 4.344879029642602e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00018027152882534267, + "loss": 0.0118, "step": 158210 }, { - "epoch": 1.71, - "learning_rate": 4.343257443082311e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00018026396113232865, + "loss": 0.0122, "step": 158220 }, { - "epoch": 1.71, - "learning_rate": 4.3416358565220205e-05, - "loss": 0.0093, + "epoch": 0.8, + "learning_rate": 0.00018025639343931466, + "loss": 0.0133, "step": 158230 }, { - "epoch": 1.71, - "learning_rate": 4.3400142699617305e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00018024882574630064, + "loss": 0.0115, "step": 158240 }, { - "epoch": 1.71, - "learning_rate": 4.33839268340144e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00018024125805328662, + "loss": 0.0151, "step": 158250 }, { - "epoch": 1.71, - "learning_rate": 4.336771096841149e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00018023369036027263, + "loss": 0.014, "step": 158260 }, { - "epoch": 1.71, - "learning_rate": 4.335149510280858e-05, - "loss": 0.0086, + "epoch": 0.8, + "learning_rate": 0.0001802261226672586, + "loss": 0.0101, "step": 158270 }, { - "epoch": 1.71, - "learning_rate": 4.3335279237205676e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.0001802185549742446, + "loss": 0.0135, "step": 158280 }, { - "epoch": 1.71, - "learning_rate": 4.3319063371602775e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.0001802109872812306, + "loss": 0.0105, "step": 158290 }, { - "epoch": 1.71, - "learning_rate": 4.330284750599987e-05, - "loss": 0.0092, + "epoch": 0.8, + "learning_rate": 0.00018020341958821658, + "loss": 0.0109, "step": 158300 }, { - "epoch": 1.71, - "learning_rate": 4.328663164039696e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00018019585189520257, + "loss": 0.013, "step": 158310 }, { - "epoch": 1.71, - "learning_rate": 4.327041577479405e-05, - "loss": 0.0085, + "epoch": 0.8, + "learning_rate": 0.00018018828420218855, + "loss": 0.0156, "step": 158320 }, { - "epoch": 1.71, - "learning_rate": 4.3254199909191146e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00018018071650917456, + "loss": 0.018, "step": 158330 }, { - "epoch": 1.71, - "learning_rate": 4.323798404358824e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00018017314881616054, + "loss": 0.0102, "step": 158340 }, { - "epoch": 1.71, - "learning_rate": 4.322176817798534e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.00018016558112314652, + "loss": 0.0142, "step": 158350 }, { - "epoch": 1.71, - "learning_rate": 4.320555231238243e-05, - "loss": 0.0058, + "epoch": 0.8, + "learning_rate": 0.00018015801343013253, + "loss": 0.0117, "step": 158360 }, { - "epoch": 1.71, - "learning_rate": 4.3189336446779524e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.0001801504457371185, + "loss": 0.012, "step": 158370 }, { - "epoch": 1.71, - "learning_rate": 4.3173120581176617e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.0001801428780441045, + "loss": 0.0158, "step": 158380 }, { - "epoch": 1.71, - "learning_rate": 4.315690471557371e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.0001801353103510905, + "loss": 0.0143, "step": 158390 }, { - "epoch": 1.71, - "learning_rate": 4.314068884997081e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00018012774265807648, + "loss": 0.013, "step": 158400 }, { - "epoch": 1.71, - "learning_rate": 4.31244729843679e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00018012017496506246, + "loss": 0.0131, "step": 158410 }, { - "epoch": 1.71, - "learning_rate": 4.3108257118764994e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00018011260727204847, + "loss": 0.0107, "step": 158420 }, { - "epoch": 1.71, - "learning_rate": 4.309204125316209e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.00018010503957903445, + "loss": 0.0126, "step": 158430 }, { - "epoch": 1.71, - "learning_rate": 4.307582538755918e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00018009747188602043, + "loss": 0.0111, "step": 158440 }, { - "epoch": 1.71, - "learning_rate": 4.305960952195627e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.00018008990419300644, + "loss": 0.0099, "step": 158450 }, { - "epoch": 1.71, - "learning_rate": 4.304339365635337e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00018008233649999242, + "loss": 0.0132, "step": 158460 }, { - "epoch": 1.71, - "learning_rate": 4.3027177790750465e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.0001800747688069784, + "loss": 0.0148, "step": 158470 }, { - "epoch": 1.71, - "learning_rate": 4.301096192514756e-05, - "loss": 0.0077, + "epoch": 0.8, + "learning_rate": 0.00018006720111396439, + "loss": 0.0158, "step": 158480 }, { - "epoch": 1.71, - "learning_rate": 4.299474605954465e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.0001800596334209504, + "loss": 0.0129, "step": 158490 }, { - "epoch": 1.71, - "learning_rate": 4.297853019394174e-05, - "loss": 0.0097, + "epoch": 0.8, + "learning_rate": 0.00018005206572793638, + "loss": 0.0093, "step": 158500 }, { - "epoch": 1.71, - "learning_rate": 4.296231432833884e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00018004449803492236, + "loss": 0.0131, "step": 158510 }, { - "epoch": 1.71, - "learning_rate": 4.2946098462735935e-05, - "loss": 0.0058, + "epoch": 0.8, + "learning_rate": 0.00018003693034190837, + "loss": 0.0118, "step": 158520 }, { - "epoch": 1.71, - "learning_rate": 4.292988259713303e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00018002936264889435, + "loss": 0.0135, "step": 158530 }, { - "epoch": 1.71, - "learning_rate": 4.291366673153012e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00018002179495588033, + "loss": 0.0108, "step": 158540 }, { - "epoch": 1.71, - "learning_rate": 4.2897450865927214e-05, - "loss": 0.0084, + "epoch": 0.8, + "learning_rate": 0.00018001422726286634, + "loss": 0.0139, "step": 158550 }, { - "epoch": 1.71, - "learning_rate": 4.288123500032431e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00018000665956985232, + "loss": 0.0124, "step": 158560 }, { - "epoch": 1.71, - "learning_rate": 4.2865019134721406e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.0001799990918768383, + "loss": 0.0103, "step": 158570 }, { - "epoch": 1.71, - "learning_rate": 4.28488032691185e-05, - "loss": 0.0055, + "epoch": 0.8, + "learning_rate": 0.0001799915241838243, + "loss": 0.0095, "step": 158580 }, { - "epoch": 1.71, - "learning_rate": 4.283258740351559e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.0001799839564908103, + "loss": 0.0132, "step": 158590 }, { - "epoch": 1.71, - "learning_rate": 4.2816371537912684e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00017997638879779627, + "loss": 0.0116, "step": 158600 }, { - "epoch": 1.71, - "learning_rate": 4.280015567230979e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00017996882110478228, + "loss": 0.013, "step": 158610 }, { - "epoch": 1.71, - "learning_rate": 4.278393980670688e-05, - "loss": 0.0083, + "epoch": 0.8, + "learning_rate": 0.00017996125341176826, + "loss": 0.015, "step": 158620 }, { - "epoch": 1.71, - "learning_rate": 4.2767723941103976e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00017995368571875424, + "loss": 0.0121, "step": 158630 }, { - "epoch": 1.71, - "learning_rate": 4.275150807550107e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00017994611802574025, + "loss": 0.0111, "step": 158640 }, { - "epoch": 1.72, - "learning_rate": 4.273529220989816e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00017993855033272623, + "loss": 0.013, "step": 158650 }, { - "epoch": 1.72, - "learning_rate": 4.271907634429526e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00017993098263971221, + "loss": 0.0107, "step": 158660 }, { - "epoch": 1.72, - "learning_rate": 4.2702860478692354e-05, - "loss": 0.0052, + "epoch": 0.8, + "learning_rate": 0.0001799234149466982, + "loss": 0.0101, "step": 158670 }, { - "epoch": 1.72, - "learning_rate": 4.2686644613089446e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.0001799158472536842, + "loss": 0.0116, "step": 158680 }, { - "epoch": 1.72, - "learning_rate": 4.267042874748654e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00017990827956067019, + "loss": 0.0124, "step": 158690 }, { - "epoch": 1.72, - "learning_rate": 4.265421288188363e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00017990071186765617, + "loss": 0.0127, "step": 158700 }, { - "epoch": 1.72, - "learning_rate": 4.263799701628073e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00017989314417464218, + "loss": 0.0143, "step": 158710 }, { - "epoch": 1.72, - "learning_rate": 4.2621781150677824e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00017988557648162816, + "loss": 0.0103, "step": 158720 }, { - "epoch": 1.72, - "learning_rate": 4.260556528507492e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00017987800878861414, + "loss": 0.0103, "step": 158730 }, { - "epoch": 1.72, - "learning_rate": 4.258934941947201e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00017987044109560015, + "loss": 0.0143, "step": 158740 }, { - "epoch": 1.72, - "learning_rate": 4.25731335538691e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00017986287340258613, + "loss": 0.0149, "step": 158750 }, { - "epoch": 1.72, - "learning_rate": 4.2556917688266195e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.0001798553057095721, + "loss": 0.0141, "step": 158760 }, { - "epoch": 1.72, - "learning_rate": 4.2540701822663295e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00017984773801655812, + "loss": 0.0097, "step": 158770 }, { - "epoch": 1.72, - "learning_rate": 4.252448595706039e-05, - "loss": 0.0101, + "epoch": 0.8, + "learning_rate": 0.0001798401703235441, + "loss": 0.0136, "step": 158780 }, { - "epoch": 1.72, - "learning_rate": 4.250827009145748e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00017983260263053008, + "loss": 0.0129, "step": 158790 }, { - "epoch": 1.72, - "learning_rate": 4.249205422585457e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.0001798250349375161, + "loss": 0.0104, "step": 158800 }, { - "epoch": 1.72, - "learning_rate": 4.2475838360251666e-05, - "loss": 0.0089, + "epoch": 0.8, + "learning_rate": 0.00017981746724450207, + "loss": 0.0119, "step": 158810 }, { - "epoch": 1.72, - "learning_rate": 4.2459622494648765e-05, - "loss": 0.0095, + "epoch": 0.8, + "learning_rate": 0.00017980989955148805, + "loss": 0.0171, "step": 158820 }, { - "epoch": 1.72, - "learning_rate": 4.244340662904586e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00017980233185847403, + "loss": 0.0094, "step": 158830 }, { - "epoch": 1.72, - "learning_rate": 4.242719076344295e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00017979476416546004, + "loss": 0.0098, "step": 158840 }, { - "epoch": 1.72, - "learning_rate": 4.241097489784004e-05, - "loss": 0.0058, + "epoch": 0.8, + "learning_rate": 0.00017978719647244602, + "loss": 0.014, "step": 158850 }, { - "epoch": 1.72, - "learning_rate": 4.2394759032237136e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.000179779628779432, + "loss": 0.012, "step": 158860 }, { - "epoch": 1.72, - "learning_rate": 4.2378543166634236e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00017977206108641801, + "loss": 0.0127, "step": 158870 }, { - "epoch": 1.72, - "learning_rate": 4.236232730103133e-05, - "loss": 0.0085, + "epoch": 0.8, + "learning_rate": 0.000179764493393404, + "loss": 0.0169, "step": 158880 }, { - "epoch": 1.72, - "learning_rate": 4.234611143542842e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00017975692570038998, + "loss": 0.0093, "step": 158890 }, { - "epoch": 1.72, - "learning_rate": 4.2329895569825514e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00017974935800737599, + "loss": 0.0186, "step": 158900 }, { - "epoch": 1.72, - "learning_rate": 4.2313679704222607e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00017974179031436197, + "loss": 0.013, "step": 158910 }, { - "epoch": 1.72, - "learning_rate": 4.22974638386197e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00017973422262134795, + "loss": 0.0127, "step": 158920 }, { - "epoch": 1.72, - "learning_rate": 4.22812479730168e-05, - "loss": 0.0086, + "epoch": 0.8, + "learning_rate": 0.00017972665492833396, + "loss": 0.0131, "step": 158930 }, { - "epoch": 1.72, - "learning_rate": 4.226503210741389e-05, - "loss": 0.0078, + "epoch": 0.8, + "learning_rate": 0.00017971908723531994, + "loss": 0.013, "step": 158940 }, { - "epoch": 1.72, - "learning_rate": 4.2248816241810984e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00017971151954230592, + "loss": 0.0113, "step": 158950 }, { - "epoch": 1.72, - "learning_rate": 4.223260037620808e-05, - "loss": 0.0058, + "epoch": 0.8, + "learning_rate": 0.00017970395184929193, + "loss": 0.0098, "step": 158960 }, { - "epoch": 1.72, - "learning_rate": 4.221638451060517e-05, - "loss": 0.0098, + "epoch": 0.8, + "learning_rate": 0.0001796963841562779, + "loss": 0.0105, "step": 158970 }, { - "epoch": 1.72, - "learning_rate": 4.220016864500227e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.0001796888164632639, + "loss": 0.0108, "step": 158980 }, { - "epoch": 1.72, - "learning_rate": 4.218395277939936e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00017968124877024987, + "loss": 0.0124, "step": 158990 }, { - "epoch": 1.72, - "learning_rate": 4.2167736913796455e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00017967368107723585, + "loss": 0.012, "step": 159000 }, { - "epoch": 1.72, - "eval_cer": 0.9215208542883797, - "eval_loss": 0.005773806478828192, - "eval_runtime": 121.1921, - "eval_samples_per_second": 16.503, - "eval_steps_per_second": 4.126, + "epoch": 0.8, + "eval_cer": 0.9144945158062973, + "eval_loss": 0.00861455500125885, + "eval_runtime": 116.6046, + "eval_samples_per_second": 17.152, + "eval_steps_per_second": 4.288, "step": 159000 }, { - "epoch": 1.72, - "learning_rate": 4.215152104819355e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00017966611338422184, + "loss": 0.0116, "step": 159010 }, { - "epoch": 1.72, - "learning_rate": 4.213530518259064e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00017965854569120782, + "loss": 0.0118, "step": 159020 }, { - "epoch": 1.72, - "learning_rate": 4.211908931698773e-05, - "loss": 0.0086, + "epoch": 0.8, + "learning_rate": 0.00017965097799819383, + "loss": 0.0135, "step": 159030 }, { - "epoch": 1.72, - "learning_rate": 4.210287345138483e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.0001796434103051798, + "loss": 0.011, "step": 159040 }, { - "epoch": 1.72, - "learning_rate": 4.2086657585781925e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.0001796358426121658, + "loss": 0.0123, "step": 159050 }, { - "epoch": 1.72, - "learning_rate": 4.207044172017902e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00017962827491915177, + "loss": 0.0132, "step": 159060 }, { - "epoch": 1.72, - "learning_rate": 4.205422585457611e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00017962070722613778, + "loss": 0.0123, "step": 159070 }, { - "epoch": 1.72, - "learning_rate": 4.2038009988973204e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00017961313953312376, + "loss": 0.0127, "step": 159080 }, { - "epoch": 1.72, - "learning_rate": 4.20217941233703e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00017960557184010974, + "loss": 0.0141, "step": 159090 }, { - "epoch": 1.72, - "learning_rate": 4.2005578257767396e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00017959800414709575, + "loss": 0.0123, "step": 159100 }, { - "epoch": 1.72, - "learning_rate": 4.198936239216449e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.00017959043645408173, + "loss": 0.0098, "step": 159110 }, { - "epoch": 1.72, - "learning_rate": 4.197314652656158e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.0001795828687610677, + "loss": 0.0104, "step": 159120 }, { - "epoch": 1.72, - "learning_rate": 4.1956930660958674e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00017957530106805372, + "loss": 0.0117, "step": 159130 }, { - "epoch": 1.72, - "learning_rate": 4.1940714795355774e-05, - "loss": 0.0092, + "epoch": 0.8, + "learning_rate": 0.0001795677333750397, + "loss": 0.012, "step": 159140 }, { - "epoch": 1.72, - "learning_rate": 4.1924498929752866e-05, - "loss": 0.0096, + "epoch": 0.8, + "learning_rate": 0.00017956016568202568, + "loss": 0.0123, "step": 159150 }, { - "epoch": 1.72, - "learning_rate": 4.190828306414996e-05, - "loss": 0.0055, + "epoch": 0.8, + "learning_rate": 0.0001795525979890117, + "loss": 0.0127, "step": 159160 }, { - "epoch": 1.72, - "learning_rate": 4.189206719854705e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00017954503029599767, + "loss": 0.0131, "step": 159170 }, { - "epoch": 1.72, - "learning_rate": 4.1875851332944144e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00017953746260298366, + "loss": 0.0109, "step": 159180 }, { - "epoch": 1.72, - "learning_rate": 4.185963546734124e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00017952989490996966, + "loss": 0.0125, "step": 159190 }, { - "epoch": 1.72, - "learning_rate": 4.184341960173834e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00017952232721695565, + "loss": 0.0111, "step": 159200 }, { - "epoch": 1.72, - "learning_rate": 4.182720373613543e-05, - "loss": 0.0088, + "epoch": 0.8, + "learning_rate": 0.00017951475952394163, + "loss": 0.0191, "step": 159210 }, { - "epoch": 1.72, - "learning_rate": 4.181098787053252e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.0001795071918309276, + "loss": 0.0091, "step": 159220 }, { - "epoch": 1.72, - "learning_rate": 4.1794772004929615e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00017949962413791362, + "loss": 0.0133, "step": 159230 }, { - "epoch": 1.72, - "learning_rate": 4.177855613932671e-05, - "loss": 0.0077, + "epoch": 0.8, + "learning_rate": 0.0001794920564448996, + "loss": 0.0126, "step": 159240 }, { - "epoch": 1.72, - "learning_rate": 4.176234027372381e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00017948448875188558, + "loss": 0.012, "step": 159250 }, { - "epoch": 1.72, - "learning_rate": 4.17461244081209e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.0001794769210588716, + "loss": 0.0124, "step": 159260 }, { - "epoch": 1.72, - "learning_rate": 4.172990854251799e-05, - "loss": 0.0087, + "epoch": 0.8, + "learning_rate": 0.00017946935336585757, + "loss": 0.0115, "step": 159270 }, { - "epoch": 1.72, - "learning_rate": 4.1713692676915085e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00017946178567284355, + "loss": 0.0193, "step": 159280 }, { - "epoch": 1.72, - "learning_rate": 4.169747681131218e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00017945421797982956, + "loss": 0.0141, "step": 159290 }, { - "epoch": 1.72, - "learning_rate": 4.168126094570928e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00017944665028681554, + "loss": 0.0113, "step": 159300 }, { - "epoch": 1.72, - "learning_rate": 4.166504508010637e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00017943908259380152, + "loss": 0.0142, "step": 159310 }, { - "epoch": 1.72, - "learning_rate": 4.164882921450346e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00017943151490078753, + "loss": 0.0114, "step": 159320 }, { - "epoch": 1.72, - "learning_rate": 4.163261334890056e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.0001794239472077735, + "loss": 0.0111, "step": 159330 }, { - "epoch": 1.72, - "learning_rate": 4.1616397483297655e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.0001794163795147595, + "loss": 0.02, "step": 159340 }, { - "epoch": 1.72, - "learning_rate": 4.1600181617694755e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.0001794088118217455, + "loss": 0.0143, "step": 159350 }, { - "epoch": 1.72, - "learning_rate": 4.158396575209185e-05, - "loss": 0.0093, + "epoch": 0.8, + "learning_rate": 0.00017940124412873148, + "loss": 0.0158, "step": 159360 }, { - "epoch": 1.72, - "learning_rate": 4.156774988648894e-05, - "loss": 0.0083, + "epoch": 0.8, + "learning_rate": 0.00017939367643571747, + "loss": 0.0125, "step": 159370 }, { - "epoch": 1.72, - "learning_rate": 4.155153402088603e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00017938610874270345, + "loss": 0.0116, "step": 159380 }, { - "epoch": 1.72, - "learning_rate": 4.1535318155283126e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00017937854104968946, + "loss": 0.0107, "step": 159390 }, { - "epoch": 1.72, - "learning_rate": 4.1519102289680226e-05, - "loss": 0.009, + "epoch": 0.8, + "learning_rate": 0.00017937097335667544, + "loss": 0.0139, "step": 159400 }, { - "epoch": 1.72, - "learning_rate": 4.150288642407732e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00017936340566366142, + "loss": 0.0131, "step": 159410 }, { - "epoch": 1.72, - "learning_rate": 4.148667055847441e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00017935583797064743, + "loss": 0.0109, "step": 159420 }, { - "epoch": 1.72, - "learning_rate": 4.1470454692871504e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.0001793482702776334, + "loss": 0.014, "step": 159430 }, { - "epoch": 1.72, - "learning_rate": 4.1454238827268596e-05, - "loss": 0.0108, + "epoch": 0.8, + "learning_rate": 0.0001793407025846194, + "loss": 0.011, "step": 159440 }, { - "epoch": 1.72, - "learning_rate": 4.1438022961665696e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.0001793331348916054, + "loss": 0.0121, "step": 159450 }, { - "epoch": 1.72, - "learning_rate": 4.142180709606279e-05, - "loss": 0.005, + "epoch": 0.8, + "learning_rate": 0.00017932556719859138, + "loss": 0.0132, "step": 159460 }, { - "epoch": 1.72, - "learning_rate": 4.140559123045988e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.00017931799950557736, + "loss": 0.0112, "step": 159470 }, { - "epoch": 1.72, - "learning_rate": 4.1389375364856974e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00017931043181256337, + "loss": 0.0158, "step": 159480 }, { - "epoch": 1.72, - "learning_rate": 4.137315949925407e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00017930286411954935, + "loss": 0.0108, "step": 159490 }, { - "epoch": 1.72, - "learning_rate": 4.135694363365116e-05, - "loss": 0.0051, + "epoch": 0.8, + "learning_rate": 0.00017929529642653533, + "loss": 0.0115, "step": 159500 }, { - "epoch": 1.72, - "learning_rate": 4.134072776804826e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00017928772873352134, + "loss": 0.013, "step": 159510 }, { - "epoch": 1.72, - "learning_rate": 4.132451190244535e-05, + "epoch": 0.8, + "learning_rate": 0.00017928016104050732, "loss": 0.0108, "step": 159520 }, { - "epoch": 1.72, - "learning_rate": 4.1308296036842445e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.0001792725933474933, + "loss": 0.0116, "step": 159530 }, { - "epoch": 1.72, - "learning_rate": 4.129208017123954e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.0001792650256544793, + "loss": 0.0105, "step": 159540 }, { - "epoch": 1.72, - "learning_rate": 4.127586430563663e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.0001792574579614653, + "loss": 0.0127, "step": 159550 }, { - "epoch": 1.72, - "learning_rate": 4.125964844003373e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00017924989026845128, + "loss": 0.0139, "step": 159560 }, { - "epoch": 1.73, - "learning_rate": 4.124343257443082e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017924232257543726, + "loss": 0.011, "step": 159570 }, { - "epoch": 1.73, - "learning_rate": 4.1227216708827915e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017923475488242327, + "loss": 0.0143, "step": 159580 }, { - "epoch": 1.73, - "learning_rate": 4.121100084322501e-05, - "loss": 0.0086, + "epoch": 0.81, + "learning_rate": 0.00017922718718940925, + "loss": 0.0109, "step": 159590 }, { - "epoch": 1.73, - "learning_rate": 4.11947849776221e-05, - "loss": 0.0056, + "epoch": 0.81, + "learning_rate": 0.00017921961949639523, + "loss": 0.0108, "step": 159600 }, { - "epoch": 1.73, - "learning_rate": 4.11785691120192e-05, - "loss": 0.0054, + "epoch": 0.81, + "learning_rate": 0.00017921205180338124, + "loss": 0.0119, "step": 159610 }, { - "epoch": 1.73, - "learning_rate": 4.116235324641629e-05, - "loss": 0.008, + "epoch": 0.81, + "learning_rate": 0.00017920448411036722, + "loss": 0.0187, "step": 159620 }, { - "epoch": 1.73, - "learning_rate": 4.1146137380813386e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.0001791969164173532, + "loss": 0.0142, "step": 159630 }, { - "epoch": 1.73, - "learning_rate": 4.112992151521048e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.0001791893487243392, + "loss": 0.0135, "step": 159640 }, { - "epoch": 1.73, - "learning_rate": 4.111370564960757e-05, - "loss": 0.0048, + "epoch": 0.81, + "learning_rate": 0.0001791817810313252, + "loss": 0.015, "step": 159650 }, { - "epoch": 1.73, - "learning_rate": 4.1097489784004664e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.00017917421333831117, + "loss": 0.0122, "step": 159660 }, { - "epoch": 1.73, - "learning_rate": 4.1081273918401763e-05, - "loss": 0.0073, + "epoch": 0.81, + "learning_rate": 0.00017916664564529718, + "loss": 0.0115, "step": 159670 }, { - "epoch": 1.73, - "learning_rate": 4.1065058052798856e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.00017915907795228316, + "loss": 0.0106, "step": 159680 }, { - "epoch": 1.73, - "learning_rate": 4.104884218719595e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.00017915151025926914, + "loss": 0.0127, "step": 159690 }, { - "epoch": 1.73, - "learning_rate": 4.103262632159304e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017914394256625515, + "loss": 0.0124, "step": 159700 }, { - "epoch": 1.73, - "learning_rate": 4.1016410455990134e-05, - "loss": 0.0091, + "epoch": 0.81, + "learning_rate": 0.00017913637487324113, + "loss": 0.0161, "step": 159710 }, { - "epoch": 1.73, - "learning_rate": 4.1000194590387234e-05, - "loss": 0.0066, + "epoch": 0.81, + "learning_rate": 0.00017912880718022711, + "loss": 0.0138, "step": 159720 }, { - "epoch": 1.73, - "learning_rate": 4.098397872478433e-05, - "loss": 0.0114, + "epoch": 0.81, + "learning_rate": 0.0001791212394872131, + "loss": 0.0105, "step": 159730 }, { - "epoch": 1.73, - "learning_rate": 4.096776285918142e-05, - "loss": 0.009, + "epoch": 0.81, + "learning_rate": 0.0001791136717941991, + "loss": 0.0097, "step": 159740 }, { - "epoch": 1.73, - "learning_rate": 4.095154699357851e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017910610410118509, + "loss": 0.0126, "step": 159750 }, { - "epoch": 1.73, - "learning_rate": 4.0935331127975605e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017909853640817107, + "loss": 0.0131, "step": 159760 }, { - "epoch": 1.73, - "learning_rate": 4.09191152623727e-05, - "loss": 0.0056, + "epoch": 0.81, + "learning_rate": 0.00017909096871515708, + "loss": 0.0107, "step": 159770 }, { - "epoch": 1.73, - "learning_rate": 4.09028993967698e-05, - "loss": 0.0054, + "epoch": 0.81, + "learning_rate": 0.00017908340102214306, + "loss": 0.0111, "step": 159780 }, { - "epoch": 1.73, - "learning_rate": 4.088668353116689e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.00017907583332912904, + "loss": 0.0144, "step": 159790 }, { - "epoch": 1.73, - "learning_rate": 4.087046766556398e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017906826563611505, + "loss": 0.0123, "step": 159800 }, { - "epoch": 1.73, - "learning_rate": 4.0854251799961075e-05, - "loss": 0.0052, + "epoch": 0.81, + "learning_rate": 0.00017906069794310103, + "loss": 0.0135, "step": 159810 }, { - "epoch": 1.73, - "learning_rate": 4.083803593435817e-05, - "loss": 0.005, + "epoch": 0.81, + "learning_rate": 0.000179053130250087, + "loss": 0.0127, "step": 159820 }, { - "epoch": 1.73, - "learning_rate": 4.082182006875527e-05, - "loss": 0.0081, + "epoch": 0.81, + "learning_rate": 0.00017904556255707302, + "loss": 0.0131, "step": 159830 }, { - "epoch": 1.73, - "learning_rate": 4.080560420315236e-05, - "loss": 0.0101, + "epoch": 0.81, + "learning_rate": 0.000179037994864059, + "loss": 0.0153, "step": 159840 }, { - "epoch": 1.73, - "learning_rate": 4.078938833754945e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017903042717104498, + "loss": 0.0109, "step": 159850 }, { - "epoch": 1.73, - "learning_rate": 4.0773172471946546e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.000179022859478031, + "loss": 0.0116, "step": 159860 }, { - "epoch": 1.73, - "learning_rate": 4.075695660634364e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017901529178501697, + "loss": 0.0124, "step": 159870 }, { - "epoch": 1.73, - "learning_rate": 4.074074074074074e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017900772409200295, + "loss": 0.0109, "step": 159880 }, { - "epoch": 1.73, - "learning_rate": 4.072452487513783e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017900015639898893, + "loss": 0.0117, "step": 159890 }, { - "epoch": 1.73, - "learning_rate": 4.0708309009534924e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017899258870597494, + "loss": 0.0133, "step": 159900 }, { - "epoch": 1.73, - "learning_rate": 4.0692093143932016e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.00017898502101296092, + "loss": 0.0131, "step": 159910 }, { - "epoch": 1.73, - "learning_rate": 4.067587727832911e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.0001789774533199469, + "loss": 0.0113, "step": 159920 }, { - "epoch": 1.73, - "learning_rate": 4.06596614127262e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017896988562693291, + "loss": 0.0105, "step": 159930 }, { - "epoch": 1.73, - "learning_rate": 4.06434455471233e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.0001789623179339189, + "loss": 0.0135, "step": 159940 }, { - "epoch": 1.73, - "learning_rate": 4.0627229681520394e-05, - "loss": 0.0089, + "epoch": 0.81, + "learning_rate": 0.00017895475024090488, + "loss": 0.0128, "step": 159950 }, { - "epoch": 1.73, - "learning_rate": 4.061101381591749e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017894718254789089, + "loss": 0.0129, "step": 159960 }, { - "epoch": 1.73, - "learning_rate": 4.059479795031458e-05, - "loss": 0.0081, + "epoch": 0.81, + "learning_rate": 0.00017893961485487687, + "loss": 0.0184, "step": 159970 }, { - "epoch": 1.73, - "learning_rate": 4.057858208471167e-05, - "loss": 0.0089, + "epoch": 0.81, + "learning_rate": 0.00017893204716186285, + "loss": 0.0144, "step": 159980 }, { - "epoch": 1.73, - "learning_rate": 4.056236621910877e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017892447946884886, + "loss": 0.0096, "step": 159990 }, { - "epoch": 1.73, - "learning_rate": 4.0546150353505865e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017891691177583484, + "loss": 0.0133, "step": 160000 }, { - "epoch": 1.73, - "eval_cer": 0.9215156426706413, - "eval_loss": 0.005892171058803797, - "eval_runtime": 121.1891, - "eval_samples_per_second": 16.503, - "eval_steps_per_second": 4.126, + "epoch": 0.81, + "eval_cer": 0.9144867526372941, + "eval_loss": 0.008828338235616684, + "eval_runtime": 116.6369, + "eval_samples_per_second": 17.147, + "eval_steps_per_second": 4.287, "step": 160000 }, { - "epoch": 1.73, - "learning_rate": 4.052993448790296e-05, - "loss": 0.0083, + "epoch": 0.81, + "learning_rate": 0.00017890934408282082, + "loss": 0.0108, "step": 160010 }, { - "epoch": 1.73, - "learning_rate": 4.051371862230005e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.00017890177638980683, + "loss": 0.013, "step": 160020 }, { - "epoch": 1.73, - "learning_rate": 4.049750275669714e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.0001788942086967928, + "loss": 0.0134, "step": 160030 }, { - "epoch": 1.73, - "learning_rate": 4.0481286891094236e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.0001788866410037788, + "loss": 0.0124, "step": 160040 }, { - "epoch": 1.73, - "learning_rate": 4.046507102549134e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.0001788790733107648, + "loss": 0.0117, "step": 160050 }, { - "epoch": 1.73, - "learning_rate": 4.0448855159888435e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017887150561775078, + "loss": 0.0132, "step": 160060 }, { - "epoch": 1.73, - "learning_rate": 4.043263929428553e-05, - "loss": 0.0087, + "epoch": 0.81, + "learning_rate": 0.00017886393792473676, + "loss": 0.0121, "step": 160070 }, { - "epoch": 1.73, - "learning_rate": 4.041642342868262e-05, - "loss": 0.0112, + "epoch": 0.81, + "learning_rate": 0.00017885637023172274, + "loss": 0.0138, "step": 160080 }, { - "epoch": 1.73, - "learning_rate": 4.040020756307972e-05, - "loss": 0.0078, + "epoch": 0.81, + "learning_rate": 0.00017884880253870875, + "loss": 0.0117, "step": 160090 }, { - "epoch": 1.73, - "learning_rate": 4.038399169747681e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017884123484569473, + "loss": 0.0116, "step": 160100 }, { - "epoch": 1.73, - "learning_rate": 4.0367775831873905e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017883366715268072, + "loss": 0.0141, "step": 160110 }, { - "epoch": 1.73, - "learning_rate": 4.0351559966271e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017882609945966672, + "loss": 0.0142, "step": 160120 }, { - "epoch": 1.73, - "learning_rate": 4.033534410066809e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.0001788185317666527, + "loss": 0.0164, "step": 160130 }, { - "epoch": 1.73, - "learning_rate": 4.031912823506519e-05, - "loss": 0.0053, + "epoch": 0.81, + "learning_rate": 0.0001788109640736387, + "loss": 0.0105, "step": 160140 }, { - "epoch": 1.73, - "learning_rate": 4.030291236946228e-05, - "loss": 0.0093, + "epoch": 0.81, + "learning_rate": 0.0001788033963806247, + "loss": 0.0151, "step": 160150 }, { - "epoch": 1.73, - "learning_rate": 4.0286696503859376e-05, - "loss": 0.0088, + "epoch": 0.81, + "learning_rate": 0.00017879582868761068, + "loss": 0.0183, "step": 160160 }, { - "epoch": 1.73, - "learning_rate": 4.027048063825647e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.00017878826099459666, + "loss": 0.0106, "step": 160170 }, { - "epoch": 1.73, - "learning_rate": 4.025426477265356e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017878069330158267, + "loss": 0.0155, "step": 160180 }, { - "epoch": 1.73, - "learning_rate": 4.023804890705066e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017877312560856865, + "loss": 0.0123, "step": 160190 }, { - "epoch": 1.73, - "learning_rate": 4.0221833041447753e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.00017876555791555463, + "loss": 0.0141, "step": 160200 }, { - "epoch": 1.73, - "learning_rate": 4.0205617175844846e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.00017875799022254064, + "loss": 0.0124, "step": 160210 }, { - "epoch": 1.73, - "learning_rate": 4.018940131024194e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.00017875042252952662, + "loss": 0.0151, "step": 160220 }, { - "epoch": 1.73, - "learning_rate": 4.017318544463903e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.0001787428548365126, + "loss": 0.0108, "step": 160230 }, { - "epoch": 1.73, - "learning_rate": 4.0156969579036124e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017873528714349858, + "loss": 0.0112, "step": 160240 }, { - "epoch": 1.73, - "learning_rate": 4.0140753713433224e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.0001787277194504846, + "loss": 0.0133, "step": 160250 }, { - "epoch": 1.73, - "learning_rate": 4.012453784783032e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.00017872015175747055, + "loss": 0.0109, "step": 160260 }, { - "epoch": 1.73, - "learning_rate": 4.010832198222741e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017871258406445653, + "loss": 0.013, "step": 160270 }, { - "epoch": 1.73, - "learning_rate": 4.00921061166245e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.0001787050163714425, + "loss": 0.0102, "step": 160280 }, { - "epoch": 1.73, - "learning_rate": 4.0075890251021595e-05, - "loss": 0.0085, + "epoch": 0.81, + "learning_rate": 0.00017869744867842852, + "loss": 0.0133, "step": 160290 }, { - "epoch": 1.73, - "learning_rate": 4.0059674385418694e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.0001786898809854145, + "loss": 0.0137, "step": 160300 }, { - "epoch": 1.73, - "learning_rate": 4.004345851981579e-05, - "loss": 0.0102, + "epoch": 0.81, + "learning_rate": 0.00017868231329240048, + "loss": 0.0132, "step": 160310 }, { - "epoch": 1.73, - "learning_rate": 4.002724265421288e-05, - "loss": 0.0066, + "epoch": 0.81, + "learning_rate": 0.0001786747455993865, + "loss": 0.013, "step": 160320 }, { - "epoch": 1.73, - "learning_rate": 4.001102678860997e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017866717790637247, + "loss": 0.0109, "step": 160330 }, { - "epoch": 1.73, - "learning_rate": 3.9994810923007065e-05, - "loss": 0.0056, + "epoch": 0.81, + "learning_rate": 0.00017865961021335845, + "loss": 0.0129, "step": 160340 }, { - "epoch": 1.73, - "learning_rate": 3.997859505740416e-05, - "loss": 0.0083, + "epoch": 0.81, + "learning_rate": 0.00017865204252034446, + "loss": 0.0106, "step": 160350 }, { - "epoch": 1.73, - "learning_rate": 3.996237919180126e-05, - "loss": 0.0056, + "epoch": 0.81, + "learning_rate": 0.00017864447482733044, + "loss": 0.0135, "step": 160360 }, { - "epoch": 1.73, - "learning_rate": 3.994616332619835e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017863690713431642, + "loss": 0.0097, "step": 160370 }, { - "epoch": 1.73, - "learning_rate": 3.992994746059544e-05, - "loss": 0.0086, + "epoch": 0.81, + "learning_rate": 0.00017862933944130243, + "loss": 0.0139, "step": 160380 }, { - "epoch": 1.73, - "learning_rate": 3.9913731594992536e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.0001786217717482884, + "loss": 0.0092, "step": 160390 }, { - "epoch": 1.73, - "learning_rate": 3.989751572938963e-05, - "loss": 0.0066, + "epoch": 0.81, + "learning_rate": 0.0001786142040552744, + "loss": 0.0143, "step": 160400 }, { - "epoch": 1.73, - "learning_rate": 3.988129986378673e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.0001786066363622604, + "loss": 0.0108, "step": 160410 }, { - "epoch": 1.73, - "learning_rate": 3.986508399818382e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017859906866924638, + "loss": 0.0146, "step": 160420 }, { - "epoch": 1.73, - "learning_rate": 3.9848868132580914e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017859150097623237, + "loss": 0.0118, "step": 160430 }, { - "epoch": 1.73, - "learning_rate": 3.9832652266978006e-05, - "loss": 0.0106, + "epoch": 0.81, + "learning_rate": 0.00017858393328321837, + "loss": 0.0136, "step": 160440 }, { - "epoch": 1.73, - "learning_rate": 3.98164364013751e-05, - "loss": 0.0099, + "epoch": 0.81, + "learning_rate": 0.00017857636559020436, + "loss": 0.0121, "step": 160450 }, { - "epoch": 1.73, - "learning_rate": 3.98002205357722e-05, - "loss": 0.0051, + "epoch": 0.81, + "learning_rate": 0.00017856879789719034, + "loss": 0.0147, "step": 160460 }, { - "epoch": 1.73, - "learning_rate": 3.978400467016929e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017856123020417632, + "loss": 0.0117, "step": 160470 }, { - "epoch": 1.73, - "learning_rate": 3.9767788804566384e-05, - "loss": 0.0073, + "epoch": 0.81, + "learning_rate": 0.00017855366251116233, + "loss": 0.0129, "step": 160480 }, { - "epoch": 1.73, - "learning_rate": 3.975157293896348e-05, - "loss": 0.0066, + "epoch": 0.81, + "learning_rate": 0.0001785460948181483, + "loss": 0.0139, "step": 160490 }, { - "epoch": 1.74, - "learning_rate": 3.973535707336057e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.0001785385271251343, + "loss": 0.0111, "step": 160500 }, { - "epoch": 1.74, - "learning_rate": 3.971914120775766e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.0001785309594321203, + "loss": 0.013, "step": 160510 }, { - "epoch": 1.74, - "learning_rate": 3.970292534215476e-05, - "loss": 0.0056, + "epoch": 0.81, + "learning_rate": 0.00017852339173910628, + "loss": 0.0109, "step": 160520 }, { - "epoch": 1.74, - "learning_rate": 3.9686709476551855e-05, - "loss": 0.0097, + "epoch": 0.81, + "learning_rate": 0.00017851582404609226, + "loss": 0.0127, "step": 160530 }, { - "epoch": 1.74, - "learning_rate": 3.967049361094895e-05, - "loss": 0.0054, + "epoch": 0.81, + "learning_rate": 0.00017850825635307827, + "loss": 0.0139, "step": 160540 }, { - "epoch": 1.74, - "learning_rate": 3.965427774534604e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.00017850068866006425, + "loss": 0.0095, "step": 160550 }, { - "epoch": 1.74, - "learning_rate": 3.963806187974313e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017849312096705023, + "loss": 0.0111, "step": 160560 }, { - "epoch": 1.74, - "learning_rate": 3.962184601414023e-05, - "loss": 0.0051, + "epoch": 0.81, + "learning_rate": 0.00017848555327403624, + "loss": 0.0126, "step": 160570 }, { - "epoch": 1.74, - "learning_rate": 3.9605630148537325e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017847798558102222, + "loss": 0.0107, "step": 160580 }, { - "epoch": 1.74, - "learning_rate": 3.958941428293442e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.0001784704178880082, + "loss": 0.0107, "step": 160590 }, { - "epoch": 1.74, - "learning_rate": 3.957319841733151e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.0001784628501949942, + "loss": 0.0111, "step": 160600 }, { - "epoch": 1.74, - "learning_rate": 3.95569825517286e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.0001784552825019802, + "loss": 0.0118, "step": 160610 }, { - "epoch": 1.74, - "learning_rate": 3.9540766686125696e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017844771480896618, + "loss": 0.0118, "step": 160620 }, { - "epoch": 1.74, - "learning_rate": 3.9524550820522796e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017844014711595216, + "loss": 0.0115, "step": 160630 }, { - "epoch": 1.74, - "learning_rate": 3.950833495491989e-05, - "loss": 0.0081, + "epoch": 0.81, + "learning_rate": 0.00017843257942293817, + "loss": 0.01, "step": 160640 }, { - "epoch": 1.74, - "learning_rate": 3.949211908931698e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017842501172992415, + "loss": 0.0114, "step": 160650 }, { - "epoch": 1.74, - "learning_rate": 3.9475903223714074e-05, - "loss": 0.0086, + "epoch": 0.81, + "learning_rate": 0.00017841744403691013, + "loss": 0.0137, "step": 160660 }, { - "epoch": 1.74, - "learning_rate": 3.9459687358111167e-05, - "loss": 0.0085, + "epoch": 0.81, + "learning_rate": 0.00017840987634389614, + "loss": 0.0107, "step": 160670 }, { - "epoch": 1.74, - "learning_rate": 3.9443471492508266e-05, - "loss": 0.0054, + "epoch": 0.81, + "learning_rate": 0.00017840230865088212, + "loss": 0.01, "step": 160680 }, { - "epoch": 1.74, - "learning_rate": 3.942725562690536e-05, - "loss": 0.0095, + "epoch": 0.81, + "learning_rate": 0.0001783947409578681, + "loss": 0.0131, "step": 160690 }, { - "epoch": 1.74, - "learning_rate": 3.941103976130245e-05, - "loss": 0.0081, + "epoch": 0.81, + "learning_rate": 0.0001783871732648541, + "loss": 0.0122, "step": 160700 }, { - "epoch": 1.74, - "learning_rate": 3.9394823895699544e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.0001783796055718401, + "loss": 0.0114, "step": 160710 }, { - "epoch": 1.74, - "learning_rate": 3.937860803009664e-05, - "loss": 0.008, + "epoch": 0.81, + "learning_rate": 0.00017837203787882607, + "loss": 0.0138, "step": 160720 }, { - "epoch": 1.74, - "learning_rate": 3.9362392164493737e-05, - "loss": 0.0078, + "epoch": 0.81, + "learning_rate": 0.00017836447018581208, + "loss": 0.0136, "step": 160730 }, { - "epoch": 1.74, - "learning_rate": 3.934617629889083e-05, - "loss": 0.0046, + "epoch": 0.81, + "learning_rate": 0.00017835690249279806, + "loss": 0.0107, "step": 160740 }, { - "epoch": 1.74, - "learning_rate": 3.932996043328792e-05, - "loss": 0.0046, + "epoch": 0.81, + "learning_rate": 0.00017834933479978404, + "loss": 0.0095, "step": 160750 }, { - "epoch": 1.74, - "learning_rate": 3.9313744567685015e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017834176710677005, + "loss": 0.0146, "step": 160760 }, { - "epoch": 1.74, - "learning_rate": 3.929752870208212e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.00017833419941375603, + "loss": 0.0109, "step": 160770 }, { - "epoch": 1.74, - "learning_rate": 3.9281312836479214e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017832663172074201, + "loss": 0.0089, "step": 160780 }, { - "epoch": 1.74, - "learning_rate": 3.9265096970876307e-05, - "loss": 0.0052, + "epoch": 0.81, + "learning_rate": 0.000178319064027728, + "loss": 0.013, "step": 160790 }, { - "epoch": 1.74, - "learning_rate": 3.92488811052734e-05, - "loss": 0.0087, + "epoch": 0.81, + "learning_rate": 0.000178311496334714, + "loss": 0.0118, "step": 160800 }, { - "epoch": 1.74, - "learning_rate": 3.923266523967049e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.00017830392864169999, + "loss": 0.0137, "step": 160810 }, { - "epoch": 1.74, - "learning_rate": 3.9216449374067585e-05, - "loss": 0.0039, + "epoch": 0.81, + "learning_rate": 0.00017829636094868597, + "loss": 0.0128, "step": 160820 }, { - "epoch": 1.74, - "learning_rate": 3.9200233508464684e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017828879325567198, + "loss": 0.0109, "step": 160830 }, { - "epoch": 1.74, - "learning_rate": 3.918401764286178e-05, - "loss": 0.0086, + "epoch": 0.81, + "learning_rate": 0.00017828122556265796, + "loss": 0.0167, "step": 160840 }, { - "epoch": 1.74, - "learning_rate": 3.916780177725887e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017827365786964394, + "loss": 0.0137, "step": 160850 }, { - "epoch": 1.74, - "learning_rate": 3.915158591165596e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.00017826609017662995, + "loss": 0.0107, "step": 160860 }, { - "epoch": 1.74, - "learning_rate": 3.9135370046053055e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017825852248361593, + "loss": 0.0119, "step": 160870 }, { - "epoch": 1.74, - "learning_rate": 3.9119154180450155e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.0001782509547906019, + "loss": 0.0135, "step": 160880 }, { - "epoch": 1.74, - "learning_rate": 3.910293831484725e-05, - "loss": 0.0052, + "epoch": 0.81, + "learning_rate": 0.00017824338709758792, + "loss": 0.0102, "step": 160890 }, { - "epoch": 1.74, - "learning_rate": 3.908672244924434e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.0001782358194045739, + "loss": 0.0138, "step": 160900 }, { - "epoch": 1.74, - "learning_rate": 3.907050658364143e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.00017822825171155988, + "loss": 0.0143, "step": 160910 }, { - "epoch": 1.74, - "learning_rate": 3.9054290718038526e-05, - "loss": 0.0094, + "epoch": 0.81, + "learning_rate": 0.0001782206840185459, + "loss": 0.0113, "step": 160920 }, { - "epoch": 1.74, - "learning_rate": 3.903807485243562e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017821311632553187, + "loss": 0.0144, "step": 160930 }, { - "epoch": 1.74, - "learning_rate": 3.902185898683272e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017820554863251785, + "loss": 0.0107, "step": 160940 }, { - "epoch": 1.74, - "learning_rate": 3.900564312122981e-05, - "loss": 0.0066, + "epoch": 0.81, + "learning_rate": 0.00017819798093950383, + "loss": 0.0136, "step": 160950 }, { - "epoch": 1.74, - "learning_rate": 3.8989427255626904e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017819041324648984, + "loss": 0.0118, "step": 160960 }, { - "epoch": 1.74, - "learning_rate": 3.8973211390023996e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017818284555347582, + "loss": 0.0134, "step": 160970 }, { - "epoch": 1.74, - "learning_rate": 3.895699552442109e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.0001781752778604618, + "loss": 0.013, "step": 160980 }, { - "epoch": 1.74, - "learning_rate": 3.894077965881819e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.00017816771016744781, + "loss": 0.0126, "step": 160990 }, { - "epoch": 1.74, - "learning_rate": 3.892456379321528e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.0001781601424744338, + "loss": 0.0127, "step": 161000 }, { - "epoch": 1.74, - "eval_cer": 0.9215034822292522, - "eval_loss": 0.0055848234333097935, - "eval_runtime": 121.2713, - "eval_samples_per_second": 16.492, - "eval_steps_per_second": 4.123, + "epoch": 0.81, + "eval_cer": 0.9144789894682909, + "eval_loss": 0.008487106300890446, + "eval_runtime": 116.5295, + "eval_samples_per_second": 17.163, + "eval_steps_per_second": 4.291, "step": 161000 }, { - "epoch": 1.74, - "learning_rate": 3.8908347927612374e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017815257478141978, + "loss": 0.013, "step": 161010 }, { - "epoch": 1.74, - "learning_rate": 3.889213206200947e-05, - "loss": 0.0066, + "epoch": 0.81, + "learning_rate": 0.00017814500708840579, + "loss": 0.0154, "step": 161020 }, { - "epoch": 1.74, - "learning_rate": 3.887591619640656e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017813743939539177, + "loss": 0.0145, "step": 161030 }, { - "epoch": 1.74, - "learning_rate": 3.885970033080366e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.00017812987170237775, + "loss": 0.0103, "step": 161040 }, { - "epoch": 1.74, - "learning_rate": 3.884348446520075e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017812230400936376, + "loss": 0.0117, "step": 161050 }, { - "epoch": 1.74, - "learning_rate": 3.8827268599597845e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017811473631634974, + "loss": 0.0102, "step": 161060 }, { - "epoch": 1.74, - "learning_rate": 3.881105273399494e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017810716862333572, + "loss": 0.0116, "step": 161070 }, { - "epoch": 1.74, - "learning_rate": 3.879483686839203e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017809960093032173, + "loss": 0.0136, "step": 161080 }, { - "epoch": 1.74, - "learning_rate": 3.877862100278912e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.0001780920332373077, + "loss": 0.0112, "step": 161090 }, { - "epoch": 1.74, - "learning_rate": 3.876240513718622e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.0001780844655442937, + "loss": 0.0114, "step": 161100 }, { - "epoch": 1.74, - "learning_rate": 3.8746189271583315e-05, - "loss": 0.0102, + "epoch": 0.81, + "learning_rate": 0.0001780768978512797, + "loss": 0.013, "step": 161110 }, { - "epoch": 1.74, - "learning_rate": 3.872997340598041e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017806933015826568, + "loss": 0.012, "step": 161120 }, { - "epoch": 1.74, - "learning_rate": 3.87137575403775e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017806176246525166, + "loss": 0.0091, "step": 161130 }, { - "epoch": 1.74, - "learning_rate": 3.869754167477459e-05, - "loss": 0.0073, + "epoch": 0.81, + "learning_rate": 0.00017805419477223764, + "loss": 0.0154, "step": 161140 }, { - "epoch": 1.74, - "learning_rate": 3.868132580917169e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017804662707922365, + "loss": 0.0104, "step": 161150 }, { - "epoch": 1.74, - "learning_rate": 3.8665109943568786e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017803905938620963, + "loss": 0.0115, "step": 161160 }, { - "epoch": 1.74, - "learning_rate": 3.864889407796588e-05, - "loss": 0.0053, + "epoch": 0.81, + "learning_rate": 0.00017803149169319562, + "loss": 0.0114, "step": 161170 }, { - "epoch": 1.74, - "learning_rate": 3.863267821236297e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017802392400018162, + "loss": 0.0143, "step": 161180 }, { - "epoch": 1.74, - "learning_rate": 3.8616462346760064e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.0001780163563071676, + "loss": 0.0102, "step": 161190 }, { - "epoch": 1.74, - "learning_rate": 3.860024648115716e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.0001780087886141536, + "loss": 0.0117, "step": 161200 }, { - "epoch": 1.74, - "learning_rate": 3.8584030615554256e-05, - "loss": 0.0066, + "epoch": 0.81, + "learning_rate": 0.0001780012209211396, + "loss": 0.0116, "step": 161210 }, { - "epoch": 1.74, - "learning_rate": 3.856781474995135e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.00017799365322812558, + "loss": 0.0114, "step": 161220 }, { - "epoch": 1.74, - "learning_rate": 3.855159888434844e-05, - "loss": 0.0078, + "epoch": 0.81, + "learning_rate": 0.00017798608553511156, + "loss": 0.0126, "step": 161230 }, { - "epoch": 1.74, - "learning_rate": 3.8535383018745534e-05, - "loss": 0.005, + "epoch": 0.81, + "learning_rate": 0.00017797851784209757, + "loss": 0.013, "step": 161240 }, { - "epoch": 1.74, - "learning_rate": 3.851916715314263e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017797095014908355, + "loss": 0.0143, "step": 161250 }, { - "epoch": 1.74, - "learning_rate": 3.8502951287539727e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017796338245606953, + "loss": 0.0134, "step": 161260 }, { - "epoch": 1.74, - "learning_rate": 3.848673542193682e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017795581476305554, + "loss": 0.0098, "step": 161270 }, { - "epoch": 1.74, - "learning_rate": 3.847051955633391e-05, - "loss": 0.0086, + "epoch": 0.81, + "learning_rate": 0.00017794824707004152, + "loss": 0.0118, "step": 161280 }, { - "epoch": 1.74, - "learning_rate": 3.8454303690731005e-05, - "loss": 0.0066, + "epoch": 0.81, + "learning_rate": 0.0001779406793770275, + "loss": 0.0133, "step": 161290 }, { - "epoch": 1.74, - "learning_rate": 3.84380878251281e-05, - "loss": 0.0052, + "epoch": 0.81, + "learning_rate": 0.00017793311168401348, + "loss": 0.0139, "step": 161300 }, { - "epoch": 1.74, - "learning_rate": 3.84218719595252e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.0001779255439909995, + "loss": 0.0132, "step": 161310 }, { - "epoch": 1.74, - "learning_rate": 3.840565609392229e-05, - "loss": 0.005, + "epoch": 0.81, + "learning_rate": 0.00017791797629798547, + "loss": 0.0124, "step": 161320 }, { - "epoch": 1.74, - "learning_rate": 3.838944022831938e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017791040860497145, + "loss": 0.0137, "step": 161330 }, { - "epoch": 1.74, - "learning_rate": 3.8373224362716475e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.00017790284091195746, + "loss": 0.0127, "step": 161340 }, { - "epoch": 1.74, - "learning_rate": 3.835700849711357e-05, - "loss": 0.0052, + "epoch": 0.81, + "learning_rate": 0.00017789527321894344, + "loss": 0.0129, "step": 161350 }, { - "epoch": 1.74, - "learning_rate": 3.834079263151066e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017788770552592943, + "loss": 0.0149, "step": 161360 }, { - "epoch": 1.74, - "learning_rate": 3.832457676590776e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.00017788013783291543, + "loss": 0.0113, "step": 161370 }, { - "epoch": 1.74, - "learning_rate": 3.830836090030485e-05, - "loss": 0.008, + "epoch": 0.81, + "learning_rate": 0.00017787257013990142, + "loss": 0.0116, "step": 161380 }, { - "epoch": 1.74, - "learning_rate": 3.8292145034701946e-05, - "loss": 0.0048, + "epoch": 0.81, + "learning_rate": 0.0001778650024468874, + "loss": 0.0111, "step": 161390 }, { - "epoch": 1.74, - "learning_rate": 3.827592916909904e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.0001778574347538734, + "loss": 0.0127, "step": 161400 }, { - "epoch": 1.74, - "learning_rate": 3.825971330349613e-05, - "loss": 0.0049, + "epoch": 0.81, + "learning_rate": 0.0001778498670608594, + "loss": 0.0114, "step": 161410 }, { - "epoch": 1.75, - "learning_rate": 3.824349743789323e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017784229936784537, + "loss": 0.0104, "step": 161420 }, { - "epoch": 1.75, - "learning_rate": 3.8227281572290323e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017783473167483138, + "loss": 0.014, "step": 161430 }, { - "epoch": 1.75, - "learning_rate": 3.8211065706687416e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017782716398181736, + "loss": 0.0135, "step": 161440 }, { - "epoch": 1.75, - "learning_rate": 3.819484984108451e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017781959628880334, + "loss": 0.0104, "step": 161450 }, { - "epoch": 1.75, - "learning_rate": 3.81786339754816e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017781202859578932, + "loss": 0.0124, "step": 161460 }, { - "epoch": 1.75, - "learning_rate": 3.81624181098787e-05, - "loss": 0.0053, + "epoch": 0.81, + "learning_rate": 0.00017780446090277533, + "loss": 0.0107, "step": 161470 }, { - "epoch": 1.75, - "learning_rate": 3.8146202244275794e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.0001777968932097613, + "loss": 0.0119, "step": 161480 }, { - "epoch": 1.75, - "learning_rate": 3.8129986378672893e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.0001777893255167473, + "loss": 0.0158, "step": 161490 }, { - "epoch": 1.75, - "learning_rate": 3.8113770513069986e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.0001777817578237333, + "loss": 0.0112, "step": 161500 }, { - "epoch": 1.75, - "learning_rate": 3.809755464746708e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017777419013071926, + "loss": 0.012, "step": 161510 }, { - "epoch": 1.75, - "learning_rate": 3.808133878186418e-05, - "loss": 0.0081, + "epoch": 0.81, + "learning_rate": 0.00017776662243770524, + "loss": 0.0122, "step": 161520 }, { - "epoch": 1.75, - "learning_rate": 3.806512291626127e-05, - "loss": 0.0054, + "epoch": 0.81, + "learning_rate": 0.00017775905474469122, + "loss": 0.0116, "step": 161530 }, { - "epoch": 1.75, - "learning_rate": 3.8048907050658364e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017775148705167723, + "loss": 0.0106, "step": 161540 }, { - "epoch": 1.75, - "learning_rate": 3.803269118505546e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.0001777439193586632, + "loss": 0.0106, "step": 161550 }, { - "epoch": 1.75, - "learning_rate": 3.801647531945255e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.0001777363516656492, + "loss": 0.0102, "step": 161560 }, { - "epoch": 1.75, - "learning_rate": 3.800025945384965e-05, - "loss": 0.0082, + "epoch": 0.82, + "learning_rate": 0.0001777287839726352, + "loss": 0.0144, "step": 161570 }, { - "epoch": 1.75, - "learning_rate": 3.798404358824674e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017772121627962118, + "loss": 0.014, "step": 161580 }, { - "epoch": 1.75, - "learning_rate": 3.7967827722643834e-05, - "loss": 0.0057, + "epoch": 0.82, + "learning_rate": 0.00017771364858660716, + "loss": 0.0132, "step": 161590 }, { - "epoch": 1.75, - "learning_rate": 3.795161185704093e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017770608089359317, + "loss": 0.0104, "step": 161600 }, { - "epoch": 1.75, - "learning_rate": 3.793539599143802e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017769851320057915, + "loss": 0.0104, "step": 161610 }, { - "epoch": 1.75, - "learning_rate": 3.791918012583512e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017769094550756513, + "loss": 0.0104, "step": 161620 }, { - "epoch": 1.75, - "learning_rate": 3.790296426023221e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017768337781455114, + "loss": 0.0127, "step": 161630 }, { - "epoch": 1.75, - "learning_rate": 3.7886748394629305e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017767581012153712, + "loss": 0.0128, "step": 161640 }, { - "epoch": 1.75, - "learning_rate": 3.78705325290264e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.0001776682424285231, + "loss": 0.0155, "step": 161650 }, { - "epoch": 1.75, - "learning_rate": 3.785431666342349e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.0001776606747355091, + "loss": 0.0119, "step": 161660 }, { - "epoch": 1.75, - "learning_rate": 3.783810079782058e-05, - "loss": 0.0077, + "epoch": 0.82, + "learning_rate": 0.0001776531070424951, + "loss": 0.0106, "step": 161670 }, { - "epoch": 1.75, - "learning_rate": 3.782188493221768e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017764553934948108, + "loss": 0.0149, "step": 161680 }, { - "epoch": 1.75, - "learning_rate": 3.7805669066614775e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017763797165646706, + "loss": 0.0144, "step": 161690 }, { - "epoch": 1.75, - "learning_rate": 3.778945320101187e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017763040396345307, + "loss": 0.0103, "step": 161700 }, { - "epoch": 1.75, - "learning_rate": 3.777323733540896e-05, - "loss": 0.0119, + "epoch": 0.82, + "learning_rate": 0.00017762283627043905, + "loss": 0.0131, "step": 161710 }, { - "epoch": 1.75, - "learning_rate": 3.7757021469806054e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017761526857742503, + "loss": 0.0096, "step": 161720 }, { - "epoch": 1.75, - "learning_rate": 3.774080560420315e-05, - "loss": 0.0055, + "epoch": 0.82, + "learning_rate": 0.00017760770088441104, + "loss": 0.011, "step": 161730 }, { - "epoch": 1.75, - "learning_rate": 3.7724589738600246e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017760013319139702, + "loss": 0.0119, "step": 161740 }, { - "epoch": 1.75, - "learning_rate": 3.770837387299734e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.000177592565498383, + "loss": 0.0118, "step": 161750 }, { - "epoch": 1.75, - "learning_rate": 3.769215800739443e-05, - "loss": 0.0056, + "epoch": 0.82, + "learning_rate": 0.000177584997805369, + "loss": 0.0106, "step": 161760 }, { - "epoch": 1.75, - "learning_rate": 3.7675942141791524e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.000177577430112355, + "loss": 0.0101, "step": 161770 }, { - "epoch": 1.75, - "learning_rate": 3.7659726276188624e-05, - "loss": 0.0053, + "epoch": 0.82, + "learning_rate": 0.00017756986241934097, + "loss": 0.0228, "step": 161780 }, { - "epoch": 1.75, - "learning_rate": 3.7643510410585716e-05, - "loss": 0.0048, + "epoch": 0.82, + "learning_rate": 0.00017756229472632698, + "loss": 0.0153, "step": 161790 }, { - "epoch": 1.75, - "learning_rate": 3.762729454498281e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017755472703331296, + "loss": 0.0118, "step": 161800 }, { - "epoch": 1.75, - "learning_rate": 3.76110786793799e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017754715934029894, + "loss": 0.013, "step": 161810 }, { - "epoch": 1.75, - "learning_rate": 3.7594862813776995e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017753959164728495, + "loss": 0.0125, "step": 161820 }, { - "epoch": 1.75, - "learning_rate": 3.757864694817409e-05, - "loss": 0.0084, + "epoch": 0.82, + "learning_rate": 0.00017753202395427093, + "loss": 0.0141, "step": 161830 }, { - "epoch": 1.75, - "learning_rate": 3.756243108257119e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017752445626125691, + "loss": 0.0116, "step": 161840 }, { - "epoch": 1.75, - "learning_rate": 3.754621521696828e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.0001775168885682429, + "loss": 0.0099, "step": 161850 }, { - "epoch": 1.75, - "learning_rate": 3.752999935136537e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.0001775093208752289, + "loss": 0.0132, "step": 161860 }, { - "epoch": 1.75, - "learning_rate": 3.7513783485762465e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017750175318221489, + "loss": 0.0111, "step": 161870 }, { - "epoch": 1.75, - "learning_rate": 3.749756762015956e-05, - "loss": 0.0089, + "epoch": 0.82, + "learning_rate": 0.00017749418548920087, + "loss": 0.0105, "step": 161880 }, { - "epoch": 1.75, - "learning_rate": 3.748135175455666e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017748661779618688, + "loss": 0.0139, "step": 161890 }, { - "epoch": 1.75, - "learning_rate": 3.746513588895375e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017747905010317286, + "loss": 0.0133, "step": 161900 }, { - "epoch": 1.75, - "learning_rate": 3.744892002335084e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017747148241015884, + "loss": 0.0111, "step": 161910 }, { - "epoch": 1.75, - "learning_rate": 3.7432704157747936e-05, - "loss": 0.0055, + "epoch": 0.82, + "learning_rate": 0.00017746391471714485, + "loss": 0.0119, "step": 161920 }, { - "epoch": 1.75, - "learning_rate": 3.741648829214503e-05, - "loss": 0.0054, + "epoch": 0.82, + "learning_rate": 0.00017745634702413083, + "loss": 0.0188, "step": 161930 }, { - "epoch": 1.75, - "learning_rate": 3.740027242654212e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.0001774487793311168, + "loss": 0.0113, "step": 161940 }, { - "epoch": 1.75, - "learning_rate": 3.738405656093922e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017744121163810282, + "loss": 0.0133, "step": 161950 }, { - "epoch": 1.75, - "learning_rate": 3.7367840695336313e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.0001774336439450888, + "loss": 0.0144, "step": 161960 }, { - "epoch": 1.75, - "learning_rate": 3.7351624829733406e-05, - "loss": 0.0102, + "epoch": 0.82, + "learning_rate": 0.00017742607625207478, + "loss": 0.0112, "step": 161970 }, { - "epoch": 1.75, - "learning_rate": 3.73354089641305e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.0001774185085590608, + "loss": 0.0123, "step": 161980 }, { - "epoch": 1.75, - "learning_rate": 3.731919309852759e-05, - "loss": 0.0078, + "epoch": 0.82, + "learning_rate": 0.00017741094086604677, + "loss": 0.0088, "step": 161990 }, { - "epoch": 1.75, - "learning_rate": 3.730297723292469e-05, - "loss": 0.0105, + "epoch": 0.82, + "learning_rate": 0.00017740337317303275, + "loss": 0.0211, "step": 162000 }, { - "epoch": 1.75, - "eval_cer": 0.9215130368617722, - "eval_loss": 0.005664716940373182, - "eval_runtime": 121.2783, - "eval_samples_per_second": 16.491, - "eval_steps_per_second": 4.123, + "epoch": 0.82, + "eval_cer": 0.9144663743186606, + "eval_loss": 0.008896621875464916, + "eval_runtime": 115.9502, + "eval_samples_per_second": 17.249, + "eval_steps_per_second": 4.312, "step": 162000 }, { - "epoch": 1.75, - "learning_rate": 3.7286761367321784e-05, - "loss": 0.0052, + "epoch": 0.82, + "learning_rate": 0.00017739580548001876, + "loss": 0.0128, "step": 162010 }, { - "epoch": 1.75, - "learning_rate": 3.727054550171888e-05, - "loss": 0.0084, + "epoch": 0.82, + "learning_rate": 0.00017738823778700474, + "loss": 0.0124, "step": 162020 }, { - "epoch": 1.75, - "learning_rate": 3.7254329636115976e-05, - "loss": 0.0055, + "epoch": 0.82, + "learning_rate": 0.00017738067009399072, + "loss": 0.0148, "step": 162030 }, { - "epoch": 1.75, - "learning_rate": 3.723811377051307e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.0001773731024009767, + "loss": 0.0181, "step": 162040 }, { - "epoch": 1.75, - "learning_rate": 3.722189790491016e-05, - "loss": 0.0044, + "epoch": 0.82, + "learning_rate": 0.00017736553470796271, + "loss": 0.012, "step": 162050 }, { - "epoch": 1.75, - "learning_rate": 3.7205682039307254e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.0001773579670149487, + "loss": 0.0131, "step": 162060 }, { - "epoch": 1.75, - "learning_rate": 3.7189466173704354e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017735039932193468, + "loss": 0.0103, "step": 162070 }, { - "epoch": 1.75, - "learning_rate": 3.717325030810145e-05, - "loss": 0.0112, + "epoch": 0.82, + "learning_rate": 0.00017734283162892069, + "loss": 0.0133, "step": 162080 }, { - "epoch": 1.75, - "learning_rate": 3.715703444249854e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017733526393590667, + "loss": 0.0112, "step": 162090 }, { - "epoch": 1.75, - "learning_rate": 3.714081857689563e-05, - "loss": 0.0088, + "epoch": 0.82, + "learning_rate": 0.00017732769624289265, + "loss": 0.0136, "step": 162100 }, { - "epoch": 1.75, - "learning_rate": 3.7124602711292725e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017732012854987866, + "loss": 0.0141, "step": 162110 }, { - "epoch": 1.75, - "learning_rate": 3.710838684568982e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017731256085686464, + "loss": 0.0125, "step": 162120 }, { - "epoch": 1.75, - "learning_rate": 3.709217098008692e-05, - "loss": 0.0079, + "epoch": 0.82, + "learning_rate": 0.00017730499316385062, + "loss": 0.0113, "step": 162130 }, { - "epoch": 1.75, - "learning_rate": 3.707595511448401e-05, - "loss": 0.0078, + "epoch": 0.82, + "learning_rate": 0.00017729742547083663, + "loss": 0.0113, "step": 162140 }, { - "epoch": 1.75, - "learning_rate": 3.70597392488811e-05, - "loss": 0.0077, + "epoch": 0.82, + "learning_rate": 0.0001772898577778226, + "loss": 0.0118, "step": 162150 }, { - "epoch": 1.75, - "learning_rate": 3.7043523383278195e-05, - "loss": 0.0048, + "epoch": 0.82, + "learning_rate": 0.0001772822900848086, + "loss": 0.0096, "step": 162160 }, { - "epoch": 1.75, - "learning_rate": 3.702730751767529e-05, - "loss": 0.0054, + "epoch": 0.82, + "learning_rate": 0.0001772747223917946, + "loss": 0.0131, "step": 162170 }, { - "epoch": 1.75, - "learning_rate": 3.701109165207239e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.00017726715469878058, + "loss": 0.0102, "step": 162180 }, { - "epoch": 1.75, - "learning_rate": 3.699487578646948e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017725958700576656, + "loss": 0.013, "step": 162190 }, { - "epoch": 1.75, - "learning_rate": 3.697865992086657e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017725201931275255, + "loss": 0.0102, "step": 162200 }, { - "epoch": 1.75, - "learning_rate": 3.6962444055263666e-05, - "loss": 0.0089, + "epoch": 0.82, + "learning_rate": 0.00017724445161973855, + "loss": 0.0093, "step": 162210 }, { - "epoch": 1.75, - "learning_rate": 3.694622818966076e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017723688392672454, + "loss": 0.0157, "step": 162220 }, { - "epoch": 1.75, - "learning_rate": 3.693001232405785e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017722931623371052, + "loss": 0.0124, "step": 162230 }, { - "epoch": 1.75, - "learning_rate": 3.691379645845495e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017722174854069653, + "loss": 0.0108, "step": 162240 }, { - "epoch": 1.75, - "learning_rate": 3.6897580592852044e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.0001772141808476825, + "loss": 0.0122, "step": 162250 }, { - "epoch": 1.75, - "learning_rate": 3.6881364727249136e-05, - "loss": 0.0053, + "epoch": 0.82, + "learning_rate": 0.0001772066131546685, + "loss": 0.0154, "step": 162260 }, { - "epoch": 1.75, - "learning_rate": 3.686514886164623e-05, - "loss": 0.0081, + "epoch": 0.82, + "learning_rate": 0.0001771990454616545, + "loss": 0.0118, "step": 162270 }, { - "epoch": 1.75, - "learning_rate": 3.684893299604332e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017719147776864048, + "loss": 0.0111, "step": 162280 }, { - "epoch": 1.75, - "learning_rate": 3.683271713044042e-05, - "loss": 0.0049, + "epoch": 0.82, + "learning_rate": 0.00017718391007562646, + "loss": 0.0093, "step": 162290 }, { - "epoch": 1.75, - "learning_rate": 3.6816501264837514e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.00017717634238261247, + "loss": 0.0132, "step": 162300 }, { - "epoch": 1.75, - "learning_rate": 3.680028539923461e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017716877468959845, + "loss": 0.0119, "step": 162310 }, { - "epoch": 1.75, - "learning_rate": 3.67840695336317e-05, - "loss": 0.0092, + "epoch": 0.82, + "learning_rate": 0.00017716120699658443, + "loss": 0.0105, "step": 162320 }, { - "epoch": 1.75, - "learning_rate": 3.676785366802879e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.00017715363930357044, + "loss": 0.0126, "step": 162330 }, { - "epoch": 1.75, - "learning_rate": 3.675163780242589e-05, - "loss": 0.0078, + "epoch": 0.82, + "learning_rate": 0.00017714607161055642, + "loss": 0.0177, "step": 162340 }, { - "epoch": 1.76, - "learning_rate": 3.6735421936822985e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.0001771385039175424, + "loss": 0.0147, "step": 162350 }, { - "epoch": 1.76, - "learning_rate": 3.671920607122008e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017713093622452838, + "loss": 0.0197, "step": 162360 }, { - "epoch": 1.76, - "learning_rate": 3.670299020561717e-05, - "loss": 0.0055, + "epoch": 0.82, + "learning_rate": 0.0001771233685315144, + "loss": 0.0111, "step": 162370 }, { - "epoch": 1.76, - "learning_rate": 3.668677434001426e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017711580083850037, + "loss": 0.0146, "step": 162380 }, { - "epoch": 1.76, - "learning_rate": 3.667055847441136e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017710823314548636, + "loss": 0.0105, "step": 162390 }, { - "epoch": 1.76, - "learning_rate": 3.6654342608808455e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017710066545247236, + "loss": 0.0119, "step": 162400 }, { - "epoch": 1.76, - "learning_rate": 3.663812674320555e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017709309775945835, + "loss": 0.0127, "step": 162410 }, { - "epoch": 1.76, - "learning_rate": 3.662191087760265e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017708553006644433, + "loss": 0.0151, "step": 162420 }, { - "epoch": 1.76, - "learning_rate": 3.660569501199974e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017707796237343034, + "loss": 0.0123, "step": 162430 }, { - "epoch": 1.76, - "learning_rate": 3.658947914639683e-05, - "loss": 0.0084, + "epoch": 0.82, + "learning_rate": 0.00017707039468041632, + "loss": 0.0156, "step": 162440 }, { - "epoch": 1.76, - "learning_rate": 3.6573263280793926e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.0001770628269874023, + "loss": 0.0119, "step": 162450 }, { - "epoch": 1.76, - "learning_rate": 3.655704741519102e-05, - "loss": 0.005, + "epoch": 0.82, + "learning_rate": 0.0001770552592943883, + "loss": 0.0128, "step": 162460 }, { - "epoch": 1.76, - "learning_rate": 3.654083154958812e-05, - "loss": 0.0092, + "epoch": 0.82, + "learning_rate": 0.0001770476916013743, + "loss": 0.011, "step": 162470 }, { - "epoch": 1.76, - "learning_rate": 3.652461568398521e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017704012390836027, + "loss": 0.0122, "step": 162480 }, { - "epoch": 1.76, - "learning_rate": 3.65083998183823e-05, - "loss": 0.0047, + "epoch": 0.82, + "learning_rate": 0.00017703255621534628, + "loss": 0.0121, "step": 162490 }, { - "epoch": 1.76, - "learning_rate": 3.6492183952779396e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017702498852233226, + "loss": 0.0117, "step": 162500 }, { - "epoch": 1.76, - "learning_rate": 3.647596808717649e-05, - "loss": 0.0115, + "epoch": 0.82, + "learning_rate": 0.00017701742082931824, + "loss": 0.0103, "step": 162510 }, { - "epoch": 1.76, - "learning_rate": 3.645975222157358e-05, - "loss": 0.0083, + "epoch": 0.82, + "learning_rate": 0.00017700985313630425, + "loss": 0.0104, "step": 162520 }, { - "epoch": 1.76, - "learning_rate": 3.644353635597068e-05, - "loss": 0.0053, + "epoch": 0.82, + "learning_rate": 0.00017700228544329023, + "loss": 0.0142, "step": 162530 }, { - "epoch": 1.76, - "learning_rate": 3.6427320490367774e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.0001769947177502762, + "loss": 0.0133, "step": 162540 }, { - "epoch": 1.76, - "learning_rate": 3.6411104624764867e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.0001769871500572622, + "loss": 0.0139, "step": 162550 }, { - "epoch": 1.76, - "learning_rate": 3.639488875916196e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.0001769795823642482, + "loss": 0.0116, "step": 162560 }, { - "epoch": 1.76, - "learning_rate": 3.637867289355905e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017697201467123418, + "loss": 0.0139, "step": 162570 }, { - "epoch": 1.76, - "learning_rate": 3.636245702795615e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017696444697822017, + "loss": 0.015, "step": 162580 }, { - "epoch": 1.76, - "learning_rate": 3.6346241162353244e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017695687928520617, + "loss": 0.0108, "step": 162590 }, { - "epoch": 1.76, - "learning_rate": 3.633002529675034e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017694931159219216, + "loss": 0.0144, "step": 162600 }, { - "epoch": 1.76, - "learning_rate": 3.631380943114743e-05, - "loss": 0.0077, + "epoch": 0.82, + "learning_rate": 0.00017694174389917814, + "loss": 0.0124, "step": 162610 }, { - "epoch": 1.76, - "learning_rate": 3.629759356554452e-05, - "loss": 0.0077, + "epoch": 0.82, + "learning_rate": 0.00017693417620616415, + "loss": 0.0102, "step": 162620 }, { - "epoch": 1.76, - "learning_rate": 3.628137769994162e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017692660851315013, + "loss": 0.0106, "step": 162630 }, { - "epoch": 1.76, - "learning_rate": 3.6265161834338715e-05, - "loss": 0.0089, + "epoch": 0.82, + "learning_rate": 0.0001769190408201361, + "loss": 0.0111, "step": 162640 }, { - "epoch": 1.76, - "learning_rate": 3.624894596873581e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.00017691147312712212, + "loss": 0.0154, "step": 162650 }, { - "epoch": 1.76, - "learning_rate": 3.62327301031329e-05, - "loss": 0.0078, + "epoch": 0.82, + "learning_rate": 0.0001769039054341081, + "loss": 0.0169, "step": 162660 }, { - "epoch": 1.76, - "learning_rate": 3.621651423752999e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.00017689633774109408, + "loss": 0.013, "step": 162670 }, { - "epoch": 1.76, - "learning_rate": 3.6200298371927086e-05, - "loss": 0.0051, + "epoch": 0.82, + "learning_rate": 0.0001768887700480801, + "loss": 0.0133, "step": 162680 }, { - "epoch": 1.76, - "learning_rate": 3.6184082506324185e-05, - "loss": 0.0081, + "epoch": 0.82, + "learning_rate": 0.00017688120235506607, + "loss": 0.011, "step": 162690 }, { - "epoch": 1.76, - "learning_rate": 3.616786664072128e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017687363466205205, + "loss": 0.0106, "step": 162700 }, { - "epoch": 1.76, - "learning_rate": 3.615165077511837e-05, - "loss": 0.0082, + "epoch": 0.82, + "learning_rate": 0.00017686606696903803, + "loss": 0.0114, "step": 162710 }, { - "epoch": 1.76, - "learning_rate": 3.6135434909515464e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017685849927602404, + "loss": 0.0147, "step": 162720 }, { - "epoch": 1.76, - "learning_rate": 3.6119219043912556e-05, - "loss": 0.0092, + "epoch": 0.82, + "learning_rate": 0.00017685093158301002, + "loss": 0.0114, "step": 162730 }, { - "epoch": 1.76, - "learning_rate": 3.6103003178309656e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.000176843363889996, + "loss": 0.0111, "step": 162740 }, { - "epoch": 1.76, - "learning_rate": 3.608678731270675e-05, - "loss": 0.0084, + "epoch": 0.82, + "learning_rate": 0.000176835796196982, + "loss": 0.0099, "step": 162750 }, { - "epoch": 1.76, - "learning_rate": 3.607057144710385e-05, - "loss": 0.0088, + "epoch": 0.82, + "learning_rate": 0.000176828228503968, + "loss": 0.0131, "step": 162760 }, { - "epoch": 1.76, - "learning_rate": 3.605435558150094e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017682066081095395, + "loss": 0.0133, "step": 162770 }, { - "epoch": 1.76, - "learning_rate": 3.6038139715898034e-05, - "loss": 0.0097, + "epoch": 0.82, + "learning_rate": 0.00017681309311793993, + "loss": 0.0119, "step": 162780 }, { - "epoch": 1.76, - "learning_rate": 3.6021923850295126e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017680552542492594, + "loss": 0.0145, "step": 162790 }, { - "epoch": 1.76, - "learning_rate": 3.600570798469222e-05, - "loss": 0.0083, + "epoch": 0.82, + "learning_rate": 0.00017679795773191192, + "loss": 0.0131, "step": 162800 }, { - "epoch": 1.76, - "learning_rate": 3.598949211908931e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.0001767903900388979, + "loss": 0.0152, "step": 162810 }, { - "epoch": 1.76, - "learning_rate": 3.597327625348641e-05, - "loss": 0.0082, + "epoch": 0.82, + "learning_rate": 0.0001767828223458839, + "loss": 0.0176, "step": 162820 }, { - "epoch": 1.76, - "learning_rate": 3.5957060387883504e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.0001767752546528699, + "loss": 0.014, "step": 162830 }, { - "epoch": 1.76, - "learning_rate": 3.59408445222806e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017676768695985587, + "loss": 0.0114, "step": 162840 }, { - "epoch": 1.76, - "learning_rate": 3.592462865667769e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017676011926684188, + "loss": 0.0139, "step": 162850 }, { - "epoch": 1.76, - "learning_rate": 3.590841279107478e-05, - "loss": 0.0084, + "epoch": 0.82, + "learning_rate": 0.00017675255157382786, + "loss": 0.0103, "step": 162860 }, { - "epoch": 1.76, - "learning_rate": 3.589219692547188e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017674498388081384, + "loss": 0.0114, "step": 162870 }, { - "epoch": 1.76, - "learning_rate": 3.5875981059868975e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017673741618779985, + "loss": 0.0123, "step": 162880 }, { - "epoch": 1.76, - "learning_rate": 3.585976519426607e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017672984849478583, + "loss": 0.0173, "step": 162890 }, { - "epoch": 1.76, - "learning_rate": 3.584354932866316e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017672228080177182, + "loss": 0.0135, "step": 162900 }, { - "epoch": 1.76, - "learning_rate": 3.582733346306025e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017671471310875782, + "loss": 0.0136, "step": 162910 }, { - "epoch": 1.76, - "learning_rate": 3.581111759745735e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.0001767071454157438, + "loss": 0.0115, "step": 162920 }, { - "epoch": 1.76, - "learning_rate": 3.5794901731854445e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.0001766995777227298, + "loss": 0.0139, "step": 162930 }, { - "epoch": 1.76, - "learning_rate": 3.577868586625154e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017669201002971577, + "loss": 0.0116, "step": 162940 }, { - "epoch": 1.76, - "learning_rate": 3.576247000064863e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017668444233670178, + "loss": 0.0155, "step": 162950 }, { - "epoch": 1.76, - "learning_rate": 3.574625413504572e-05, - "loss": 0.0044, + "epoch": 0.82, + "learning_rate": 0.00017667687464368776, + "loss": 0.0123, "step": 162960 }, { - "epoch": 1.76, - "learning_rate": 3.5730038269442816e-05, - "loss": 0.0057, + "epoch": 0.82, + "learning_rate": 0.00017666930695067374, + "loss": 0.0093, "step": 162970 }, { - "epoch": 1.76, - "learning_rate": 3.5713822403839916e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017666173925765975, + "loss": 0.0114, "step": 162980 }, { - "epoch": 1.76, - "learning_rate": 3.569760653823701e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017665417156464573, + "loss": 0.0108, "step": 162990 }, { - "epoch": 1.76, - "learning_rate": 3.56813906726341e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.0001766466038716317, + "loss": 0.0087, "step": 163000 }, { - "epoch": 1.76, - "eval_cer": 0.921507825244034, - "eval_loss": 0.005535805597901344, - "eval_runtime": 121.0817, - "eval_samples_per_second": 16.518, - "eval_steps_per_second": 4.129, + "epoch": 0.82, + "eval_cer": 0.9144401736232748, + "eval_loss": 0.00887399259954691, + "eval_runtime": 116.6416, + "eval_samples_per_second": 17.147, + "eval_steps_per_second": 4.287, "step": 163000 }, { - "epoch": 1.76, - "learning_rate": 3.5665174807031194e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017663903617861772, + "loss": 0.0108, "step": 163010 }, { - "epoch": 1.76, - "learning_rate": 3.5648958941428287e-05, - "loss": 0.0079, + "epoch": 0.82, + "learning_rate": 0.0001766314684856037, + "loss": 0.0116, "step": 163020 }, { - "epoch": 1.76, - "learning_rate": 3.5632743075825386e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017662390079258968, + "loss": 0.0129, "step": 163030 }, { - "epoch": 1.76, - "learning_rate": 3.561652721022248e-05, - "loss": 0.0053, + "epoch": 0.82, + "learning_rate": 0.0001766163330995757, + "loss": 0.011, "step": 163040 }, { - "epoch": 1.76, - "learning_rate": 3.560031134461957e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017660876540656167, + "loss": 0.0127, "step": 163050 }, { - "epoch": 1.76, - "learning_rate": 3.5584095479016664e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017660119771354765, + "loss": 0.014, "step": 163060 }, { - "epoch": 1.76, - "learning_rate": 3.556787961341376e-05, - "loss": 0.0053, + "epoch": 0.82, + "learning_rate": 0.00017659363002053366, + "loss": 0.0137, "step": 163070 }, { - "epoch": 1.76, - "learning_rate": 3.5551663747810857e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017658606232751964, + "loss": 0.0109, "step": 163080 }, { - "epoch": 1.76, - "learning_rate": 3.553544788220795e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017657849463450563, + "loss": 0.0148, "step": 163090 }, { - "epoch": 1.76, - "learning_rate": 3.551923201660504e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.0001765709269414916, + "loss": 0.0113, "step": 163100 }, { - "epoch": 1.76, - "learning_rate": 3.550301615100214e-05, - "loss": 0.0049, + "epoch": 0.82, + "learning_rate": 0.00017656335924847762, + "loss": 0.0107, "step": 163110 }, { - "epoch": 1.76, - "learning_rate": 3.5486800285399234e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.0001765557915554636, + "loss": 0.0121, "step": 163120 }, { - "epoch": 1.76, - "learning_rate": 3.547058441979633e-05, - "loss": 0.0091, + "epoch": 0.82, + "learning_rate": 0.00017654822386244958, + "loss": 0.0124, "step": 163130 }, { - "epoch": 1.76, - "learning_rate": 3.545436855419342e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.0001765406561694356, + "loss": 0.0104, "step": 163140 }, { - "epoch": 1.76, - "learning_rate": 3.543815268859051e-05, - "loss": 0.0049, + "epoch": 0.82, + "learning_rate": 0.00017653308847642157, + "loss": 0.0127, "step": 163150 }, { - "epoch": 1.76, - "learning_rate": 3.542193682298761e-05, - "loss": 0.0052, + "epoch": 0.82, + "learning_rate": 0.00017652552078340755, + "loss": 0.0112, "step": 163160 }, { - "epoch": 1.76, - "learning_rate": 3.5405720957384705e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017651795309039356, + "loss": 0.014, "step": 163170 }, { - "epoch": 1.76, - "learning_rate": 3.53895050917818e-05, - "loss": 0.0053, + "epoch": 0.82, + "learning_rate": 0.00017651038539737954, + "loss": 0.0109, "step": 163180 }, { - "epoch": 1.76, - "learning_rate": 3.537328922617889e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017650281770436552, + "loss": 0.0139, "step": 163190 }, { - "epoch": 1.76, - "learning_rate": 3.535707336057598e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017649525001135153, + "loss": 0.0115, "step": 163200 }, { - "epoch": 1.76, - "learning_rate": 3.534085749497308e-05, - "loss": 0.0055, + "epoch": 0.82, + "learning_rate": 0.0001764876823183375, + "loss": 0.0113, "step": 163210 }, { - "epoch": 1.76, - "learning_rate": 3.5324641629370175e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.0001764801146253235, + "loss": 0.0175, "step": 163220 }, { - "epoch": 1.76, - "learning_rate": 3.530842576376727e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.0001764725469323095, + "loss": 0.0156, "step": 163230 }, { - "epoch": 1.76, - "learning_rate": 3.529220989816436e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017646497923929548, + "loss": 0.0146, "step": 163240 }, { - "epoch": 1.76, - "learning_rate": 3.5275994032561454e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017645741154628146, + "loss": 0.0101, "step": 163250 }, { - "epoch": 1.76, - "learning_rate": 3.5259778166958546e-05, - "loss": 0.0079, + "epoch": 0.82, + "learning_rate": 0.00017644984385326745, + "loss": 0.0131, "step": 163260 }, { - "epoch": 1.77, - "learning_rate": 3.5243562301355646e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017644227616025345, + "loss": 0.0115, "step": 163270 }, { - "epoch": 1.77, - "learning_rate": 3.522734643575274e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017643470846723944, + "loss": 0.0112, "step": 163280 }, { - "epoch": 1.77, - "learning_rate": 3.521113057014983e-05, - "loss": 0.0054, + "epoch": 0.82, + "learning_rate": 0.00017642714077422542, + "loss": 0.0121, "step": 163290 }, { - "epoch": 1.77, - "learning_rate": 3.5194914704546924e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017641957308121143, + "loss": 0.0116, "step": 163300 }, { - "epoch": 1.77, - "learning_rate": 3.517869883894402e-05, - "loss": 0.0084, + "epoch": 0.82, + "learning_rate": 0.0001764120053881974, + "loss": 0.0129, "step": 163310 }, { - "epoch": 1.77, - "learning_rate": 3.5162482973341116e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.0001764044376951834, + "loss": 0.0151, "step": 163320 }, { - "epoch": 1.77, - "learning_rate": 3.514626710773821e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.0001763968700021694, + "loss": 0.0129, "step": 163330 }, { - "epoch": 1.77, - "learning_rate": 3.51300512421353e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017638930230915538, + "loss": 0.0104, "step": 163340 }, { - "epoch": 1.77, - "learning_rate": 3.5113835376532394e-05, - "loss": 0.0087, + "epoch": 0.82, + "learning_rate": 0.00017638173461614136, + "loss": 0.0112, "step": 163350 }, { - "epoch": 1.77, - "learning_rate": 3.509761951092949e-05, - "loss": 0.0048, + "epoch": 0.82, + "learning_rate": 0.00017637416692312737, + "loss": 0.0176, "step": 163360 }, { - "epoch": 1.77, - "learning_rate": 3.508140364532659e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017636659923011335, + "loss": 0.013, "step": 163370 }, { - "epoch": 1.77, - "learning_rate": 3.506518777972368e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017635903153709933, + "loss": 0.0107, "step": 163380 }, { - "epoch": 1.77, - "learning_rate": 3.504897191412077e-05, - "loss": 0.0057, + "epoch": 0.82, + "learning_rate": 0.00017635146384408534, + "loss": 0.0144, "step": 163390 }, { - "epoch": 1.77, - "learning_rate": 3.5032756048517865e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017634389615107132, + "loss": 0.0103, "step": 163400 }, { - "epoch": 1.77, - "learning_rate": 3.501654018291496e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.0001763363284580573, + "loss": 0.0186, "step": 163410 }, { - "epoch": 1.77, - "learning_rate": 3.500032431731205e-05, - "loss": 0.0081, + "epoch": 0.82, + "learning_rate": 0.0001763287607650433, + "loss": 0.0119, "step": 163420 }, { - "epoch": 1.77, - "learning_rate": 3.498410845170915e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.0001763211930720293, + "loss": 0.0118, "step": 163430 }, { - "epoch": 1.77, - "learning_rate": 3.496789258610624e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017631362537901527, + "loss": 0.0124, "step": 163440 }, { - "epoch": 1.77, - "learning_rate": 3.4951676720503335e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017630605768600126, + "loss": 0.0119, "step": 163450 }, { - "epoch": 1.77, - "learning_rate": 3.493546085490043e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017629848999298726, + "loss": 0.0149, "step": 163460 }, { - "epoch": 1.77, - "learning_rate": 3.491924498929753e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017629092229997325, + "loss": 0.013, "step": 163470 }, { - "epoch": 1.77, - "learning_rate": 3.490302912369462e-05, - "loss": 0.0052, + "epoch": 0.82, + "learning_rate": 0.00017628335460695923, + "loss": 0.0112, "step": 163480 }, { - "epoch": 1.77, - "learning_rate": 3.488681325809171e-05, - "loss": 0.0052, + "epoch": 0.82, + "learning_rate": 0.00017627578691394524, + "loss": 0.011, "step": 163490 }, { - "epoch": 1.77, - "learning_rate": 3.487059739248881e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017626821922093122, + "loss": 0.0104, "step": 163500 }, { - "epoch": 1.77, - "learning_rate": 3.4854381526885905e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.0001762606515279172, + "loss": 0.0106, "step": 163510 }, { - "epoch": 1.77, - "learning_rate": 3.4838165661283e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.0001762530838349032, + "loss": 0.0114, "step": 163520 }, { - "epoch": 1.77, - "learning_rate": 3.482194979568009e-05, - "loss": 0.0089, + "epoch": 0.83, + "learning_rate": 0.0001762455161418892, + "loss": 0.012, "step": 163530 }, { - "epoch": 1.77, - "learning_rate": 3.4805733930077184e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017623794844887517, + "loss": 0.0131, "step": 163540 }, { - "epoch": 1.77, - "learning_rate": 3.4789518064474276e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.00017623038075586118, + "loss": 0.0114, "step": 163550 }, { - "epoch": 1.77, - "learning_rate": 3.4773302198871376e-05, - "loss": 0.0045, + "epoch": 0.83, + "learning_rate": 0.00017622281306284716, + "loss": 0.0109, "step": 163560 }, { - "epoch": 1.77, - "learning_rate": 3.475708633326847e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.00017621524536983314, + "loss": 0.0081, "step": 163570 }, { - "epoch": 1.77, - "learning_rate": 3.474087046766556e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.00017620767767681915, + "loss": 0.0116, "step": 163580 }, { - "epoch": 1.77, - "learning_rate": 3.4724654602062654e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017620010998380513, + "loss": 0.0141, "step": 163590 }, { - "epoch": 1.77, - "learning_rate": 3.470843873645975e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.0001761925422907911, + "loss": 0.0126, "step": 163600 }, { - "epoch": 1.77, - "learning_rate": 3.4692222870856846e-05, - "loss": 0.0078, + "epoch": 0.83, + "learning_rate": 0.0001761849745977771, + "loss": 0.0111, "step": 163610 }, { - "epoch": 1.77, - "learning_rate": 3.467600700525394e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.0001761774069047631, + "loss": 0.0096, "step": 163620 }, { - "epoch": 1.77, - "learning_rate": 3.465979113965103e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017616983921174908, + "loss": 0.01, "step": 163630 }, { - "epoch": 1.77, - "learning_rate": 3.4643575274048125e-05, - "loss": 0.0079, + "epoch": 0.83, + "learning_rate": 0.00017616227151873507, + "loss": 0.0098, "step": 163640 }, { - "epoch": 1.77, - "learning_rate": 3.462735940844522e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017615470382572107, + "loss": 0.0147, "step": 163650 }, { - "epoch": 1.77, - "learning_rate": 3.461114354284232e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017614713613270706, + "loss": 0.0122, "step": 163660 }, { - "epoch": 1.77, - "learning_rate": 3.459492767723941e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.00017613956843969304, + "loss": 0.0112, "step": 163670 }, { - "epoch": 1.77, - "learning_rate": 3.45787118116365e-05, - "loss": 0.0087, + "epoch": 0.83, + "learning_rate": 0.00017613200074667905, + "loss": 0.0117, "step": 163680 }, { - "epoch": 1.77, - "learning_rate": 3.4562495946033595e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.00017612443305366503, + "loss": 0.0117, "step": 163690 }, { - "epoch": 1.77, - "learning_rate": 3.454628008043069e-05, - "loss": 0.0084, + "epoch": 0.83, + "learning_rate": 0.000176116865360651, + "loss": 0.013, "step": 163700 }, { - "epoch": 1.77, - "learning_rate": 3.453006421482778e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.00017610929766763702, + "loss": 0.0121, "step": 163710 }, { - "epoch": 1.77, - "learning_rate": 3.451384834922488e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.000176101729974623, + "loss": 0.0133, "step": 163720 }, { - "epoch": 1.77, - "learning_rate": 3.449763248362197e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017609416228160898, + "loss": 0.0118, "step": 163730 }, { - "epoch": 1.77, - "learning_rate": 3.4481416618019066e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.000176086594588595, + "loss": 0.0106, "step": 163740 }, { - "epoch": 1.77, - "learning_rate": 3.446520075241616e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.00017607902689558097, + "loss": 0.0129, "step": 163750 }, { - "epoch": 1.77, - "learning_rate": 3.444898488681325e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017607145920256695, + "loss": 0.012, "step": 163760 }, { - "epoch": 1.77, - "learning_rate": 3.443276902121035e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.00017606389150955293, + "loss": 0.0138, "step": 163770 }, { - "epoch": 1.77, - "learning_rate": 3.4416553155607443e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017605632381653894, + "loss": 0.0132, "step": 163780 }, { - "epoch": 1.77, - "learning_rate": 3.4400337290004536e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017604875612352492, + "loss": 0.0206, "step": 163790 }, { - "epoch": 1.77, - "learning_rate": 3.438412142440163e-05, - "loss": 0.0078, + "epoch": 0.83, + "learning_rate": 0.0001760411884305109, + "loss": 0.0131, "step": 163800 }, { - "epoch": 1.77, - "learning_rate": 3.436790555879872e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.0001760336207374969, + "loss": 0.0162, "step": 163810 }, { - "epoch": 1.77, - "learning_rate": 3.4351689693195814e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.0001760260530444829, + "loss": 0.0125, "step": 163820 }, { - "epoch": 1.77, - "learning_rate": 3.4335473827592914e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.00017601848535146888, + "loss": 0.0117, "step": 163830 }, { - "epoch": 1.77, - "learning_rate": 3.431925796199001e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017601091765845488, + "loss": 0.0132, "step": 163840 }, { - "epoch": 1.77, - "learning_rate": 3.4303042096387106e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017600334996544087, + "loss": 0.0109, "step": 163850 }, { - "epoch": 1.77, - "learning_rate": 3.42868262307842e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.00017599578227242685, + "loss": 0.0156, "step": 163860 }, { - "epoch": 1.77, - "learning_rate": 3.427061036518129e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.00017598821457941286, + "loss": 0.0141, "step": 163870 }, { - "epoch": 1.77, - "learning_rate": 3.4254394499578384e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017598064688639884, + "loss": 0.0145, "step": 163880 }, { - "epoch": 1.77, - "learning_rate": 3.423817863397548e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.00017597307919338482, + "loss": 0.0128, "step": 163890 }, { - "epoch": 1.77, - "learning_rate": 3.422196276837258e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017596551150037083, + "loss": 0.0138, "step": 163900 }, { - "epoch": 1.77, - "learning_rate": 3.420574690276967e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.0001759579438073568, + "loss": 0.0102, "step": 163910 }, { - "epoch": 1.77, - "learning_rate": 3.418953103716676e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.0001759503761143428, + "loss": 0.016, "step": 163920 }, { - "epoch": 1.77, - "learning_rate": 3.4173315171563855e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.0001759428084213288, + "loss": 0.016, "step": 163930 }, { - "epoch": 1.77, - "learning_rate": 3.415709930596095e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017593524072831478, + "loss": 0.0106, "step": 163940 }, { - "epoch": 1.77, - "learning_rate": 3.414088344035805e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.00017592767303530076, + "loss": 0.0141, "step": 163950 }, { - "epoch": 1.77, - "learning_rate": 3.412466757475514e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.00017592010534228674, + "loss": 0.0091, "step": 163960 }, { - "epoch": 1.77, - "learning_rate": 3.410845170915223e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.00017591253764927275, + "loss": 0.0125, "step": 163970 }, { - "epoch": 1.77, - "learning_rate": 3.4092235843549325e-05, - "loss": 0.0056, + "epoch": 0.83, + "learning_rate": 0.00017590496995625873, + "loss": 0.0139, "step": 163980 }, { - "epoch": 1.77, - "learning_rate": 3.407601997794642e-05, - "loss": 0.005, + "epoch": 0.83, + "learning_rate": 0.00017589740226324471, + "loss": 0.0128, "step": 163990 }, { - "epoch": 1.77, - "learning_rate": 3.405980411234351e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017588983457023072, + "loss": 0.0148, "step": 164000 }, { - "epoch": 1.77, - "eval_cer": 0.9215086938469904, - "eval_loss": 0.005612937733530998, - "eval_runtime": 121.4334, - "eval_samples_per_second": 16.47, - "eval_steps_per_second": 4.117, + "epoch": 0.83, + "eval_cer": 0.914481900656667, + "eval_loss": 0.009098981507122517, + "eval_runtime": 116.6318, + "eval_samples_per_second": 17.148, + "eval_steps_per_second": 4.287, "step": 164000 }, { - "epoch": 1.77, - "learning_rate": 3.404358824674061e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.0001758822668772167, + "loss": 0.0169, "step": 164010 }, { - "epoch": 1.77, - "learning_rate": 3.40273723811377e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.00017587469918420269, + "loss": 0.0105, "step": 164020 }, { - "epoch": 1.77, - "learning_rate": 3.4011156515534796e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017586713149118864, + "loss": 0.0115, "step": 164030 }, { - "epoch": 1.77, - "learning_rate": 3.399494064993189e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017585956379817465, + "loss": 0.011, "step": 164040 }, { - "epoch": 1.77, - "learning_rate": 3.397872478432898e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.00017585199610516063, + "loss": 0.0092, "step": 164050 }, { - "epoch": 1.77, - "learning_rate": 3.396250891872608e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.0001758444284121466, + "loss": 0.0128, "step": 164060 }, { - "epoch": 1.77, - "learning_rate": 3.3946293053123174e-05, - "loss": 0.0089, + "epoch": 0.83, + "learning_rate": 0.00017583686071913262, + "loss": 0.0118, "step": 164070 }, { - "epoch": 1.77, - "learning_rate": 3.3930077187520266e-05, - "loss": 0.0084, + "epoch": 0.83, + "learning_rate": 0.0001758292930261186, + "loss": 0.0104, "step": 164080 }, { - "epoch": 1.77, - "learning_rate": 3.391386132191736e-05, - "loss": 0.0083, + "epoch": 0.83, + "learning_rate": 0.00017582172533310458, + "loss": 0.0117, "step": 164090 }, { - "epoch": 1.77, - "learning_rate": 3.389764545631445e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.0001758141576400906, + "loss": 0.0123, "step": 164100 }, { - "epoch": 1.77, - "learning_rate": 3.3881429590711545e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017580658994707657, + "loss": 0.0113, "step": 164110 }, { - "epoch": 1.77, - "learning_rate": 3.3865213725108644e-05, - "loss": 0.0088, + "epoch": 0.83, + "learning_rate": 0.00017579902225406255, + "loss": 0.0085, "step": 164120 }, { - "epoch": 1.77, - "learning_rate": 3.384899785950574e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.00017579145456104856, + "loss": 0.01, "step": 164130 }, { - "epoch": 1.77, - "learning_rate": 3.383278199390283e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017578388686803454, + "loss": 0.0129, "step": 164140 }, { - "epoch": 1.77, - "learning_rate": 3.381656612829992e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017577631917502053, + "loss": 0.0115, "step": 164150 }, { - "epoch": 1.77, - "learning_rate": 3.3800350262697015e-05, - "loss": 0.0052, + "epoch": 0.83, + "learning_rate": 0.0001757687514820065, + "loss": 0.0104, "step": 164160 }, { - "epoch": 1.77, - "learning_rate": 3.3784134397094115e-05, - "loss": 0.008, + "epoch": 0.83, + "learning_rate": 0.00017576118378899252, + "loss": 0.0162, "step": 164170 }, { - "epoch": 1.77, - "learning_rate": 3.376791853149121e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.0001757536160959785, + "loss": 0.0133, "step": 164180 }, { - "epoch": 1.77, - "learning_rate": 3.375170266588831e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017574604840296448, + "loss": 0.0133, "step": 164190 }, { - "epoch": 1.78, - "learning_rate": 3.37354868002854e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.0001757384807099505, + "loss": 0.0137, "step": 164200 }, { - "epoch": 1.78, - "learning_rate": 3.371927093468249e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017573091301693647, + "loss": 0.0119, "step": 164210 }, { - "epoch": 1.78, - "learning_rate": 3.3703055069079585e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.00017572334532392245, + "loss": 0.0125, "step": 164220 }, { - "epoch": 1.78, - "learning_rate": 3.368683920347668e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017571577763090846, + "loss": 0.0117, "step": 164230 }, { - "epoch": 1.78, - "learning_rate": 3.367062333787378e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.00017570820993789444, + "loss": 0.0152, "step": 164240 }, { - "epoch": 1.78, - "learning_rate": 3.365440747227087e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017570064224488042, + "loss": 0.0141, "step": 164250 }, { - "epoch": 1.78, - "learning_rate": 3.363819160666796e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.00017569307455186643, + "loss": 0.0122, "step": 164260 }, { - "epoch": 1.78, - "learning_rate": 3.3621975741065056e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.0001756855068588524, + "loss": 0.0126, "step": 164270 }, { - "epoch": 1.78, - "learning_rate": 3.360575987546215e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.0001756779391658384, + "loss": 0.0112, "step": 164280 }, { - "epoch": 1.78, - "learning_rate": 3.358954400985924e-05, - "loss": 0.0053, + "epoch": 0.83, + "learning_rate": 0.0001756703714728244, + "loss": 0.0101, "step": 164290 }, { - "epoch": 1.78, - "learning_rate": 3.357332814425634e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.00017566280377981038, + "loss": 0.0127, "step": 164300 }, { - "epoch": 1.78, - "learning_rate": 3.355711227865343e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017565523608679636, + "loss": 0.0159, "step": 164310 }, { - "epoch": 1.78, - "learning_rate": 3.3540896413050526e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017564766839378237, + "loss": 0.0124, "step": 164320 }, { - "epoch": 1.78, - "learning_rate": 3.352468054744762e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.00017564010070076835, + "loss": 0.0119, "step": 164330 }, { - "epoch": 1.78, - "learning_rate": 3.350846468184471e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.00017563253300775434, + "loss": 0.013, "step": 164340 }, { - "epoch": 1.78, - "learning_rate": 3.349224881624181e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017562496531474032, + "loss": 0.0102, "step": 164350 }, { - "epoch": 1.78, - "learning_rate": 3.3476032950638904e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.00017561739762172633, + "loss": 0.0148, "step": 164360 }, { - "epoch": 1.78, - "learning_rate": 3.3459817085036e-05, - "loss": 0.0043, + "epoch": 0.83, + "learning_rate": 0.0001756098299287123, + "loss": 0.0117, "step": 164370 }, { - "epoch": 1.78, - "learning_rate": 3.344360121943309e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.0001756022622356983, + "loss": 0.0124, "step": 164380 }, { - "epoch": 1.78, - "learning_rate": 3.342738535383018e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.0001755946945426843, + "loss": 0.0129, "step": 164390 }, { - "epoch": 1.78, - "learning_rate": 3.3411169488227275e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.00017558712684967028, + "loss": 0.0101, "step": 164400 }, { - "epoch": 1.78, - "learning_rate": 3.3394953622624374e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.00017557955915665626, + "loss": 0.0136, "step": 164410 }, { - "epoch": 1.78, - "learning_rate": 3.337873775702147e-05, - "loss": 0.0082, + "epoch": 0.83, + "learning_rate": 0.00017557199146364227, + "loss": 0.0121, "step": 164420 }, { - "epoch": 1.78, - "learning_rate": 3.336252189141856e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.00017556442377062825, + "loss": 0.0123, "step": 164430 }, { - "epoch": 1.78, - "learning_rate": 3.334630602581565e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017555685607761423, + "loss": 0.0108, "step": 164440 }, { - "epoch": 1.78, - "learning_rate": 3.3330090160212745e-05, - "loss": 0.0086, + "epoch": 0.83, + "learning_rate": 0.00017554928838460024, + "loss": 0.0126, "step": 164450 }, { - "epoch": 1.78, - "learning_rate": 3.3313874294609845e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.00017554172069158622, + "loss": 0.012, "step": 164460 }, { - "epoch": 1.78, - "learning_rate": 3.329765842900694e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.0001755341529985722, + "loss": 0.0112, "step": 164470 }, { - "epoch": 1.78, - "learning_rate": 3.328144256340403e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.0001755265853055582, + "loss": 0.0139, "step": 164480 }, { - "epoch": 1.78, - "learning_rate": 3.326522669780112e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.0001755190176125442, + "loss": 0.0129, "step": 164490 }, { - "epoch": 1.78, - "learning_rate": 3.3249010832198216e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017551144991953017, + "loss": 0.012, "step": 164500 }, { - "epoch": 1.78, - "learning_rate": 3.3232794966595315e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017550388222651616, + "loss": 0.0103, "step": 164510 }, { - "epoch": 1.78, - "learning_rate": 3.321657910099241e-05, - "loss": 0.0132, + "epoch": 0.83, + "learning_rate": 0.00017549631453350216, + "loss": 0.0139, "step": 164520 }, { - "epoch": 1.78, - "learning_rate": 3.32003632353895e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017548874684048815, + "loss": 0.01, "step": 164530 }, { - "epoch": 1.78, - "learning_rate": 3.31841473697866e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017548117914747413, + "loss": 0.0083, "step": 164540 }, { - "epoch": 1.78, - "learning_rate": 3.316793150418369e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017547361145446014, + "loss": 0.015, "step": 164550 }, { - "epoch": 1.78, - "learning_rate": 3.3151715638580786e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017546604376144612, + "loss": 0.0137, "step": 164560 }, { - "epoch": 1.78, - "learning_rate": 3.313549977297788e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.0001754584760684321, + "loss": 0.0121, "step": 164570 }, { - "epoch": 1.78, - "learning_rate": 3.311928390737497e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.0001754509083754181, + "loss": 0.0107, "step": 164580 }, { - "epoch": 1.78, - "learning_rate": 3.310306804177207e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.0001754433406824041, + "loss": 0.0125, "step": 164590 }, { - "epoch": 1.78, - "learning_rate": 3.3086852176169164e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017543577298939007, + "loss": 0.014, "step": 164600 }, { - "epoch": 1.78, - "learning_rate": 3.3070636310566256e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.00017542820529637608, + "loss": 0.0104, "step": 164610 }, { - "epoch": 1.78, - "learning_rate": 3.305442044496335e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.00017542063760336206, + "loss": 0.016, "step": 164620 }, { - "epoch": 1.78, - "learning_rate": 3.303820457936044e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017541306991034804, + "loss": 0.0153, "step": 164630 }, { - "epoch": 1.78, - "learning_rate": 3.302198871375754e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.00017540550221733405, + "loss": 0.0118, "step": 164640 }, { - "epoch": 1.78, - "learning_rate": 3.3005772848154634e-05, - "loss": 0.0053, + "epoch": 0.83, + "learning_rate": 0.00017539793452432003, + "loss": 0.0119, "step": 164650 }, { - "epoch": 1.78, - "learning_rate": 3.298955698255173e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.000175390366831306, + "loss": 0.0114, "step": 164660 }, { - "epoch": 1.78, - "learning_rate": 3.297334111694882e-05, - "loss": 0.0079, + "epoch": 0.83, + "learning_rate": 0.000175382799138292, + "loss": 0.0138, "step": 164670 }, { - "epoch": 1.78, - "learning_rate": 3.295712525134591e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.000175375231445278, + "loss": 0.0159, "step": 164680 }, { - "epoch": 1.78, - "learning_rate": 3.2940909385743005e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017536766375226398, + "loss": 0.013, "step": 164690 }, { - "epoch": 1.78, - "learning_rate": 3.2924693520140105e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017536009605924997, + "loss": 0.0117, "step": 164700 }, { - "epoch": 1.78, - "learning_rate": 3.29084776545372e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017535252836623597, + "loss": 0.011, "step": 164710 }, { - "epoch": 1.78, - "learning_rate": 3.289226178893429e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.00017534496067322196, + "loss": 0.0126, "step": 164720 }, { - "epoch": 1.78, - "learning_rate": 3.287604592333138e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017533739298020794, + "loss": 0.0095, "step": 164730 }, { - "epoch": 1.78, - "learning_rate": 3.2859830057728476e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017532982528719395, + "loss": 0.0147, "step": 164740 }, { - "epoch": 1.78, - "learning_rate": 3.2843614192125575e-05, - "loss": 0.0091, + "epoch": 0.83, + "learning_rate": 0.00017532225759417993, + "loss": 0.0116, "step": 164750 }, { - "epoch": 1.78, - "learning_rate": 3.282739832652267e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.0001753146899011659, + "loss": 0.0159, "step": 164760 }, { - "epoch": 1.78, - "learning_rate": 3.281118246091976e-05, - "loss": 0.0079, + "epoch": 0.83, + "learning_rate": 0.00017530712220815192, + "loss": 0.016, "step": 164770 }, { - "epoch": 1.78, - "learning_rate": 3.279496659531685e-05, - "loss": 0.0056, + "epoch": 0.83, + "learning_rate": 0.0001752995545151379, + "loss": 0.0113, "step": 164780 }, { - "epoch": 1.78, - "learning_rate": 3.2778750729713946e-05, - "loss": 0.0042, + "epoch": 0.83, + "learning_rate": 0.00017529198682212388, + "loss": 0.0161, "step": 164790 }, { - "epoch": 1.78, - "learning_rate": 3.2762534864111046e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.0001752844191291099, + "loss": 0.0122, "step": 164800 }, { - "epoch": 1.78, - "learning_rate": 3.274631899850814e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.00017527685143609587, + "loss": 0.0103, "step": 164810 }, { - "epoch": 1.78, - "learning_rate": 3.273010313290523e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017526928374308185, + "loss": 0.0138, "step": 164820 }, { - "epoch": 1.78, - "learning_rate": 3.2713887267302324e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.00017526171605006783, + "loss": 0.0142, "step": 164830 }, { - "epoch": 1.78, - "learning_rate": 3.2697671401699417e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.00017525414835705384, + "loss": 0.0111, "step": 164840 }, { - "epoch": 1.78, - "learning_rate": 3.268145553609651e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.00017524658066403982, + "loss": 0.012, "step": 164850 }, { - "epoch": 1.78, - "learning_rate": 3.266523967049361e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.0001752390129710258, + "loss": 0.0133, "step": 164860 }, { - "epoch": 1.78, - "learning_rate": 3.26490238048907e-05, - "loss": 0.0056, + "epoch": 0.83, + "learning_rate": 0.0001752314452780118, + "loss": 0.0146, "step": 164870 }, { - "epoch": 1.78, - "learning_rate": 3.2632807939287794e-05, - "loss": 0.0101, + "epoch": 0.83, + "learning_rate": 0.0001752238775849978, + "loss": 0.013, "step": 164880 }, { - "epoch": 1.78, - "learning_rate": 3.261659207368489e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.00017521630989198378, + "loss": 0.0146, "step": 164890 }, { - "epoch": 1.78, - "learning_rate": 3.2600376208081987e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017520874219896978, + "loss": 0.0109, "step": 164900 }, { - "epoch": 1.78, - "learning_rate": 3.258416034247908e-05, - "loss": 0.0052, + "epoch": 0.83, + "learning_rate": 0.00017520117450595577, + "loss": 0.0128, "step": 164910 }, { - "epoch": 1.78, - "learning_rate": 3.256794447687617e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017519360681294175, + "loss": 0.0135, "step": 164920 }, { - "epoch": 1.78, - "learning_rate": 3.255172861127327e-05, - "loss": 0.0079, + "epoch": 0.83, + "learning_rate": 0.00017518603911992776, + "loss": 0.015, "step": 164930 }, { - "epoch": 1.78, - "learning_rate": 3.2535512745670364e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.00017517847142691374, + "loss": 0.0097, "step": 164940 }, { - "epoch": 1.78, - "learning_rate": 3.251929688006746e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017517090373389972, + "loss": 0.013, "step": 164950 }, { - "epoch": 1.78, - "learning_rate": 3.250308101446455e-05, - "loss": 0.0078, + "epoch": 0.83, + "learning_rate": 0.00017516333604088573, + "loss": 0.0096, "step": 164960 }, { - "epoch": 1.78, - "learning_rate": 3.248686514886164e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.0001751557683478717, + "loss": 0.0137, "step": 164970 }, { - "epoch": 1.78, - "learning_rate": 3.2470649283258735e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.0001751482006548577, + "loss": 0.0133, "step": 164980 }, { - "epoch": 1.78, - "learning_rate": 3.2454433417655835e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.0001751406329618437, + "loss": 0.0143, "step": 164990 }, { - "epoch": 1.78, - "learning_rate": 3.243821755205293e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.00017513306526882968, + "loss": 0.0129, "step": 165000 }, { - "epoch": 1.78, - "eval_cer": 0.9215251973031615, - "eval_loss": 0.005625674035400152, - "eval_runtime": 121.2135, - "eval_samples_per_second": 16.5, - "eval_steps_per_second": 4.125, + "epoch": 0.83, + "eval_cer": 0.9144586111496574, + "eval_loss": 0.008332598023116589, + "eval_runtime": 116.7175, + "eval_samples_per_second": 17.135, + "eval_steps_per_second": 4.284, "step": 165000 }, { - "epoch": 1.78, - "learning_rate": 3.242200168645002e-05, - "loss": 0.0093, + "epoch": 0.83, + "learning_rate": 0.00017512549757581566, + "loss": 0.0141, "step": 165010 }, { - "epoch": 1.78, - "learning_rate": 3.240578582084711e-05, - "loss": 0.0081, + "epoch": 0.83, + "learning_rate": 0.00017511792988280164, + "loss": 0.0119, "step": 165020 }, { - "epoch": 1.78, - "learning_rate": 3.2389569955244206e-05, - "loss": 0.0079, + "epoch": 0.83, + "learning_rate": 0.00017511036218978765, + "loss": 0.0104, "step": 165030 }, { - "epoch": 1.78, - "learning_rate": 3.2373354089641305e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017510279449677363, + "loss": 0.0161, "step": 165040 }, { - "epoch": 1.78, - "learning_rate": 3.23571382240384e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017509522680375961, + "loss": 0.0128, "step": 165050 }, { - "epoch": 1.78, - "learning_rate": 3.234092235843549e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.00017508765911074562, + "loss": 0.0116, "step": 165060 }, { - "epoch": 1.78, - "learning_rate": 3.2324706492832584e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.0001750800914177316, + "loss": 0.0123, "step": 165070 }, { - "epoch": 1.78, - "learning_rate": 3.2308490627229676e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017507252372471759, + "loss": 0.0106, "step": 165080 }, { - "epoch": 1.78, - "learning_rate": 3.2292274761626776e-05, - "loss": 0.0053, + "epoch": 0.83, + "learning_rate": 0.0001750649560317036, + "loss": 0.0124, "step": 165090 }, { - "epoch": 1.78, - "learning_rate": 3.227605889602387e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017505738833868958, + "loss": 0.0103, "step": 165100 }, { - "epoch": 1.78, - "learning_rate": 3.225984303042096e-05, - "loss": 0.0046, + "epoch": 0.83, + "learning_rate": 0.00017504982064567556, + "loss": 0.0126, "step": 165110 }, { - "epoch": 1.79, - "learning_rate": 3.2243627164818054e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017504225295266157, + "loss": 0.0129, "step": 165120 }, { - "epoch": 1.79, - "learning_rate": 3.222741129921515e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017503468525964755, + "loss": 0.0126, "step": 165130 }, { - "epoch": 1.79, - "learning_rate": 3.221119543361224e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017502711756663353, + "loss": 0.0123, "step": 165140 }, { - "epoch": 1.79, - "learning_rate": 3.219497956800934e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.00017501954987361954, + "loss": 0.015, "step": 165150 }, { - "epoch": 1.79, - "learning_rate": 3.217876370240643e-05, - "loss": 0.0056, + "epoch": 0.83, + "learning_rate": 0.00017501198218060552, + "loss": 0.0114, "step": 165160 }, { - "epoch": 1.79, - "learning_rate": 3.2162547836803525e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.0001750044144875915, + "loss": 0.0114, "step": 165170 }, { - "epoch": 1.79, - "learning_rate": 3.214633197120062e-05, - "loss": 0.0053, + "epoch": 0.83, + "learning_rate": 0.00017499684679457748, + "loss": 0.0153, "step": 165180 }, { - "epoch": 1.79, - "learning_rate": 3.213011610559771e-05, - "loss": 0.0053, + "epoch": 0.83, + "learning_rate": 0.0001749892791015635, + "loss": 0.0112, "step": 165190 }, { - "epoch": 1.79, - "learning_rate": 3.211390023999481e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017498171140854947, + "loss": 0.01, "step": 165200 }, { - "epoch": 1.79, - "learning_rate": 3.20976843743919e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017497414371553545, + "loss": 0.0115, "step": 165210 }, { - "epoch": 1.79, - "learning_rate": 3.2081468508788995e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.00017496657602252146, + "loss": 0.0123, "step": 165220 }, { - "epoch": 1.79, - "learning_rate": 3.206525264318609e-05, - "loss": 0.0089, + "epoch": 0.83, + "learning_rate": 0.00017495900832950744, + "loss": 0.0108, "step": 165230 }, { - "epoch": 1.79, - "learning_rate": 3.204903677758318e-05, - "loss": 0.0082, + "epoch": 0.83, + "learning_rate": 0.00017495144063649342, + "loss": 0.0118, "step": 165240 }, { - "epoch": 1.79, - "learning_rate": 3.203282091198028e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.00017494387294347943, + "loss": 0.0105, "step": 165250 }, { - "epoch": 1.79, - "learning_rate": 3.201660504637737e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017493630525046541, + "loss": 0.0114, "step": 165260 }, { - "epoch": 1.79, - "learning_rate": 3.2000389180774466e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.0001749287375574514, + "loss": 0.0103, "step": 165270 }, { - "epoch": 1.79, - "learning_rate": 3.1984173315171565e-05, - "loss": 0.0043, + "epoch": 0.83, + "learning_rate": 0.0001749211698644374, + "loss": 0.0143, "step": 165280 }, { - "epoch": 1.79, - "learning_rate": 3.196795744956866e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.00017491360217142336, + "loss": 0.0137, "step": 165290 }, { - "epoch": 1.79, - "learning_rate": 3.195174158396575e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017490603447840934, + "loss": 0.011, "step": 165300 }, { - "epoch": 1.79, - "learning_rate": 3.193552571836284e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017489846678539532, + "loss": 0.0081, "step": 165310 }, { - "epoch": 1.79, - "learning_rate": 3.1919309852759936e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017489089909238133, + "loss": 0.0122, "step": 165320 }, { - "epoch": 1.79, - "learning_rate": 3.1903093987157036e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.0001748833313993673, + "loss": 0.0095, "step": 165330 }, { - "epoch": 1.79, - "learning_rate": 3.188687812155413e-05, - "loss": 0.0081, + "epoch": 0.83, + "learning_rate": 0.0001748757637063533, + "loss": 0.0117, "step": 165340 }, { - "epoch": 1.79, - "learning_rate": 3.187066225595122e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.0001748681960133393, + "loss": 0.0125, "step": 165350 }, { - "epoch": 1.79, - "learning_rate": 3.1854446390348314e-05, - "loss": 0.0049, + "epoch": 0.83, + "learning_rate": 0.00017486062832032528, + "loss": 0.0095, "step": 165360 }, { - "epoch": 1.79, - "learning_rate": 3.1838230524745406e-05, - "loss": 0.0089, + "epoch": 0.83, + "learning_rate": 0.00017485306062731126, + "loss": 0.0132, "step": 165370 }, { - "epoch": 1.79, - "learning_rate": 3.1822014659142506e-05, - "loss": 0.0052, + "epoch": 0.83, + "learning_rate": 0.00017484549293429727, + "loss": 0.0103, "step": 165380 }, { - "epoch": 1.79, - "learning_rate": 3.18057987935396e-05, - "loss": 0.0079, + "epoch": 0.83, + "learning_rate": 0.00017483792524128325, + "loss": 0.0107, "step": 165390 }, { - "epoch": 1.79, - "learning_rate": 3.178958292793669e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.00017483035754826924, + "loss": 0.0107, "step": 165400 }, { - "epoch": 1.79, - "learning_rate": 3.1773367062333784e-05, - "loss": 0.005, + "epoch": 0.83, + "learning_rate": 0.00017482278985525522, + "loss": 0.0115, "step": 165410 }, { - "epoch": 1.79, - "learning_rate": 3.175715119673088e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017481522216224123, + "loss": 0.0117, "step": 165420 }, { - "epoch": 1.79, - "learning_rate": 3.174093533112797e-05, - "loss": 0.0078, + "epoch": 0.83, + "learning_rate": 0.0001748076544692272, + "loss": 0.0134, "step": 165430 }, { - "epoch": 1.79, - "learning_rate": 3.172471946552507e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.0001748000867762132, + "loss": 0.0156, "step": 165440 }, { - "epoch": 1.79, - "learning_rate": 3.170850359992216e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.0001747925190831992, + "loss": 0.0152, "step": 165450 }, { - "epoch": 1.79, - "learning_rate": 3.1692287734319255e-05, - "loss": 0.0101, + "epoch": 0.83, + "learning_rate": 0.00017478495139018518, + "loss": 0.0143, "step": 165460 }, { - "epoch": 1.79, - "learning_rate": 3.167607186871635e-05, - "loss": 0.0056, + "epoch": 0.83, + "learning_rate": 0.00017477738369717116, + "loss": 0.0114, "step": 165470 }, { - "epoch": 1.79, - "learning_rate": 3.165985600311344e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017476981600415717, + "loss": 0.0118, "step": 165480 }, { - "epoch": 1.79, - "learning_rate": 3.164364013751054e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017476224831114315, + "loss": 0.0091, "step": 165490 }, { - "epoch": 1.79, - "learning_rate": 3.162742427190763e-05, - "loss": 0.0082, + "epoch": 0.83, + "learning_rate": 0.00017475468061812913, + "loss": 0.0112, "step": 165500 }, { - "epoch": 1.79, - "learning_rate": 3.1611208406304725e-05, - "loss": 0.0101, + "epoch": 0.84, + "learning_rate": 0.00017474711292511514, + "loss": 0.0143, "step": 165510 }, { - "epoch": 1.79, - "learning_rate": 3.159499254070182e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017473954523210112, + "loss": 0.0131, "step": 165520 }, { - "epoch": 1.79, - "learning_rate": 3.157877667509891e-05, - "loss": 0.0059, + "epoch": 0.84, + "learning_rate": 0.0001747319775390871, + "loss": 0.0116, "step": 165530 }, { - "epoch": 1.79, - "learning_rate": 3.156256080949601e-05, - "loss": 0.0059, + "epoch": 0.84, + "learning_rate": 0.0001747244098460731, + "loss": 0.0138, "step": 165540 }, { - "epoch": 1.79, - "learning_rate": 3.15463449438931e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.0001747168421530591, + "loss": 0.0124, "step": 165550 }, { - "epoch": 1.79, - "learning_rate": 3.1530129078290196e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017470927446004507, + "loss": 0.0114, "step": 165560 }, { - "epoch": 1.79, - "learning_rate": 3.151391321268729e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017470170676703106, + "loss": 0.0123, "step": 165570 }, { - "epoch": 1.79, - "learning_rate": 3.149769734708438e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.00017469413907401706, + "loss": 0.0143, "step": 165580 }, { - "epoch": 1.79, - "learning_rate": 3.1481481481481474e-05, - "loss": 0.0048, + "epoch": 0.84, + "learning_rate": 0.00017468657138100305, + "loss": 0.0184, "step": 165590 }, { - "epoch": 1.79, - "learning_rate": 3.1465265615878573e-05, - "loss": 0.0084, + "epoch": 0.84, + "learning_rate": 0.00017467900368798903, + "loss": 0.0129, "step": 165600 }, { - "epoch": 1.79, - "learning_rate": 3.1449049750275666e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017467143599497504, + "loss": 0.012, "step": 165610 }, { - "epoch": 1.79, - "learning_rate": 3.1432833884672766e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017466386830196102, + "loss": 0.0108, "step": 165620 }, { - "epoch": 1.79, - "learning_rate": 3.141661801906986e-05, - "loss": 0.0078, + "epoch": 0.84, + "learning_rate": 0.000174656300608947, + "loss": 0.0095, "step": 165630 }, { - "epoch": 1.79, - "learning_rate": 3.140040215346695e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.000174648732915933, + "loss": 0.0122, "step": 165640 }, { - "epoch": 1.79, - "learning_rate": 3.1384186287864044e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.000174641165222919, + "loss": 0.013, "step": 165650 }, { - "epoch": 1.79, - "learning_rate": 3.136797042226114e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.00017463359752990497, + "loss": 0.0153, "step": 165660 }, { - "epoch": 1.79, - "learning_rate": 3.1351754556658236e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017462602983689098, + "loss": 0.012, "step": 165670 }, { - "epoch": 1.79, - "learning_rate": 3.133553869105533e-05, - "loss": 0.008, + "epoch": 0.84, + "learning_rate": 0.00017461846214387696, + "loss": 0.0134, "step": 165680 }, { - "epoch": 1.79, - "learning_rate": 3.131932282545242e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017461089445086294, + "loss": 0.0123, "step": 165690 }, { - "epoch": 1.79, - "learning_rate": 3.1303106959849514e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017460332675784895, + "loss": 0.0107, "step": 165700 }, { - "epoch": 1.79, - "learning_rate": 3.128689109424661e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017459575906483493, + "loss": 0.012, "step": 165710 }, { - "epoch": 1.79, - "learning_rate": 3.12706752286437e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.0001745881913718209, + "loss": 0.0105, "step": 165720 }, { - "epoch": 1.79, - "learning_rate": 3.12544593630408e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.0001745806236788069, + "loss": 0.0115, "step": 165730 }, { - "epoch": 1.79, - "learning_rate": 3.123824349743789e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.0001745730559857929, + "loss": 0.0161, "step": 165740 }, { - "epoch": 1.79, - "learning_rate": 3.1222027631834985e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017456548829277888, + "loss": 0.0111, "step": 165750 }, { - "epoch": 1.79, - "learning_rate": 3.120581176623208e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.00017455792059976487, + "loss": 0.0125, "step": 165760 }, { - "epoch": 1.79, - "learning_rate": 3.118959590062917e-05, - "loss": 0.0082, + "epoch": 0.84, + "learning_rate": 0.00017455035290675087, + "loss": 0.0112, "step": 165770 }, { - "epoch": 1.79, - "learning_rate": 3.117338003502627e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017454278521373686, + "loss": 0.0128, "step": 165780 }, { - "epoch": 1.79, - "learning_rate": 3.115716416942336e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017453521752072284, + "loss": 0.0127, "step": 165790 }, { - "epoch": 1.79, - "learning_rate": 3.1140948303820455e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017452764982770885, + "loss": 0.012, "step": 165800 }, { - "epoch": 1.79, - "learning_rate": 3.112473243821755e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017452008213469483, + "loss": 0.0095, "step": 165810 }, { - "epoch": 1.79, - "learning_rate": 3.110851657261464e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.0001745125144416808, + "loss": 0.0107, "step": 165820 }, { - "epoch": 1.79, - "learning_rate": 3.109230070701174e-05, - "loss": 0.0051, + "epoch": 0.84, + "learning_rate": 0.00017450494674866682, + "loss": 0.0116, "step": 165830 }, { - "epoch": 1.79, - "learning_rate": 3.107608484140883e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.0001744973790556528, + "loss": 0.0088, "step": 165840 }, { - "epoch": 1.79, - "learning_rate": 3.1059868975805926e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017448981136263878, + "loss": 0.0102, "step": 165850 }, { - "epoch": 1.79, - "learning_rate": 3.104365311020302e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.0001744822436696248, + "loss": 0.01, "step": 165860 }, { - "epoch": 1.79, - "learning_rate": 3.102743724460011e-05, - "loss": 0.0089, + "epoch": 0.84, + "learning_rate": 0.00017447467597661077, + "loss": 0.0103, "step": 165870 }, { - "epoch": 1.79, - "learning_rate": 3.1011221378997204e-05, - "loss": 0.0083, + "epoch": 0.84, + "learning_rate": 0.00017446710828359675, + "loss": 0.0114, "step": 165880 }, { - "epoch": 1.79, - "learning_rate": 3.0995005513394304e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017445954059058276, + "loss": 0.0148, "step": 165890 }, { - "epoch": 1.79, - "learning_rate": 3.0978789647791396e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017445197289756874, + "loss": 0.0133, "step": 165900 }, { - "epoch": 1.79, - "learning_rate": 3.096257378218849e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017444440520455472, + "loss": 0.0115, "step": 165910 }, { - "epoch": 1.79, - "learning_rate": 3.094635791658558e-05, - "loss": 0.0079, + "epoch": 0.84, + "learning_rate": 0.0001744368375115407, + "loss": 0.0105, "step": 165920 }, { - "epoch": 1.79, - "learning_rate": 3.0930142050982675e-05, - "loss": 0.0079, + "epoch": 0.84, + "learning_rate": 0.0001744292698185267, + "loss": 0.0107, "step": 165930 }, { - "epoch": 1.79, - "learning_rate": 3.0913926185379774e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.0001744217021255127, + "loss": 0.0098, "step": 165940 }, { - "epoch": 1.79, - "learning_rate": 3.089771031977687e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017441413443249868, + "loss": 0.0108, "step": 165950 }, { - "epoch": 1.79, - "learning_rate": 3.088149445417396e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017440656673948468, + "loss": 0.0116, "step": 165960 }, { - "epoch": 1.79, - "learning_rate": 3.086527858857105e-05, - "loss": 0.0077, + "epoch": 0.84, + "learning_rate": 0.00017439899904647067, + "loss": 0.01, "step": 165970 }, { - "epoch": 1.79, - "learning_rate": 3.084906272296815e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017439143135345665, + "loss": 0.0128, "step": 165980 }, { - "epoch": 1.79, - "learning_rate": 3.0832846857365245e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017438386366044266, + "loss": 0.0129, "step": 165990 }, { - "epoch": 1.79, - "learning_rate": 3.081663099176234e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017437629596742864, + "loss": 0.0114, "step": 166000 }, { - "epoch": 1.79, - "eval_cer": 0.9215173798765541, - "eval_loss": 0.005517047364264727, - "eval_runtime": 121.2305, - "eval_samples_per_second": 16.497, - "eval_steps_per_second": 4.124, + "epoch": 0.84, + "eval_cer": 0.9144508479806542, + "eval_loss": 0.008648986928164959, + "eval_runtime": 116.5926, + "eval_samples_per_second": 17.154, + "eval_steps_per_second": 4.288, "step": 166000 }, { - "epoch": 1.79, - "learning_rate": 3.080041512615943e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017436872827441462, + "loss": 0.0157, "step": 166010 }, { - "epoch": 1.79, - "learning_rate": 3.078419926055653e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017436116058140063, + "loss": 0.0134, "step": 166020 }, { - "epoch": 1.79, - "learning_rate": 3.076798339495362e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.0001743535928883866, + "loss": 0.0149, "step": 166030 }, { - "epoch": 1.79, - "learning_rate": 3.0751767529350715e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.0001743460251953726, + "loss": 0.0105, "step": 166040 }, { - "epoch": 1.8, - "learning_rate": 3.073555166374781e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.0001743384575023586, + "loss": 0.0075, "step": 166050 }, { - "epoch": 1.8, - "learning_rate": 3.07193357981449e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017433088980934458, + "loss": 0.0124, "step": 166060 }, { - "epoch": 1.8, - "learning_rate": 3.0703119932542e-05, - "loss": 0.008, + "epoch": 0.84, + "learning_rate": 0.00017432332211633056, + "loss": 0.011, "step": 166070 }, { - "epoch": 1.8, - "learning_rate": 3.068690406693909e-05, - "loss": 0.0082, + "epoch": 0.84, + "learning_rate": 0.00017431575442331654, + "loss": 0.0146, "step": 166080 }, { - "epoch": 1.8, - "learning_rate": 3.0670688201336186e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017430818673030255, + "loss": 0.0113, "step": 166090 }, { - "epoch": 1.8, - "learning_rate": 3.065447233573328e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017430061903728853, + "loss": 0.0151, "step": 166100 }, { - "epoch": 1.8, - "learning_rate": 3.063825647013037e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.00017429305134427451, + "loss": 0.0094, "step": 166110 }, { - "epoch": 1.8, - "learning_rate": 3.062204060452747e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017428548365126052, + "loss": 0.0113, "step": 166120 }, { - "epoch": 1.8, - "learning_rate": 3.0605824738924563e-05, - "loss": 0.0092, + "epoch": 0.84, + "learning_rate": 0.0001742779159582465, + "loss": 0.0137, "step": 166130 }, { - "epoch": 1.8, - "learning_rate": 3.0589608873321656e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017427034826523249, + "loss": 0.0128, "step": 166140 }, { - "epoch": 1.8, - "learning_rate": 3.057339300771875e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.0001742627805722185, + "loss": 0.0154, "step": 166150 }, { - "epoch": 1.8, - "learning_rate": 3.055717714211584e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017425521287920448, + "loss": 0.013, "step": 166160 }, { - "epoch": 1.8, - "learning_rate": 3.0540961276512934e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017424764518619046, + "loss": 0.0152, "step": 166170 }, { - "epoch": 1.8, - "learning_rate": 3.0524745410910034e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.00017424007749317647, + "loss": 0.0132, "step": 166180 }, { - "epoch": 1.8, - "learning_rate": 3.0508529545307127e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017423250980016245, + "loss": 0.0114, "step": 166190 }, { - "epoch": 1.8, - "learning_rate": 3.049231367970422e-05, - "loss": 0.0096, + "epoch": 0.84, + "learning_rate": 0.00017422494210714843, + "loss": 0.0114, "step": 166200 }, { - "epoch": 1.8, - "learning_rate": 3.0476097814101312e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017421737441413444, + "loss": 0.0129, "step": 166210 }, { - "epoch": 1.8, - "learning_rate": 3.0459881948498408e-05, - "loss": 0.009, + "epoch": 0.84, + "learning_rate": 0.00017420980672112042, + "loss": 0.0129, "step": 166220 }, { - "epoch": 1.8, - "learning_rate": 3.04436660828955e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.0001742022390281064, + "loss": 0.0094, "step": 166230 }, { - "epoch": 1.8, - "learning_rate": 3.0427450217292597e-05, - "loss": 0.0083, + "epoch": 0.84, + "learning_rate": 0.00017419467133509238, + "loss": 0.0112, "step": 166240 }, { - "epoch": 1.8, - "learning_rate": 3.041123435168969e-05, - "loss": 0.0051, + "epoch": 0.84, + "learning_rate": 0.0001741871036420784, + "loss": 0.0107, "step": 166250 }, { - "epoch": 1.8, - "learning_rate": 3.0395018486086783e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.00017417953594906437, + "loss": 0.0133, "step": 166260 }, { - "epoch": 1.8, - "learning_rate": 3.037880262048388e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017417196825605035, + "loss": 0.0128, "step": 166270 }, { - "epoch": 1.8, - "learning_rate": 3.036258675488097e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.00017416440056303636, + "loss": 0.0112, "step": 166280 }, { - "epoch": 1.8, - "learning_rate": 3.0346370889278064e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017415683287002234, + "loss": 0.013, "step": 166290 }, { - "epoch": 1.8, - "learning_rate": 3.033015502367516e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017414926517700832, + "loss": 0.0125, "step": 166300 }, { - "epoch": 1.8, - "learning_rate": 3.0313939158072253e-05, - "loss": 0.0082, + "epoch": 0.84, + "learning_rate": 0.00017414169748399433, + "loss": 0.0129, "step": 166310 }, { - "epoch": 1.8, - "learning_rate": 3.0297723292469346e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.00017413412979098031, + "loss": 0.0122, "step": 166320 }, { - "epoch": 1.8, - "learning_rate": 3.0281507426866442e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.0001741265620979663, + "loss": 0.0102, "step": 166330 }, { - "epoch": 1.8, - "learning_rate": 3.0265291561263538e-05, - "loss": 0.0055, + "epoch": 0.84, + "learning_rate": 0.0001741189944049523, + "loss": 0.0123, "step": 166340 }, { - "epoch": 1.8, - "learning_rate": 3.0249075695660634e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017411142671193829, + "loss": 0.0116, "step": 166350 }, { - "epoch": 1.8, - "learning_rate": 3.0232859830057727e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017410385901892427, + "loss": 0.0143, "step": 166360 }, { - "epoch": 1.8, - "learning_rate": 3.0216643964454823e-05, - "loss": 0.0078, + "epoch": 0.84, + "learning_rate": 0.00017409629132591028, + "loss": 0.0112, "step": 166370 }, { - "epoch": 1.8, - "learning_rate": 3.0200428098851916e-05, - "loss": 0.005, + "epoch": 0.84, + "learning_rate": 0.00017408872363289626, + "loss": 0.0116, "step": 166380 }, { - "epoch": 1.8, - "learning_rate": 3.018421223324901e-05, - "loss": 0.0086, + "epoch": 0.84, + "learning_rate": 0.00017408115593988224, + "loss": 0.0101, "step": 166390 }, { - "epoch": 1.8, - "learning_rate": 3.0167996367646105e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017407358824686825, + "loss": 0.0112, "step": 166400 }, { - "epoch": 1.8, - "learning_rate": 3.0151780502043198e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.00017406602055385423, + "loss": 0.0138, "step": 166410 }, { - "epoch": 1.8, - "learning_rate": 3.013556463644029e-05, - "loss": 0.0048, + "epoch": 0.84, + "learning_rate": 0.0001740584528608402, + "loss": 0.0123, "step": 166420 }, { - "epoch": 1.8, - "learning_rate": 3.0119348770837386e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.0001740508851678262, + "loss": 0.0136, "step": 166430 }, { - "epoch": 1.8, - "learning_rate": 3.010313290523448e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.0001740433174748122, + "loss": 0.0097, "step": 166440 }, { - "epoch": 1.8, - "learning_rate": 3.0086917039631575e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017403574978179818, + "loss": 0.012, "step": 166450 }, { - "epoch": 1.8, - "learning_rate": 3.0070701174028668e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.00017402818208878416, + "loss": 0.0113, "step": 166460 }, { - "epoch": 1.8, - "learning_rate": 3.005448530842576e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017402061439577017, + "loss": 0.0106, "step": 166470 }, { - "epoch": 1.8, - "learning_rate": 3.0038269442822857e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017401304670275615, + "loss": 0.0121, "step": 166480 }, { - "epoch": 1.8, - "learning_rate": 3.002205357721995e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017400547900974213, + "loss": 0.012, "step": 166490 }, { - "epoch": 1.8, - "learning_rate": 3.0005837711617042e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017399791131672814, + "loss": 0.0156, "step": 166500 }, { - "epoch": 1.8, - "learning_rate": 2.998962184601414e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017399034362371412, + "loss": 0.0114, "step": 166510 }, { - "epoch": 1.8, - "learning_rate": 2.997340598041123e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.0001739827759307001, + "loss": 0.0105, "step": 166520 }, { - "epoch": 1.8, - "learning_rate": 2.9957190114808327e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017397520823768611, + "loss": 0.011, "step": 166530 }, { - "epoch": 1.8, - "learning_rate": 2.994097424920542e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017396764054467207, + "loss": 0.0108, "step": 166540 }, { - "epoch": 1.8, - "learning_rate": 2.9924758383602513e-05, - "loss": 0.0089, + "epoch": 0.84, + "learning_rate": 0.00017396007285165805, + "loss": 0.0133, "step": 166550 }, { - "epoch": 1.8, - "learning_rate": 2.990854251799961e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017395250515864403, + "loss": 0.0113, "step": 166560 }, { - "epoch": 1.8, - "learning_rate": 2.9892326652396702e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017394493746563004, + "loss": 0.0152, "step": 166570 }, { - "epoch": 1.8, - "learning_rate": 2.9876110786793794e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017393736977261602, + "loss": 0.0163, "step": 166580 }, { - "epoch": 1.8, - "learning_rate": 2.985989492119089e-05, - "loss": 0.0059, + "epoch": 0.84, + "learning_rate": 0.000173929802079602, + "loss": 0.0113, "step": 166590 }, { - "epoch": 1.8, - "learning_rate": 2.9843679055587983e-05, - "loss": 0.0088, + "epoch": 0.84, + "learning_rate": 0.000173922234386588, + "loss": 0.0157, "step": 166600 }, { - "epoch": 1.8, - "learning_rate": 2.9827463189985076e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.000173914666693574, + "loss": 0.0118, "step": 166610 }, { - "epoch": 1.8, - "learning_rate": 2.9811247324382172e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017390709900055997, + "loss": 0.016, "step": 166620 }, { - "epoch": 1.8, - "learning_rate": 2.9795031458779265e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017389953130754596, + "loss": 0.0121, "step": 166630 }, { - "epoch": 1.8, - "learning_rate": 2.977881559317636e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017389196361453196, + "loss": 0.0125, "step": 166640 }, { - "epoch": 1.8, - "learning_rate": 2.9762599727573454e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.00017388439592151795, + "loss": 0.0123, "step": 166650 }, { - "epoch": 1.8, - "learning_rate": 2.9746383861970547e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.00017387682822850393, + "loss": 0.0106, "step": 166660 }, { - "epoch": 1.8, - "learning_rate": 2.9730167996367643e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.00017386926053548994, + "loss": 0.0118, "step": 166670 }, { - "epoch": 1.8, - "learning_rate": 2.9713952130764735e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.00017386169284247592, + "loss": 0.0119, "step": 166680 }, { - "epoch": 1.8, - "learning_rate": 2.9697736265161828e-05, - "loss": 0.0048, + "epoch": 0.84, + "learning_rate": 0.0001738541251494619, + "loss": 0.0081, "step": 166690 }, { - "epoch": 1.8, - "learning_rate": 2.9681520399558928e-05, - "loss": 0.0059, + "epoch": 0.84, + "learning_rate": 0.0001738465574564479, + "loss": 0.0124, "step": 166700 }, { - "epoch": 1.8, - "learning_rate": 2.966530453395602e-05, - "loss": 0.0059, + "epoch": 0.84, + "learning_rate": 0.0001738389897634339, + "loss": 0.0149, "step": 166710 }, { - "epoch": 1.8, - "learning_rate": 2.9649088668353117e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.00017383142207041987, + "loss": 0.0119, "step": 166720 }, { - "epoch": 1.8, - "learning_rate": 2.963287280275021e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017382385437740588, + "loss": 0.0129, "step": 166730 }, { - "epoch": 1.8, - "learning_rate": 2.9616656937147305e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017381628668439186, + "loss": 0.0107, "step": 166740 }, { - "epoch": 1.8, - "learning_rate": 2.9600441071544398e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017380871899137784, + "loss": 0.0131, "step": 166750 }, { - "epoch": 1.8, - "learning_rate": 2.958422520594149e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017380115129836385, + "loss": 0.0118, "step": 166760 }, { - "epoch": 1.8, - "learning_rate": 2.9568009340338587e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017379358360534983, + "loss": 0.0103, "step": 166770 }, { - "epoch": 1.8, - "learning_rate": 2.955179347473568e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.0001737860159123358, + "loss": 0.0115, "step": 166780 }, { - "epoch": 1.8, - "learning_rate": 2.9535577609132773e-05, - "loss": 0.0094, + "epoch": 0.84, + "learning_rate": 0.00017377844821932182, + "loss": 0.0114, "step": 166790 }, { - "epoch": 1.8, - "learning_rate": 2.951936174352987e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.0001737708805263078, + "loss": 0.0098, "step": 166800 }, { - "epoch": 1.8, - "learning_rate": 2.950314587792696e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017376331283329378, + "loss": 0.0121, "step": 166810 }, { - "epoch": 1.8, - "learning_rate": 2.9486930012324058e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.00017375574514027977, + "loss": 0.0119, "step": 166820 }, { - "epoch": 1.8, - "learning_rate": 2.947071414672115e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017374817744726577, + "loss": 0.0106, "step": 166830 }, { - "epoch": 1.8, - "learning_rate": 2.9454498281118243e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017374060975425176, + "loss": 0.0118, "step": 166840 }, { - "epoch": 1.8, - "learning_rate": 2.943828241551534e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017373304206123774, + "loss": 0.0119, "step": 166850 }, { - "epoch": 1.8, - "learning_rate": 2.9422066549912432e-05, - "loss": 0.0083, + "epoch": 0.84, + "learning_rate": 0.00017372547436822375, + "loss": 0.0102, "step": 166860 }, { - "epoch": 1.8, - "learning_rate": 2.9405850684309525e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017371790667520973, + "loss": 0.0139, "step": 166870 }, { - "epoch": 1.8, - "learning_rate": 2.938963481870662e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.0001737103389821957, + "loss": 0.0119, "step": 166880 }, { - "epoch": 1.8, - "learning_rate": 2.9373418953103714e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017370277128918172, + "loss": 0.0108, "step": 166890 }, { - "epoch": 1.8, - "learning_rate": 2.9357203087500806e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.0001736952035961677, + "loss": 0.0122, "step": 166900 }, { - "epoch": 1.8, - "learning_rate": 2.9340987221897902e-05, - "loss": 0.0093, + "epoch": 0.84, + "learning_rate": 0.00017368763590315368, + "loss": 0.0102, "step": 166910 }, { - "epoch": 1.8, - "learning_rate": 2.9324771356294995e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.0001736800682101397, + "loss": 0.0112, "step": 166920 }, { - "epoch": 1.8, - "learning_rate": 2.930855549069209e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.00017367250051712567, + "loss": 0.01, "step": 166930 }, { - "epoch": 1.8, - "learning_rate": 2.9292339625089184e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017366493282411165, + "loss": 0.0123, "step": 166940 }, { - "epoch": 1.8, - "learning_rate": 2.9276123759486277e-05, - "loss": 0.0047, + "epoch": 0.84, + "learning_rate": 0.00017365736513109766, + "loss": 0.0113, "step": 166950 }, { - "epoch": 1.8, - "learning_rate": 2.9259907893883373e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.00017364979743808364, + "loss": 0.0096, "step": 166960 }, { - "epoch": 1.81, - "learning_rate": 2.9243692028280466e-05, - "loss": 0.0055, + "epoch": 0.84, + "learning_rate": 0.00017364222974506962, + "loss": 0.0096, "step": 166970 }, { - "epoch": 1.81, - "learning_rate": 2.922747616267756e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.0001736346620520556, + "loss": 0.0114, "step": 166980 }, { - "epoch": 1.81, - "learning_rate": 2.9211260297074655e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.0001736270943590416, + "loss": 0.0108, "step": 166990 }, { - "epoch": 1.81, - "learning_rate": 2.9195044431471747e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.0001736195266660276, + "loss": 0.0144, "step": 167000 }, { - "epoch": 1.81, - "eval_cer": 0.9215278031120306, - "eval_loss": 0.0055626993998885155, - "eval_runtime": 121.1369, - "eval_samples_per_second": 16.51, - "eval_steps_per_second": 4.128, + "epoch": 0.84, + "eval_cer": 0.9144906342217957, + "eval_loss": 0.008696102537214756, + "eval_runtime": 116.717, + "eval_samples_per_second": 17.135, + "eval_steps_per_second": 4.284, "step": 167000 }, { - "epoch": 1.81, - "learning_rate": 2.9178828565868843e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017361195897301358, + "loss": 0.0094, "step": 167010 }, { - "epoch": 1.81, - "learning_rate": 2.9162612700265936e-05, - "loss": 0.008, + "epoch": 0.84, + "learning_rate": 0.00017360439127999958, + "loss": 0.0124, "step": 167020 }, { - "epoch": 1.81, - "learning_rate": 2.914639683466303e-05, - "loss": 0.0051, + "epoch": 0.84, + "learning_rate": 0.00017359682358698557, + "loss": 0.0132, "step": 167030 }, { - "epoch": 1.81, - "learning_rate": 2.9130180969060125e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017358925589397155, + "loss": 0.01, "step": 167040 }, { - "epoch": 1.81, - "learning_rate": 2.9113965103457218e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017358168820095756, + "loss": 0.0132, "step": 167050 }, { - "epoch": 1.81, - "learning_rate": 2.9097749237854317e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017357412050794354, + "loss": 0.0123, "step": 167060 }, { - "epoch": 1.81, - "learning_rate": 2.908153337225141e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017356655281492952, + "loss": 0.0114, "step": 167070 }, { - "epoch": 1.81, - "learning_rate": 2.9065317506648503e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017355898512191553, + "loss": 0.0145, "step": 167080 }, { - "epoch": 1.81, - "learning_rate": 2.90491016410456e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.0001735514174289015, + "loss": 0.01, "step": 167090 }, { - "epoch": 1.81, - "learning_rate": 2.903288577544269e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.0001735438497358875, + "loss": 0.0122, "step": 167100 }, { - "epoch": 1.81, - "learning_rate": 2.9016669909839788e-05, - "loss": 0.0046, + "epoch": 0.84, + "learning_rate": 0.0001735362820428735, + "loss": 0.0117, "step": 167110 }, { - "epoch": 1.81, - "learning_rate": 2.900045404423688e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017352871434985948, + "loss": 0.0097, "step": 167120 }, { - "epoch": 1.81, - "learning_rate": 2.8984238178633973e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017352114665684546, + "loss": 0.013, "step": 167130 }, { - "epoch": 1.81, - "learning_rate": 2.896802231303107e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017351357896383144, + "loss": 0.0112, "step": 167140 }, { - "epoch": 1.81, - "learning_rate": 2.8951806447428162e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017350601127081745, + "loss": 0.0142, "step": 167150 }, { - "epoch": 1.81, - "learning_rate": 2.8935590581825255e-05, - "loss": 0.0049, + "epoch": 0.84, + "learning_rate": 0.00017349844357780343, + "loss": 0.0128, "step": 167160 }, { - "epoch": 1.81, - "learning_rate": 2.891937471622235e-05, - "loss": 0.009, + "epoch": 0.84, + "learning_rate": 0.00017349087588478941, + "loss": 0.0121, "step": 167170 }, { - "epoch": 1.81, - "learning_rate": 2.8903158850619444e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.00017348330819177542, + "loss": 0.0113, "step": 167180 }, { - "epoch": 1.81, - "learning_rate": 2.8886942985016537e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.0001734757404987614, + "loss": 0.0109, "step": 167190 }, { - "epoch": 1.81, - "learning_rate": 2.8870727119413633e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017346817280574739, + "loss": 0.0136, "step": 167200 }, { - "epoch": 1.81, - "learning_rate": 2.8854511253810725e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.0001734606051127334, + "loss": 0.0099, "step": 167210 }, { - "epoch": 1.81, - "learning_rate": 2.883829538820782e-05, - "loss": 0.0079, + "epoch": 0.84, + "learning_rate": 0.00017345303741971938, + "loss": 0.0107, "step": 167220 }, { - "epoch": 1.81, - "learning_rate": 2.8822079522604914e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.00017344546972670536, + "loss": 0.0121, "step": 167230 }, { - "epoch": 1.81, - "learning_rate": 2.8805863657002007e-05, - "loss": 0.0079, + "epoch": 0.84, + "learning_rate": 0.00017343790203369137, + "loss": 0.011, "step": 167240 }, { - "epoch": 1.81, - "learning_rate": 2.8789647791399103e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017343033434067735, + "loss": 0.0119, "step": 167250 }, { - "epoch": 1.81, - "learning_rate": 2.8773431925796196e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017342276664766333, + "loss": 0.0121, "step": 167260 }, { - "epoch": 1.81, - "learning_rate": 2.875721606019329e-05, - "loss": 0.0091, + "epoch": 0.84, + "learning_rate": 0.00017341519895464934, + "loss": 0.0112, "step": 167270 }, { - "epoch": 1.81, - "learning_rate": 2.8741000194590385e-05, - "loss": 0.005, + "epoch": 0.84, + "learning_rate": 0.00017340763126163532, + "loss": 0.0117, "step": 167280 }, { - "epoch": 1.81, - "learning_rate": 2.8724784328987478e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.0001734000635686213, + "loss": 0.012, "step": 167290 }, { - "epoch": 1.81, - "learning_rate": 2.8708568463384574e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.0001733924958756073, + "loss": 0.0103, "step": 167300 }, { - "epoch": 1.81, - "learning_rate": 2.8692352597781666e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.0001733849281825933, + "loss": 0.0111, "step": 167310 }, { - "epoch": 1.81, - "learning_rate": 2.867613673217876e-05, - "loss": 0.0055, + "epoch": 0.84, + "learning_rate": 0.00017337736048957927, + "loss": 0.0115, "step": 167320 }, { - "epoch": 1.81, - "learning_rate": 2.8659920866575855e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.00017336979279656525, + "loss": 0.0086, "step": 167330 }, { - "epoch": 1.81, - "learning_rate": 2.8643705000972948e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017336222510355126, + "loss": 0.0151, "step": 167340 }, { - "epoch": 1.81, - "learning_rate": 2.862748913537004e-05, - "loss": 0.0087, + "epoch": 0.84, + "learning_rate": 0.00017335465741053724, + "loss": 0.0096, "step": 167350 }, { - "epoch": 1.81, - "learning_rate": 2.8611273269767137e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017334708971752322, + "loss": 0.0109, "step": 167360 }, { - "epoch": 1.81, - "learning_rate": 2.859505740416423e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.00017333952202450923, + "loss": 0.0148, "step": 167370 }, { - "epoch": 1.81, - "learning_rate": 2.8578841538561326e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017333195433149521, + "loss": 0.013, "step": 167380 }, { - "epoch": 1.81, - "learning_rate": 2.856262567295842e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.0001733243866384812, + "loss": 0.0121, "step": 167390 }, { - "epoch": 1.81, - "learning_rate": 2.854640980735551e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.0001733168189454672, + "loss": 0.0105, "step": 167400 }, { - "epoch": 1.81, - "learning_rate": 2.8530193941752607e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.00017330925125245319, + "loss": 0.0123, "step": 167410 }, { - "epoch": 1.81, - "learning_rate": 2.8513978076149704e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017330168355943917, + "loss": 0.0119, "step": 167420 }, { - "epoch": 1.81, - "learning_rate": 2.84977622105468e-05, - "loss": 0.0087, + "epoch": 0.84, + "learning_rate": 0.00017329411586642518, + "loss": 0.0118, "step": 167430 }, { - "epoch": 1.81, - "learning_rate": 2.8481546344943892e-05, - "loss": 0.0084, + "epoch": 0.84, + "learning_rate": 0.00017328654817341116, + "loss": 0.0103, "step": 167440 }, { - "epoch": 1.81, - "learning_rate": 2.8465330479340985e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017327898048039714, + "loss": 0.0102, "step": 167450 }, { - "epoch": 1.81, - "learning_rate": 2.844911461373808e-05, - "loss": 0.0078, + "epoch": 0.84, + "learning_rate": 0.00017327141278738315, + "loss": 0.0108, "step": 167460 }, { - "epoch": 1.81, - "learning_rate": 2.8432898748135174e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.00017326384509436913, + "loss": 0.0096, "step": 167470 }, { - "epoch": 1.81, - "learning_rate": 2.841668288253227e-05, - "loss": 0.0086, + "epoch": 0.84, + "learning_rate": 0.0001732562774013551, + "loss": 0.0141, "step": 167480 }, { - "epoch": 1.81, - "learning_rate": 2.8400467016929363e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.0001732487097083411, + "loss": 0.0153, "step": 167490 }, { - "epoch": 1.81, - "learning_rate": 2.8384251151326456e-05, - "loss": 0.0046, + "epoch": 0.85, + "learning_rate": 0.0001732411420153271, + "loss": 0.0126, "step": 167500 }, { - "epoch": 1.81, - "learning_rate": 2.8368035285723552e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017323357432231308, + "loss": 0.0137, "step": 167510 }, { - "epoch": 1.81, - "learning_rate": 2.8351819420120644e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.00017322600662929906, + "loss": 0.015, "step": 167520 }, { - "epoch": 1.81, - "learning_rate": 2.8335603554517737e-05, - "loss": 0.0049, + "epoch": 0.85, + "learning_rate": 0.00017321843893628507, + "loss": 0.0118, "step": 167530 }, { - "epoch": 1.81, - "learning_rate": 2.8319387688914833e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017321087124327105, + "loss": 0.0108, "step": 167540 }, { - "epoch": 1.81, - "learning_rate": 2.8303171823311926e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.00017320330355025703, + "loss": 0.0101, "step": 167550 }, { - "epoch": 1.81, - "learning_rate": 2.828695595770902e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017319573585724304, + "loss": 0.0102, "step": 167560 }, { - "epoch": 1.81, - "learning_rate": 2.8270740092106115e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017318816816422902, + "loss": 0.0129, "step": 167570 }, { - "epoch": 1.81, - "learning_rate": 2.8254524226503208e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.000173180600471215, + "loss": 0.0145, "step": 167580 }, { - "epoch": 1.81, - "learning_rate": 2.8238308360900304e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017317303277820101, + "loss": 0.012, "step": 167590 }, { - "epoch": 1.81, - "learning_rate": 2.8222092495297397e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.000173165465085187, + "loss": 0.0163, "step": 167600 }, { - "epoch": 1.81, - "learning_rate": 2.820587662969449e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.00017315789739217298, + "loss": 0.0091, "step": 167610 }, { - "epoch": 1.81, - "learning_rate": 2.8189660764091585e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017315032969915899, + "loss": 0.0127, "step": 167620 }, { - "epoch": 1.81, - "learning_rate": 2.8173444898488678e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017314276200614497, + "loss": 0.0114, "step": 167630 }, { - "epoch": 1.81, - "learning_rate": 2.815722903288577e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.00017313519431313095, + "loss": 0.0142, "step": 167640 }, { - "epoch": 1.81, - "learning_rate": 2.8141013167282867e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017312762662011693, + "loss": 0.0122, "step": 167650 }, { - "epoch": 1.81, - "learning_rate": 2.812479730167996e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.00017312005892710294, + "loss": 0.011, "step": 167660 }, { - "epoch": 1.81, - "learning_rate": 2.8108581436077056e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.00017311249123408892, + "loss": 0.0138, "step": 167670 }, { - "epoch": 1.81, - "learning_rate": 2.809236557047415e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.0001731049235410749, + "loss": 0.014, "step": 167680 }, { - "epoch": 1.81, - "learning_rate": 2.807614970487124e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.0001730973558480609, + "loss": 0.0115, "step": 167690 }, { - "epoch": 1.81, - "learning_rate": 2.8059933839268338e-05, - "loss": 0.0095, + "epoch": 0.85, + "learning_rate": 0.0001730897881550469, + "loss": 0.0123, "step": 167700 }, { - "epoch": 1.81, - "learning_rate": 2.804371797366543e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017308222046203287, + "loss": 0.0152, "step": 167710 }, { - "epoch": 1.81, - "learning_rate": 2.8027502108062523e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017307465276901888, + "loss": 0.0124, "step": 167720 }, { - "epoch": 1.81, - "learning_rate": 2.801128624245962e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017306708507600486, + "loss": 0.0114, "step": 167730 }, { - "epoch": 1.81, - "learning_rate": 2.7995070376856712e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017305951738299084, + "loss": 0.0119, "step": 167740 }, { - "epoch": 1.81, - "learning_rate": 2.7978854511253808e-05, - "loss": 0.0047, + "epoch": 0.85, + "learning_rate": 0.00017305194968997685, + "loss": 0.0122, "step": 167750 }, { - "epoch": 1.81, - "learning_rate": 2.79626386456509e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017304438199696283, + "loss": 0.0202, "step": 167760 }, { - "epoch": 1.81, - "learning_rate": 2.7946422780047994e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017303681430394882, + "loss": 0.012, "step": 167770 }, { - "epoch": 1.81, - "learning_rate": 2.7930206914445093e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017302924661093482, + "loss": 0.0115, "step": 167780 }, { - "epoch": 1.81, - "learning_rate": 2.7913991048842186e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.0001730216789179208, + "loss": 0.011, "step": 167790 }, { - "epoch": 1.81, - "learning_rate": 2.7897775183239282e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.00017301411122490676, + "loss": 0.0136, "step": 167800 }, { - "epoch": 1.81, - "learning_rate": 2.7881559317636375e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.00017300654353189274, + "loss": 0.012, "step": 167810 }, { - "epoch": 1.81, - "learning_rate": 2.7865343452033467e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.00017299897583887875, + "loss": 0.0144, "step": 167820 }, { - "epoch": 1.81, - "learning_rate": 2.7849127586430564e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017299140814586473, + "loss": 0.0135, "step": 167830 }, { - "epoch": 1.81, - "learning_rate": 2.7832911720827656e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.00017298384045285071, + "loss": 0.0133, "step": 167840 }, { - "epoch": 1.81, - "learning_rate": 2.781669585522475e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017297627275983672, + "loss": 0.012, "step": 167850 }, { - "epoch": 1.81, - "learning_rate": 2.7800479989621845e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.0001729687050668227, + "loss": 0.0126, "step": 167860 }, { - "epoch": 1.81, - "learning_rate": 2.7784264124018938e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017296113737380869, + "loss": 0.0136, "step": 167870 }, { - "epoch": 1.81, - "learning_rate": 2.7768048258416034e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017295356968079467, + "loss": 0.0127, "step": 167880 }, { - "epoch": 1.81, - "learning_rate": 2.7751832392813127e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017294600198778067, + "loss": 0.0127, "step": 167890 }, { - "epoch": 1.82, - "learning_rate": 2.773561652721022e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.00017293843429476666, + "loss": 0.0118, "step": 167900 }, { - "epoch": 1.82, - "learning_rate": 2.7719400661607316e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017293086660175264, + "loss": 0.0123, "step": 167910 }, { - "epoch": 1.82, - "learning_rate": 2.770318479600441e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017292329890873865, + "loss": 0.0128, "step": 167920 }, { - "epoch": 1.82, - "learning_rate": 2.76869689304015e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.00017291573121572463, + "loss": 0.0128, "step": 167930 }, { - "epoch": 1.82, - "learning_rate": 2.7670753064798597e-05, - "loss": 0.0044, + "epoch": 0.85, + "learning_rate": 0.0001729081635227106, + "loss": 0.0138, "step": 167940 }, { - "epoch": 1.82, - "learning_rate": 2.765453719919569e-05, - "loss": 0.0099, + "epoch": 0.85, + "learning_rate": 0.00017290059582969662, + "loss": 0.0138, "step": 167950 }, { - "epoch": 1.82, - "learning_rate": 2.7638321333592786e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.0001728930281366826, + "loss": 0.0106, "step": 167960 }, { - "epoch": 1.82, - "learning_rate": 2.762210546798988e-05, - "loss": 0.0044, + "epoch": 0.85, + "learning_rate": 0.00017288546044366858, + "loss": 0.0127, "step": 167970 }, { - "epoch": 1.82, - "learning_rate": 2.760588960238697e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.0001728778927506546, + "loss": 0.0111, "step": 167980 }, { - "epoch": 1.82, - "learning_rate": 2.7589673736784068e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.00017287032505764057, + "loss": 0.0111, "step": 167990 }, { - "epoch": 1.82, - "learning_rate": 2.757345787118116e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017286275736462655, + "loss": 0.012, "step": 168000 }, { - "epoch": 1.82, - "eval_cer": 0.9215182484795105, - "eval_loss": 0.005569620057940483, - "eval_runtime": 121.2406, - "eval_samples_per_second": 16.496, - "eval_steps_per_second": 4.124, + "epoch": 0.85, + "eval_cer": 0.9144615223380336, + "eval_loss": 0.008770990185439587, + "eval_runtime": 116.7217, + "eval_samples_per_second": 17.135, + "eval_steps_per_second": 4.284, "step": 168000 }, { - "epoch": 1.82, - "learning_rate": 2.7557242005578253e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017285518967161256, + "loss": 0.0147, "step": 168010 }, { - "epoch": 1.82, - "learning_rate": 2.754102613997535e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.00017284762197859854, + "loss": 0.0125, "step": 168020 }, { - "epoch": 1.82, - "learning_rate": 2.7524810274372442e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017284005428558452, + "loss": 0.012, "step": 168030 }, { - "epoch": 1.82, - "learning_rate": 2.7508594408769538e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.0001728324865925705, + "loss": 0.0086, "step": 168040 }, { - "epoch": 1.82, - "learning_rate": 2.749237854316663e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.00017282491889955651, + "loss": 0.0135, "step": 168050 }, { - "epoch": 1.82, - "learning_rate": 2.7476162677563724e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.0001728173512065425, + "loss": 0.0141, "step": 168060 }, { - "epoch": 1.82, - "learning_rate": 2.745994681196082e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017280978351352848, + "loss": 0.0135, "step": 168070 }, { - "epoch": 1.82, - "learning_rate": 2.7443730946357913e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.00017280221582051449, + "loss": 0.0137, "step": 168080 }, { - "epoch": 1.82, - "learning_rate": 2.7427515080755005e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.00017279464812750047, + "loss": 0.01, "step": 168090 }, { - "epoch": 1.82, - "learning_rate": 2.74112992151521e-05, - "loss": 0.0093, + "epoch": 0.85, + "learning_rate": 0.00017278708043448645, + "loss": 0.0123, "step": 168100 }, { - "epoch": 1.82, - "learning_rate": 2.7395083349549194e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017277951274147246, + "loss": 0.013, "step": 168110 }, { - "epoch": 1.82, - "learning_rate": 2.737886748394629e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.00017277194504845844, + "loss": 0.01, "step": 168120 }, { - "epoch": 1.82, - "learning_rate": 2.7362651618343383e-05, - "loss": 0.0112, + "epoch": 0.85, + "learning_rate": 0.00017276437735544442, + "loss": 0.0123, "step": 168130 }, { - "epoch": 1.82, - "learning_rate": 2.734643575274048e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017275680966243043, + "loss": 0.0131, "step": 168140 }, { - "epoch": 1.82, - "learning_rate": 2.7330219887137575e-05, - "loss": 0.0046, + "epoch": 0.85, + "learning_rate": 0.0001727492419694164, + "loss": 0.01, "step": 168150 }, { - "epoch": 1.82, - "learning_rate": 2.7314004021534668e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.0001727416742764024, + "loss": 0.0154, "step": 168160 }, { - "epoch": 1.82, - "learning_rate": 2.7297788155931764e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.0001727341065833884, + "loss": 0.0103, "step": 168170 }, { - "epoch": 1.82, - "learning_rate": 2.7281572290328857e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.00017272653889037438, + "loss": 0.0105, "step": 168180 }, { - "epoch": 1.82, - "learning_rate": 2.726535642472595e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.00017271897119736036, + "loss": 0.0125, "step": 168190 }, { - "epoch": 1.82, - "learning_rate": 2.7249140559123046e-05, - "loss": 0.0077, + "epoch": 0.85, + "learning_rate": 0.00017271140350434637, + "loss": 0.0122, "step": 168200 }, { - "epoch": 1.82, - "learning_rate": 2.723292469352014e-05, - "loss": 0.0049, + "epoch": 0.85, + "learning_rate": 0.00017270383581133235, + "loss": 0.0112, "step": 168210 }, { - "epoch": 1.82, - "learning_rate": 2.721670882791723e-05, - "loss": 0.0081, + "epoch": 0.85, + "learning_rate": 0.00017269626811831833, + "loss": 0.0126, "step": 168220 }, { - "epoch": 1.82, - "learning_rate": 2.7200492962314328e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.00017268870042530432, + "loss": 0.0117, "step": 168230 }, { - "epoch": 1.82, - "learning_rate": 2.718427709671142e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017268113273229032, + "loss": 0.0132, "step": 168240 }, { - "epoch": 1.82, - "learning_rate": 2.7168061231108516e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.0001726735650392763, + "loss": 0.0142, "step": 168250 }, { - "epoch": 1.82, - "learning_rate": 2.715184536550561e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.0001726659973462623, + "loss": 0.0142, "step": 168260 }, { - "epoch": 1.82, - "learning_rate": 2.7135629499902702e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.0001726584296532483, + "loss": 0.0155, "step": 168270 }, { - "epoch": 1.82, - "learning_rate": 2.7119413634299798e-05, - "loss": 0.0078, + "epoch": 0.85, + "learning_rate": 0.00017265086196023428, + "loss": 0.0107, "step": 168280 }, { - "epoch": 1.82, - "learning_rate": 2.710319776869689e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.00017264329426722026, + "loss": 0.0107, "step": 168290 }, { - "epoch": 1.82, - "learning_rate": 2.7086981903093984e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.00017263572657420627, + "loss": 0.0151, "step": 168300 }, { - "epoch": 1.82, - "learning_rate": 2.707076603749108e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017262815888119225, + "loss": 0.0118, "step": 168310 }, { - "epoch": 1.82, - "learning_rate": 2.7054550171888172e-05, - "loss": 0.0083, + "epoch": 0.85, + "learning_rate": 0.00017262059118817823, + "loss": 0.014, "step": 168320 }, { - "epoch": 1.82, - "learning_rate": 2.703833430628527e-05, - "loss": 0.0077, + "epoch": 0.85, + "learning_rate": 0.00017261302349516424, + "loss": 0.0142, "step": 168330 }, { - "epoch": 1.82, - "learning_rate": 2.702211844068236e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017260545580215022, + "loss": 0.0116, "step": 168340 }, { - "epoch": 1.82, - "learning_rate": 2.7005902575079454e-05, - "loss": 0.0087, + "epoch": 0.85, + "learning_rate": 0.0001725978881091362, + "loss": 0.0125, "step": 168350 }, { - "epoch": 1.82, - "learning_rate": 2.698968670947655e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.0001725903204161222, + "loss": 0.0129, "step": 168360 }, { - "epoch": 1.82, - "learning_rate": 2.6973470843873643e-05, - "loss": 0.0096, + "epoch": 0.85, + "learning_rate": 0.0001725827527231082, + "loss": 0.0115, "step": 168370 }, { - "epoch": 1.82, - "learning_rate": 2.6957254978270736e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.00017257518503009417, + "loss": 0.0126, "step": 168380 }, { - "epoch": 1.82, - "learning_rate": 2.6941039112667832e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017256761733708015, + "loss": 0.014, "step": 168390 }, { - "epoch": 1.82, - "learning_rate": 2.6924823247064924e-05, - "loss": 0.0077, + "epoch": 0.85, + "learning_rate": 0.00017256004964406616, + "loss": 0.0147, "step": 168400 }, { - "epoch": 1.82, - "learning_rate": 2.690860738146202e-05, - "loss": 0.0046, + "epoch": 0.85, + "learning_rate": 0.00017255248195105214, + "loss": 0.0114, "step": 168410 }, { - "epoch": 1.82, - "learning_rate": 2.6892391515859113e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017254491425803813, + "loss": 0.0113, "step": 168420 }, { - "epoch": 1.82, - "learning_rate": 2.6876175650256206e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017253734656502413, + "loss": 0.0099, "step": 168430 }, { - "epoch": 1.82, - "learning_rate": 2.6859959784653302e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017252977887201012, + "loss": 0.0123, "step": 168440 }, { - "epoch": 1.82, - "learning_rate": 2.6843743919050395e-05, - "loss": 0.0082, + "epoch": 0.85, + "learning_rate": 0.0001725222111789961, + "loss": 0.0137, "step": 168450 }, { - "epoch": 1.82, - "learning_rate": 2.6827528053447488e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.0001725146434859821, + "loss": 0.0128, "step": 168460 }, { - "epoch": 1.82, - "learning_rate": 2.6811312187844584e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.0001725070757929681, + "loss": 0.0117, "step": 168470 }, { - "epoch": 1.82, - "learning_rate": 2.6795096322241677e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.00017249950809995407, + "loss": 0.0119, "step": 168480 }, { - "epoch": 1.82, - "learning_rate": 2.677888045663877e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017249194040694008, + "loss": 0.0117, "step": 168490 }, { - "epoch": 1.82, - "learning_rate": 2.676266459103587e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017248437271392606, + "loss": 0.0097, "step": 168500 }, { - "epoch": 1.82, - "learning_rate": 2.674644872543296e-05, - "loss": 0.0048, + "epoch": 0.85, + "learning_rate": 0.00017247680502091204, + "loss": 0.0095, "step": 168510 }, { - "epoch": 1.82, - "learning_rate": 2.6730232859830058e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017246923732789805, + "loss": 0.0114, "step": 168520 }, { - "epoch": 1.82, - "learning_rate": 2.671401699422715e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.00017246166963488403, + "loss": 0.0118, "step": 168530 }, { - "epoch": 1.82, - "learning_rate": 2.6697801128624247e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017245410194187, + "loss": 0.0109, "step": 168540 }, { - "epoch": 1.82, - "learning_rate": 2.668158526302134e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.000172446534248856, + "loss": 0.0108, "step": 168550 }, { - "epoch": 1.82, - "learning_rate": 2.6665369397418432e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.000172438966555842, + "loss": 0.0125, "step": 168560 }, { - "epoch": 1.82, - "learning_rate": 2.6649153531815528e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017243139886282798, + "loss": 0.0102, "step": 168570 }, { - "epoch": 1.82, - "learning_rate": 2.663293766621262e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017242383116981396, + "loss": 0.0117, "step": 168580 }, { - "epoch": 1.82, - "learning_rate": 2.6616721800609714e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.00017241626347679997, + "loss": 0.0107, "step": 168590 }, { - "epoch": 1.82, - "learning_rate": 2.660050593500681e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017240869578378595, + "loss": 0.0119, "step": 168600 }, { - "epoch": 1.82, - "learning_rate": 2.6584290069403903e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017240112809077194, + "loss": 0.0104, "step": 168610 }, { - "epoch": 1.82, - "learning_rate": 2.6568074203801e-05, - "loss": 0.0073, + "epoch": 0.85, + "learning_rate": 0.00017239356039775794, + "loss": 0.013, "step": 168620 }, { - "epoch": 1.82, - "learning_rate": 2.655185833819809e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017238599270474393, + "loss": 0.0133, "step": 168630 }, { - "epoch": 1.82, - "learning_rate": 2.6535642472595184e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.0001723784250117299, + "loss": 0.014, "step": 168640 }, { - "epoch": 1.82, - "learning_rate": 2.651942660699228e-05, - "loss": 0.0086, + "epoch": 0.85, + "learning_rate": 0.00017237085731871592, + "loss": 0.0151, "step": 168650 }, { - "epoch": 1.82, - "learning_rate": 2.6503210741389373e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.0001723632896257019, + "loss": 0.0118, "step": 168660 }, { - "epoch": 1.82, - "learning_rate": 2.6486994875786466e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017235572193268788, + "loss": 0.017, "step": 168670 }, { - "epoch": 1.82, - "learning_rate": 2.6470779010183562e-05, - "loss": 0.0082, + "epoch": 0.85, + "learning_rate": 0.0001723481542396739, + "loss": 0.0123, "step": 168680 }, { - "epoch": 1.82, - "learning_rate": 2.6454563144580655e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017234058654665987, + "loss": 0.0113, "step": 168690 }, { - "epoch": 1.82, - "learning_rate": 2.643834727897775e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017233301885364585, + "loss": 0.0135, "step": 168700 }, { - "epoch": 1.82, - "learning_rate": 2.6422131413374844e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017232545116063183, + "loss": 0.0087, "step": 168710 }, { - "epoch": 1.82, - "learning_rate": 2.6405915547771936e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017231788346761784, + "loss": 0.0144, "step": 168720 }, { - "epoch": 1.82, - "learning_rate": 2.6389699682169032e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017231031577460382, + "loss": 0.0153, "step": 168730 }, { - "epoch": 1.82, - "learning_rate": 2.6373483816566125e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.0001723027480815898, + "loss": 0.0119, "step": 168740 }, { - "epoch": 1.82, - "learning_rate": 2.6357267950963218e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.0001722951803885758, + "loss": 0.0116, "step": 168750 }, { - "epoch": 1.82, - "learning_rate": 2.6341052085360314e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.0001722876126955618, + "loss": 0.0104, "step": 168760 }, { - "epoch": 1.82, - "learning_rate": 2.6324836219757407e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017228004500254777, + "loss": 0.0118, "step": 168770 }, { - "epoch": 1.82, - "learning_rate": 2.63086203541545e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.00017227247730953378, + "loss": 0.0119, "step": 168780 }, { - "epoch": 1.82, - "learning_rate": 2.6292404488551596e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017226490961651976, + "loss": 0.0123, "step": 168790 }, { - "epoch": 1.82, - "learning_rate": 2.627618862294869e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.00017225734192350575, + "loss": 0.0121, "step": 168800 }, { - "epoch": 1.82, - "learning_rate": 2.6259972757345785e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017224977423049175, + "loss": 0.0109, "step": 168810 }, { - "epoch": 1.83, - "learning_rate": 2.6243756891742877e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.00017224220653747774, + "loss": 0.0138, "step": 168820 }, { - "epoch": 1.83, - "learning_rate": 2.622754102613997e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017223463884446372, + "loss": 0.014, "step": 168830 }, { - "epoch": 1.83, - "learning_rate": 2.6211325160537066e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.00017222707115144973, + "loss": 0.011, "step": 168840 }, { - "epoch": 1.83, - "learning_rate": 2.619510929493416e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.0001722195034584357, + "loss": 0.0108, "step": 168850 }, { - "epoch": 1.83, - "learning_rate": 2.617889342933126e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.0001722119357654217, + "loss": 0.0111, "step": 168860 }, { - "epoch": 1.83, - "learning_rate": 2.616267756372835e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.0001722043680724077, + "loss": 0.0112, "step": 168870 }, { - "epoch": 1.83, - "learning_rate": 2.6146461698125444e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017219680037939368, + "loss": 0.0131, "step": 168880 }, { - "epoch": 1.83, - "learning_rate": 2.613024583252254e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017218923268637966, + "loss": 0.014, "step": 168890 }, { - "epoch": 1.83, - "learning_rate": 2.6114029966919633e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017218166499336564, + "loss": 0.0154, "step": 168900 }, { - "epoch": 1.83, - "learning_rate": 2.609781410131673e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.00017217409730035165, + "loss": 0.0108, "step": 168910 }, { - "epoch": 1.83, - "learning_rate": 2.6081598235713822e-05, - "loss": 0.004, + "epoch": 0.85, + "learning_rate": 0.00017216652960733763, + "loss": 0.0129, "step": 168920 }, { - "epoch": 1.83, - "learning_rate": 2.6065382370110914e-05, - "loss": 0.0078, + "epoch": 0.85, + "learning_rate": 0.0001721589619143236, + "loss": 0.0135, "step": 168930 }, { - "epoch": 1.83, - "learning_rate": 2.604916650450801e-05, - "loss": 0.0049, + "epoch": 0.85, + "learning_rate": 0.00017215139422130962, + "loss": 0.0101, "step": 168940 }, { - "epoch": 1.83, - "learning_rate": 2.6032950638905103e-05, - "loss": 0.0077, + "epoch": 0.85, + "learning_rate": 0.0001721438265282956, + "loss": 0.0124, "step": 168950 }, { - "epoch": 1.83, - "learning_rate": 2.6016734773302196e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017213625883528158, + "loss": 0.0111, "step": 168960 }, { - "epoch": 1.83, - "learning_rate": 2.6000518907699292e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.0001721286911422676, + "loss": 0.0107, "step": 168970 }, { - "epoch": 1.83, - "learning_rate": 2.5984303042096385e-05, - "loss": 0.0077, + "epoch": 0.85, + "learning_rate": 0.00017212112344925357, + "loss": 0.0089, "step": 168980 }, { - "epoch": 1.83, - "learning_rate": 2.596808717649348e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017211355575623956, + "loss": 0.0138, "step": 168990 }, { - "epoch": 1.83, - "learning_rate": 2.5951871310890574e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017210598806322556, + "loss": 0.0129, "step": 169000 }, { - "epoch": 1.83, - "eval_cer": 0.9215139054647287, - "eval_loss": 0.005461297929286957, - "eval_runtime": 121.167, - "eval_samples_per_second": 16.506, - "eval_steps_per_second": 4.127, + "epoch": 0.85, + "eval_cer": 0.9144751078837893, + "eval_loss": 0.008490633219480515, + "eval_runtime": 116.745, + "eval_samples_per_second": 17.131, + "eval_steps_per_second": 4.283, "step": 169000 }, { - "epoch": 1.83, - "learning_rate": 2.5935655445287667e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.00017209842037021155, + "loss": 0.0123, "step": 169010 }, { - "epoch": 1.83, - "learning_rate": 2.5919439579684763e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017209085267719753, + "loss": 0.0113, "step": 169020 }, { - "epoch": 1.83, - "learning_rate": 2.5903223714081855e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017208328498418354, + "loss": 0.017, "step": 169030 }, { - "epoch": 1.83, - "learning_rate": 2.5887007848478948e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017207571729116952, + "loss": 0.0104, "step": 169040 }, { - "epoch": 1.83, - "learning_rate": 2.5870791982876044e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.0001720681495981555, + "loss": 0.0144, "step": 169050 }, { - "epoch": 1.83, - "learning_rate": 2.5854576117273137e-05, - "loss": 0.0084, + "epoch": 0.85, + "learning_rate": 0.00017206058190514145, + "loss": 0.0148, "step": 169060 }, { - "epoch": 1.83, - "learning_rate": 2.5838360251670233e-05, - "loss": 0.0104, + "epoch": 0.85, + "learning_rate": 0.00017205301421212746, + "loss": 0.0138, "step": 169070 }, { - "epoch": 1.83, - "learning_rate": 2.5822144386067326e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017204544651911344, + "loss": 0.0138, "step": 169080 }, { - "epoch": 1.83, - "learning_rate": 2.580592852046442e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017203787882609942, + "loss": 0.0119, "step": 169090 }, { - "epoch": 1.83, - "learning_rate": 2.5789712654861515e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017203031113308543, + "loss": 0.0121, "step": 169100 }, { - "epoch": 1.83, - "learning_rate": 2.5773496789258608e-05, - "loss": 0.0083, + "epoch": 0.85, + "learning_rate": 0.00017202274344007141, + "loss": 0.0147, "step": 169110 }, { - "epoch": 1.83, - "learning_rate": 2.57572809236557e-05, - "loss": 0.0107, + "epoch": 0.85, + "learning_rate": 0.0001720151757470574, + "loss": 0.0131, "step": 169120 }, { - "epoch": 1.83, - "learning_rate": 2.5741065058052796e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017200760805404338, + "loss": 0.0117, "step": 169130 }, { - "epoch": 1.83, - "learning_rate": 2.572484919244989e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017200004036102939, + "loss": 0.0119, "step": 169140 }, { - "epoch": 1.83, - "learning_rate": 2.5708633326846982e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017199247266801537, + "loss": 0.0121, "step": 169150 }, { - "epoch": 1.83, - "learning_rate": 2.5692417461244078e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017198490497500135, + "loss": 0.0098, "step": 169160 }, { - "epoch": 1.83, - "learning_rate": 2.567620159564117e-05, - "loss": 0.0083, + "epoch": 0.85, + "learning_rate": 0.00017197733728198736, + "loss": 0.0112, "step": 169170 }, { - "epoch": 1.83, - "learning_rate": 2.5659985730038267e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.00017196976958897334, + "loss": 0.0108, "step": 169180 }, { - "epoch": 1.83, - "learning_rate": 2.564376986443536e-05, - "loss": 0.0049, + "epoch": 0.85, + "learning_rate": 0.00017196220189595932, + "loss": 0.0121, "step": 169190 }, { - "epoch": 1.83, - "learning_rate": 2.5627553998832452e-05, - "loss": 0.0073, + "epoch": 0.85, + "learning_rate": 0.00017195463420294533, + "loss": 0.0125, "step": 169200 }, { - "epoch": 1.83, - "learning_rate": 2.561133813322955e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.0001719470665099313, + "loss": 0.0115, "step": 169210 }, { - "epoch": 1.83, - "learning_rate": 2.5595122267626645e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.0001719394988169173, + "loss": 0.0125, "step": 169220 }, { - "epoch": 1.83, - "learning_rate": 2.557890640202374e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.0001719319311239033, + "loss": 0.0139, "step": 169230 }, { - "epoch": 1.83, - "learning_rate": 2.5562690536420834e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.00017192436343088928, + "loss": 0.01, "step": 169240 }, { - "epoch": 1.83, - "learning_rate": 2.5546474670817926e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017191679573787526, + "loss": 0.0127, "step": 169250 }, { - "epoch": 1.83, - "learning_rate": 2.5530258805215022e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017190922804486127, + "loss": 0.012, "step": 169260 }, { - "epoch": 1.83, - "learning_rate": 2.5514042939612115e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017190166035184725, + "loss": 0.0133, "step": 169270 }, { - "epoch": 1.83, - "learning_rate": 2.549782707400921e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017189409265883323, + "loss": 0.0124, "step": 169280 }, { - "epoch": 1.83, - "learning_rate": 2.5481611208406304e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.00017188652496581922, + "loss": 0.0108, "step": 169290 }, { - "epoch": 1.83, - "learning_rate": 2.5465395342803397e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017187895727280522, + "loss": 0.0101, "step": 169300 }, { - "epoch": 1.83, - "learning_rate": 2.5449179477200493e-05, - "loss": 0.0103, + "epoch": 0.85, + "learning_rate": 0.0001718713895797912, + "loss": 0.0131, "step": 169310 }, { - "epoch": 1.83, - "learning_rate": 2.5432963611597586e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.0001718638218867772, + "loss": 0.0193, "step": 169320 }, { - "epoch": 1.83, - "learning_rate": 2.541674774599468e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.0001718562541937632, + "loss": 0.0136, "step": 169330 }, { - "epoch": 1.83, - "learning_rate": 2.5400531880391775e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017184868650074918, + "loss": 0.012, "step": 169340 }, { - "epoch": 1.83, - "learning_rate": 2.5384316014788867e-05, - "loss": 0.009, + "epoch": 0.85, + "learning_rate": 0.00017184111880773516, + "loss": 0.0128, "step": 169350 }, { - "epoch": 1.83, - "learning_rate": 2.5368100149185963e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017183355111472117, + "loss": 0.0118, "step": 169360 }, { - "epoch": 1.83, - "learning_rate": 2.5351884283583056e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017182598342170715, + "loss": 0.0119, "step": 169370 }, { - "epoch": 1.83, - "learning_rate": 2.533566841798015e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017181841572869313, + "loss": 0.0135, "step": 169380 }, { - "epoch": 1.83, - "learning_rate": 2.5319452552377245e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.00017181084803567914, + "loss": 0.013, "step": 169390 }, { - "epoch": 1.83, - "learning_rate": 2.5303236686774338e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017180328034266512, + "loss": 0.0116, "step": 169400 }, { - "epoch": 1.83, - "learning_rate": 2.528702082117143e-05, - "loss": 0.0076, + "epoch": 0.85, + "learning_rate": 0.0001717957126496511, + "loss": 0.015, "step": 169410 }, { - "epoch": 1.83, - "learning_rate": 2.5270804955568527e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.0001717881449566371, + "loss": 0.0127, "step": 169420 }, { - "epoch": 1.83, - "learning_rate": 2.525458908996562e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.0001717805772636231, + "loss": 0.0144, "step": 169430 }, { - "epoch": 1.83, - "learning_rate": 2.5238373224362712e-05, - "loss": 0.0049, + "epoch": 0.85, + "learning_rate": 0.00017177300957060907, + "loss": 0.0112, "step": 169440 }, { - "epoch": 1.83, - "learning_rate": 2.5222157358759808e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017176544187759505, + "loss": 0.0133, "step": 169450 }, { - "epoch": 1.83, - "learning_rate": 2.52059414931569e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017175787418458106, + "loss": 0.0128, "step": 169460 }, { - "epoch": 1.83, - "learning_rate": 2.5189725627553997e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017175030649156704, + "loss": 0.014, "step": 169470 }, { - "epoch": 1.83, - "learning_rate": 2.517350976195109e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017174273879855303, + "loss": 0.0123, "step": 169480 }, { - "epoch": 1.83, - "learning_rate": 2.5157293896348183e-05, - "loss": 0.0083, + "epoch": 0.86, + "learning_rate": 0.00017173517110553903, + "loss": 0.012, "step": 169490 }, { - "epoch": 1.83, - "learning_rate": 2.514107803074528e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017172760341252502, + "loss": 0.0136, "step": 169500 }, { - "epoch": 1.83, - "learning_rate": 2.512486216514237e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.000171720035719511, + "loss": 0.0091, "step": 169510 }, { - "epoch": 1.83, - "learning_rate": 2.5108646299539464e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.000171712468026497, + "loss": 0.0108, "step": 169520 }, { - "epoch": 1.83, - "learning_rate": 2.509243043393656e-05, - "loss": 0.0043, + "epoch": 0.86, + "learning_rate": 0.000171704900333483, + "loss": 0.0122, "step": 169530 }, { - "epoch": 1.83, - "learning_rate": 2.5076214568333653e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017169733264046897, + "loss": 0.0137, "step": 169540 }, { - "epoch": 1.83, - "learning_rate": 2.505999870273075e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.00017168976494745498, + "loss": 0.0132, "step": 169550 }, { - "epoch": 1.83, - "learning_rate": 2.5043782837127842e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017168219725444096, + "loss": 0.0103, "step": 169560 }, { - "epoch": 1.83, - "learning_rate": 2.5027566971524935e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017167462956142694, + "loss": 0.0129, "step": 169570 }, { - "epoch": 1.83, - "learning_rate": 2.5011351105922034e-05, - "loss": 0.0074, + "epoch": 0.86, + "learning_rate": 0.00017166706186841295, + "loss": 0.0103, "step": 169580 }, { - "epoch": 1.83, - "learning_rate": 2.4995135240319127e-05, - "loss": 0.0048, + "epoch": 0.86, + "learning_rate": 0.00017165949417539893, + "loss": 0.01, "step": 169590 }, { - "epoch": 1.83, - "learning_rate": 2.4978919374716223e-05, - "loss": 0.0049, + "epoch": 0.86, + "learning_rate": 0.0001716519264823849, + "loss": 0.0152, "step": 169600 }, { - "epoch": 1.83, - "learning_rate": 2.4962703509113316e-05, - "loss": 0.0088, + "epoch": 0.86, + "learning_rate": 0.0001716443587893709, + "loss": 0.0107, "step": 169610 }, { - "epoch": 1.83, - "learning_rate": 2.494648764351041e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.0001716367910963569, + "loss": 0.011, "step": 169620 }, { - "epoch": 1.83, - "learning_rate": 2.4930271777907505e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017162922340334288, + "loss": 0.0135, "step": 169630 }, { - "epoch": 1.83, - "learning_rate": 2.4914055912304597e-05, - "loss": 0.0089, + "epoch": 0.86, + "learning_rate": 0.00017162165571032886, + "loss": 0.0098, "step": 169640 }, { - "epoch": 1.83, - "learning_rate": 2.4897840046701694e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017161408801731487, + "loss": 0.0088, "step": 169650 }, { - "epoch": 1.83, - "learning_rate": 2.4881624181098786e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017160652032430085, + "loss": 0.0099, "step": 169660 }, { - "epoch": 1.83, - "learning_rate": 2.486540831549588e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.00017159895263128684, + "loss": 0.0094, "step": 169670 }, { - "epoch": 1.83, - "learning_rate": 2.4849192449892975e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017159138493827284, + "loss": 0.0123, "step": 169680 }, { - "epoch": 1.83, - "learning_rate": 2.4832976584290068e-05, - "loss": 0.0084, + "epoch": 0.86, + "learning_rate": 0.00017158381724525883, + "loss": 0.0152, "step": 169690 }, { - "epoch": 1.83, - "learning_rate": 2.481676071868716e-05, - "loss": 0.0083, + "epoch": 0.86, + "learning_rate": 0.0001715762495522448, + "loss": 0.0108, "step": 169700 }, { - "epoch": 1.83, - "learning_rate": 2.4800544853084257e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.00017156868185923082, + "loss": 0.0098, "step": 169710 }, { - "epoch": 1.83, - "learning_rate": 2.478432898748135e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.0001715611141662168, + "loss": 0.0096, "step": 169720 }, { - "epoch": 1.83, - "learning_rate": 2.4768113121878442e-05, - "loss": 0.0051, + "epoch": 0.86, + "learning_rate": 0.00017155354647320278, + "loss": 0.0138, "step": 169730 }, { - "epoch": 1.83, - "learning_rate": 2.475189725627554e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.0001715459787801888, + "loss": 0.0136, "step": 169740 }, { - "epoch": 1.84, - "learning_rate": 2.473568139067263e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017153841108717477, + "loss": 0.0111, "step": 169750 }, { - "epoch": 1.84, - "learning_rate": 2.4719465525069727e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017153084339416075, + "loss": 0.0103, "step": 169760 }, { - "epoch": 1.84, - "learning_rate": 2.470324965946682e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017152327570114676, + "loss": 0.0115, "step": 169770 }, { - "epoch": 1.84, - "learning_rate": 2.4687033793863913e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.00017151570800813274, + "loss": 0.0116, "step": 169780 }, { - "epoch": 1.84, - "learning_rate": 2.467081792826101e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017150814031511872, + "loss": 0.01, "step": 169790 }, { - "epoch": 1.84, - "learning_rate": 2.4654602062658102e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.0001715005726221047, + "loss": 0.0111, "step": 169800 }, { - "epoch": 1.84, - "learning_rate": 2.4638386197055194e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.0001714930049290907, + "loss": 0.012, "step": 169810 }, { - "epoch": 1.84, - "learning_rate": 2.462217033145229e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.0001714854372360767, + "loss": 0.011, "step": 169820 }, { - "epoch": 1.84, - "learning_rate": 2.4605954465849383e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.00017147786954306267, + "loss": 0.0097, "step": 169830 }, { - "epoch": 1.84, - "learning_rate": 2.458973860024648e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.00017147030185004868, + "loss": 0.0122, "step": 169840 }, { - "epoch": 1.84, - "learning_rate": 2.4573522734643572e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017146273415703466, + "loss": 0.0112, "step": 169850 }, { - "epoch": 1.84, - "learning_rate": 2.4557306869040665e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017145516646402065, + "loss": 0.0126, "step": 169860 }, { - "epoch": 1.84, - "learning_rate": 2.454109100343776e-05, - "loss": 0.0075, + "epoch": 0.86, + "learning_rate": 0.00017144759877100665, + "loss": 0.0124, "step": 169870 }, { - "epoch": 1.84, - "learning_rate": 2.4524875137834854e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.00017144003107799264, + "loss": 0.0147, "step": 169880 }, { - "epoch": 1.84, - "learning_rate": 2.4508659272231947e-05, - "loss": 0.008, + "epoch": 0.86, + "learning_rate": 0.00017143246338497862, + "loss": 0.0113, "step": 169890 }, { - "epoch": 1.84, - "learning_rate": 2.4492443406629043e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017142489569196463, + "loss": 0.0103, "step": 169900 }, { - "epoch": 1.84, - "learning_rate": 2.4476227541026135e-05, - "loss": 0.01, + "epoch": 0.86, + "learning_rate": 0.0001714173279989506, + "loss": 0.0116, "step": 169910 }, { - "epoch": 1.84, - "learning_rate": 2.446001167542323e-05, - "loss": 0.0049, + "epoch": 0.86, + "learning_rate": 0.0001714097603059366, + "loss": 0.0103, "step": 169920 }, { - "epoch": 1.84, - "learning_rate": 2.4443795809820324e-05, - "loss": 0.0049, + "epoch": 0.86, + "learning_rate": 0.0001714021926129226, + "loss": 0.0128, "step": 169930 }, { - "epoch": 1.84, - "learning_rate": 2.4427579944217424e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017139462491990858, + "loss": 0.0119, "step": 169940 }, { - "epoch": 1.84, - "learning_rate": 2.4411364078614517e-05, - "loss": 0.0078, + "epoch": 0.86, + "learning_rate": 0.00017138705722689456, + "loss": 0.0113, "step": 169950 }, { - "epoch": 1.84, - "learning_rate": 2.439514821301161e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.00017137948953388054, + "loss": 0.0139, "step": 169960 }, { - "epoch": 1.84, - "learning_rate": 2.4378932347408705e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017137192184086655, + "loss": 0.0115, "step": 169970 }, { - "epoch": 1.84, - "learning_rate": 2.4362716481805798e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017136435414785253, + "loss": 0.0093, "step": 169980 }, { - "epoch": 1.84, - "learning_rate": 2.434650061620289e-05, - "loss": 0.0051, + "epoch": 0.86, + "learning_rate": 0.0001713567864548385, + "loss": 0.0162, "step": 169990 }, { - "epoch": 1.84, - "learning_rate": 2.4330284750599987e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017134921876182452, + "loss": 0.015, "step": 170000 }, { - "epoch": 1.84, - "eval_cer": 0.9215234600972488, - "eval_loss": 0.005428744480013847, - "eval_runtime": 121.1672, - "eval_samples_per_second": 16.506, - "eval_steps_per_second": 4.127, + "epoch": 0.86, + "eval_cer": 0.9144799598644162, + "eval_loss": 0.00878238771110773, + "eval_runtime": 116.6286, + "eval_samples_per_second": 17.148, + "eval_steps_per_second": 4.287, "step": 170000 }, { - "epoch": 1.84, - "learning_rate": 2.431406888499708e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.0001713416510688105, + "loss": 0.0126, "step": 170010 }, { - "epoch": 1.84, - "learning_rate": 2.4297853019394173e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017133408337579648, + "loss": 0.0136, "step": 170020 }, { - "epoch": 1.84, - "learning_rate": 2.428163715379127e-05, - "loss": 0.0079, + "epoch": 0.86, + "learning_rate": 0.0001713265156827825, + "loss": 0.0109, "step": 170030 }, { - "epoch": 1.84, - "learning_rate": 2.426542128818836e-05, - "loss": 0.0074, + "epoch": 0.86, + "learning_rate": 0.00017131894798976847, + "loss": 0.0117, "step": 170040 }, { - "epoch": 1.84, - "learning_rate": 2.4249205422585458e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.00017131138029675446, + "loss": 0.0139, "step": 170050 }, { - "epoch": 1.84, - "learning_rate": 2.423298955698255e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017130381260374046, + "loss": 0.0119, "step": 170060 }, { - "epoch": 1.84, - "learning_rate": 2.4216773691379643e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017129624491072645, + "loss": 0.011, "step": 170070 }, { - "epoch": 1.84, - "learning_rate": 2.420055782577674e-05, - "loss": 0.0093, + "epoch": 0.86, + "learning_rate": 0.00017128867721771243, + "loss": 0.0101, "step": 170080 }, { - "epoch": 1.84, - "learning_rate": 2.4184341960173832e-05, - "loss": 0.008, + "epoch": 0.86, + "learning_rate": 0.00017128110952469844, + "loss": 0.0131, "step": 170090 }, { - "epoch": 1.84, - "learning_rate": 2.4168126094570925e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017127354183168442, + "loss": 0.0118, "step": 170100 }, { - "epoch": 1.84, - "learning_rate": 2.415191022896802e-05, - "loss": 0.0082, + "epoch": 0.86, + "learning_rate": 0.0001712659741386704, + "loss": 0.0122, "step": 170110 }, { - "epoch": 1.84, - "learning_rate": 2.4135694363365114e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.00017125840644565638, + "loss": 0.0124, "step": 170120 }, { - "epoch": 1.84, - "learning_rate": 2.411947849776221e-05, - "loss": 0.0051, + "epoch": 0.86, + "learning_rate": 0.0001712508387526424, + "loss": 0.0122, "step": 170130 }, { - "epoch": 1.84, - "learning_rate": 2.4103262632159302e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017124327105962837, + "loss": 0.0124, "step": 170140 }, { - "epoch": 1.84, - "learning_rate": 2.4087046766556395e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.00017123570336661435, + "loss": 0.0128, "step": 170150 }, { - "epoch": 1.84, - "learning_rate": 2.407083090095349e-05, - "loss": 0.0083, + "epoch": 0.86, + "learning_rate": 0.00017122813567360036, + "loss": 0.0099, "step": 170160 }, { - "epoch": 1.84, - "learning_rate": 2.4054615035350584e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017122056798058634, + "loss": 0.0125, "step": 170170 }, { - "epoch": 1.84, - "learning_rate": 2.4038399169747677e-05, - "loss": 0.0079, + "epoch": 0.86, + "learning_rate": 0.00017121300028757232, + "loss": 0.0101, "step": 170180 }, { - "epoch": 1.84, - "learning_rate": 2.4022183304144773e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.00017120543259455833, + "loss": 0.0121, "step": 170190 }, { - "epoch": 1.84, - "learning_rate": 2.4005967438541866e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.0001711978649015443, + "loss": 0.0113, "step": 170200 }, { - "epoch": 1.84, - "learning_rate": 2.3989751572938962e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.0001711902972085303, + "loss": 0.011, "step": 170210 }, { - "epoch": 1.84, - "learning_rate": 2.3973535707336055e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.0001711827295155163, + "loss": 0.0158, "step": 170220 }, { - "epoch": 1.84, - "learning_rate": 2.3957319841733147e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017117516182250228, + "loss": 0.0129, "step": 170230 }, { - "epoch": 1.84, - "learning_rate": 2.3941103976130243e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017116759412948827, + "loss": 0.0127, "step": 170240 }, { - "epoch": 1.84, - "learning_rate": 2.3924888110527336e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.00017116002643647427, + "loss": 0.0115, "step": 170250 }, { - "epoch": 1.84, - "learning_rate": 2.390867224492443e-05, - "loss": 0.008, + "epoch": 0.86, + "learning_rate": 0.00017115245874346026, + "loss": 0.0271, "step": 170260 }, { - "epoch": 1.84, - "learning_rate": 2.3892456379321525e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.00017114489105044624, + "loss": 0.0112, "step": 170270 }, { - "epoch": 1.84, - "learning_rate": 2.3876240513718618e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017113732335743225, + "loss": 0.0129, "step": 170280 }, { - "epoch": 1.84, - "learning_rate": 2.3860024648115714e-05, - "loss": 0.0045, + "epoch": 0.86, + "learning_rate": 0.00017112975566441823, + "loss": 0.0123, "step": 170290 }, { - "epoch": 1.84, - "learning_rate": 2.384380878251281e-05, - "loss": 0.0086, + "epoch": 0.86, + "learning_rate": 0.0001711221879714042, + "loss": 0.0142, "step": 170300 }, { - "epoch": 1.84, - "learning_rate": 2.3827592916909903e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017111462027839016, + "loss": 0.0148, "step": 170310 }, { - "epoch": 1.84, - "learning_rate": 2.3811377051307e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017110705258537617, + "loss": 0.0113, "step": 170320 }, { - "epoch": 1.84, - "learning_rate": 2.379516118570409e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.00017109948489236215, + "loss": 0.012, "step": 170330 }, { - "epoch": 1.84, - "learning_rate": 2.3778945320101188e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017109191719934813, + "loss": 0.011, "step": 170340 }, { - "epoch": 1.84, - "learning_rate": 2.376272945449828e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017108434950633412, + "loss": 0.0127, "step": 170350 }, { - "epoch": 1.84, - "learning_rate": 2.3746513588895373e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017107678181332012, + "loss": 0.0173, "step": 170360 }, { - "epoch": 1.84, - "learning_rate": 2.373029772329247e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.0001710692141203061, + "loss": 0.015, "step": 170370 }, { - "epoch": 1.84, - "learning_rate": 2.3714081857689562e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.0001710616464272921, + "loss": 0.0106, "step": 170380 }, { - "epoch": 1.84, - "learning_rate": 2.3697865992086655e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.0001710540787342781, + "loss": 0.0098, "step": 170390 }, { - "epoch": 1.84, - "learning_rate": 2.368165012648375e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017104651104126408, + "loss": 0.0113, "step": 170400 }, { - "epoch": 1.84, - "learning_rate": 2.3665434260880844e-05, - "loss": 0.0075, + "epoch": 0.86, + "learning_rate": 0.00017103894334825006, + "loss": 0.023, "step": 170410 }, { - "epoch": 1.84, - "learning_rate": 2.364921839527794e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.00017103137565523607, + "loss": 0.0125, "step": 170420 }, { - "epoch": 1.84, - "learning_rate": 2.3633002529675033e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.00017102380796222205, + "loss": 0.0142, "step": 170430 }, { - "epoch": 1.84, - "learning_rate": 2.3616786664072125e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017101624026920803, + "loss": 0.0121, "step": 170440 }, { - "epoch": 1.84, - "learning_rate": 2.360057079846922e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017100867257619404, + "loss": 0.0095, "step": 170450 }, { - "epoch": 1.84, - "learning_rate": 2.3584354932866314e-05, - "loss": 0.0081, + "epoch": 0.86, + "learning_rate": 0.00017100110488318002, + "loss": 0.0118, "step": 170460 }, { - "epoch": 1.84, - "learning_rate": 2.3568139067263407e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.000170993537190166, + "loss": 0.0098, "step": 170470 }, { - "epoch": 1.84, - "learning_rate": 2.3551923201660503e-05, - "loss": 0.0074, + "epoch": 0.86, + "learning_rate": 0.000170985969497152, + "loss": 0.0096, "step": 170480 }, { - "epoch": 1.84, - "learning_rate": 2.3535707336057596e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.000170978401804138, + "loss": 0.0117, "step": 170490 }, { - "epoch": 1.84, - "learning_rate": 2.3519491470454692e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017097083411112397, + "loss": 0.0129, "step": 170500 }, { - "epoch": 1.84, - "learning_rate": 2.3503275604851785e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017096326641810995, + "loss": 0.0102, "step": 170510 }, { - "epoch": 1.84, - "learning_rate": 2.3487059739248877e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017095569872509596, + "loss": 0.0144, "step": 170520 }, { - "epoch": 1.84, - "learning_rate": 2.3470843873645974e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017094813103208194, + "loss": 0.0121, "step": 170530 }, { - "epoch": 1.84, - "learning_rate": 2.3454628008043066e-05, - "loss": 0.0075, + "epoch": 0.86, + "learning_rate": 0.00017094056333906793, + "loss": 0.0141, "step": 170540 }, { - "epoch": 1.84, - "learning_rate": 2.343841214244016e-05, - "loss": 0.0084, + "epoch": 0.86, + "learning_rate": 0.00017093299564605393, + "loss": 0.0121, "step": 170550 }, { - "epoch": 1.84, - "learning_rate": 2.3422196276837255e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.00017092542795303992, + "loss": 0.0126, "step": 170560 }, { - "epoch": 1.84, - "learning_rate": 2.3405980411234348e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.0001709178602600259, + "loss": 0.0125, "step": 170570 }, { - "epoch": 1.84, - "learning_rate": 2.3389764545631444e-05, - "loss": 0.0082, + "epoch": 0.86, + "learning_rate": 0.0001709102925670119, + "loss": 0.0105, "step": 170580 }, { - "epoch": 1.84, - "learning_rate": 2.3373548680028537e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.0001709027248739979, + "loss": 0.0116, "step": 170590 }, { - "epoch": 1.84, - "learning_rate": 2.335733281442563e-05, - "loss": 0.0117, + "epoch": 0.86, + "learning_rate": 0.00017089515718098387, + "loss": 0.0133, "step": 170600 }, { - "epoch": 1.84, - "learning_rate": 2.3341116948822726e-05, - "loss": 0.0089, + "epoch": 0.86, + "learning_rate": 0.00017088758948796988, + "loss": 0.0117, "step": 170610 }, { - "epoch": 1.84, - "learning_rate": 2.332490108321982e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017088002179495586, + "loss": 0.0116, "step": 170620 }, { - "epoch": 1.84, - "learning_rate": 2.330868521761691e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017087245410194184, + "loss": 0.0113, "step": 170630 }, { - "epoch": 1.84, - "learning_rate": 2.3292469352014007e-05, - "loss": 0.0043, + "epoch": 0.86, + "learning_rate": 0.00017086488640892785, + "loss": 0.0117, "step": 170640 }, { - "epoch": 1.84, - "learning_rate": 2.32762534864111e-05, - "loss": 0.0047, + "epoch": 0.86, + "learning_rate": 0.00017085731871591383, + "loss": 0.0138, "step": 170650 }, { - "epoch": 1.84, - "learning_rate": 2.32600376208082e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.0001708497510228998, + "loss": 0.0104, "step": 170660 }, { - "epoch": 1.85, - "learning_rate": 2.3243821755205292e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017084218332988582, + "loss": 0.0165, "step": 170670 }, { - "epoch": 1.85, - "learning_rate": 2.3227605889602385e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.0001708346156368718, + "loss": 0.0107, "step": 170680 }, { - "epoch": 1.85, - "learning_rate": 2.321139002399948e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017082704794385778, + "loss": 0.0118, "step": 170690 }, { - "epoch": 1.85, - "learning_rate": 2.3195174158396574e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017081948025084376, + "loss": 0.0125, "step": 170700 }, { - "epoch": 1.85, - "learning_rate": 2.317895829279367e-05, - "loss": 0.008, + "epoch": 0.86, + "learning_rate": 0.00017081191255782977, + "loss": 0.0113, "step": 170710 }, { - "epoch": 1.85, - "learning_rate": 2.3162742427190763e-05, - "loss": 0.0081, + "epoch": 0.86, + "learning_rate": 0.00017080434486481575, + "loss": 0.0132, "step": 170720 }, { - "epoch": 1.85, - "learning_rate": 2.3146526561587856e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.00017079677717180174, + "loss": 0.0098, "step": 170730 }, { - "epoch": 1.85, - "learning_rate": 2.3130310695984952e-05, - "loss": 0.0074, + "epoch": 0.86, + "learning_rate": 0.00017078920947878774, + "loss": 0.0098, "step": 170740 }, { - "epoch": 1.85, - "learning_rate": 2.3114094830382044e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017078164178577373, + "loss": 0.0121, "step": 170750 }, { - "epoch": 1.85, - "learning_rate": 2.3097878964779137e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.0001707740740927597, + "loss": 0.0148, "step": 170760 }, { - "epoch": 1.85, - "learning_rate": 2.3081663099176233e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017076650639974572, + "loss": 0.0139, "step": 170770 }, { - "epoch": 1.85, - "learning_rate": 2.3065447233573326e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.0001707589387067317, + "loss": 0.0155, "step": 170780 }, { - "epoch": 1.85, - "learning_rate": 2.3049231367970422e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017075137101371768, + "loss": 0.0094, "step": 170790 }, { - "epoch": 1.85, - "learning_rate": 2.3033015502367515e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.0001707438033207037, + "loss": 0.0137, "step": 170800 }, { - "epoch": 1.85, - "learning_rate": 2.3016799636764608e-05, - "loss": 0.0079, + "epoch": 0.86, + "learning_rate": 0.00017073623562768967, + "loss": 0.0097, "step": 170810 }, { - "epoch": 1.85, - "learning_rate": 2.3000583771161704e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017072866793467565, + "loss": 0.0095, "step": 170820 }, { - "epoch": 1.85, - "learning_rate": 2.2984367905558797e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017072110024166166, + "loss": 0.0162, "step": 170830 }, { - "epoch": 1.85, - "learning_rate": 2.296815203995589e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017071353254864764, + "loss": 0.0122, "step": 170840 }, { - "epoch": 1.85, - "learning_rate": 2.2951936174352985e-05, - "loss": 0.0074, + "epoch": 0.86, + "learning_rate": 0.00017070596485563362, + "loss": 0.0098, "step": 170850 }, { - "epoch": 1.85, - "learning_rate": 2.2935720308750078e-05, - "loss": 0.0048, + "epoch": 0.86, + "learning_rate": 0.0001706983971626196, + "loss": 0.0128, "step": 170860 }, { - "epoch": 1.85, - "learning_rate": 2.2919504443147174e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.0001706908294696056, + "loss": 0.0116, "step": 170870 }, { - "epoch": 1.85, - "learning_rate": 2.2903288577544267e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.0001706832617765916, + "loss": 0.0118, "step": 170880 }, { - "epoch": 1.85, - "learning_rate": 2.288707271194136e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017067569408357757, + "loss": 0.0102, "step": 170890 }, { - "epoch": 1.85, - "learning_rate": 2.2870856846338456e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017066812639056358, + "loss": 0.0121, "step": 170900 }, { - "epoch": 1.85, - "learning_rate": 2.285464098073555e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.00017066055869754956, + "loss": 0.0111, "step": 170910 }, { - "epoch": 1.85, - "learning_rate": 2.283842511513264e-05, - "loss": 0.0043, + "epoch": 0.86, + "learning_rate": 0.00017065299100453555, + "loss": 0.0113, "step": 170920 }, { - "epoch": 1.85, - "learning_rate": 2.2822209249529738e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017064542331152155, + "loss": 0.0141, "step": 170930 }, { - "epoch": 1.85, - "learning_rate": 2.280599338392683e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017063785561850754, + "loss": 0.0115, "step": 170940 }, { - "epoch": 1.85, - "learning_rate": 2.2789777518323926e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017063028792549352, + "loss": 0.0227, "step": 170950 }, { - "epoch": 1.85, - "learning_rate": 2.277356165272102e-05, - "loss": 0.0049, + "epoch": 0.86, + "learning_rate": 0.00017062272023247953, + "loss": 0.0105, "step": 170960 }, { - "epoch": 1.85, - "learning_rate": 2.2757345787118112e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.0001706151525394655, + "loss": 0.0113, "step": 170970 }, { - "epoch": 1.85, - "learning_rate": 2.2741129921515208e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.0001706075848464515, + "loss": 0.0103, "step": 170980 }, { - "epoch": 1.85, - "learning_rate": 2.27249140559123e-05, - "loss": 0.0051, + "epoch": 0.86, + "learning_rate": 0.0001706000171534375, + "loss": 0.0109, "step": 170990 }, { - "epoch": 1.85, - "learning_rate": 2.2708698190309394e-05, - "loss": 0.0081, + "epoch": 0.86, + "learning_rate": 0.00017059244946042348, + "loss": 0.0112, "step": 171000 }, { - "epoch": 1.85, - "eval_cer": 0.9215208542883797, - "eval_loss": 0.005525045562535524, - "eval_runtime": 121.1759, - "eval_samples_per_second": 16.505, - "eval_steps_per_second": 4.126, + "epoch": 0.86, + "eval_cer": 0.914508101352053, + "eval_loss": 0.008454186841845512, + "eval_runtime": 116.644, + "eval_samples_per_second": 17.146, + "eval_steps_per_second": 4.287, "step": 171000 }, { - "epoch": 1.85, - "learning_rate": 2.269248232470649e-05, - "loss": 0.008, + "epoch": 0.86, + "learning_rate": 0.00017058488176740946, + "loss": 0.0105, "step": 171010 }, { - "epoch": 1.85, - "learning_rate": 2.2676266459103586e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017057731407439544, + "loss": 0.0115, "step": 171020 }, { - "epoch": 1.85, - "learning_rate": 2.2660050593500682e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017056974638138145, + "loss": 0.0135, "step": 171030 }, { - "epoch": 1.85, - "learning_rate": 2.2643834727897775e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.00017056217868836743, + "loss": 0.0112, "step": 171040 }, { - "epoch": 1.85, - "learning_rate": 2.2627618862294867e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.0001705546109953534, + "loss": 0.0095, "step": 171050 }, { - "epoch": 1.85, - "learning_rate": 2.2611402996691964e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017054704330233942, + "loss": 0.0116, "step": 171060 }, { - "epoch": 1.85, - "learning_rate": 2.2595187131089056e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.0001705394756093254, + "loss": 0.0101, "step": 171070 }, { - "epoch": 1.85, - "learning_rate": 2.2578971265486152e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017053190791631138, + "loss": 0.0124, "step": 171080 }, { - "epoch": 1.85, - "learning_rate": 2.2562755399883245e-05, - "loss": 0.0087, + "epoch": 0.86, + "learning_rate": 0.0001705243402232974, + "loss": 0.0097, "step": 171090 }, { - "epoch": 1.85, - "learning_rate": 2.2546539534280338e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017051677253028337, + "loss": 0.011, "step": 171100 }, { - "epoch": 1.85, - "learning_rate": 2.2530323668677434e-05, - "loss": 0.0079, + "epoch": 0.86, + "learning_rate": 0.00017050920483726936, + "loss": 0.0133, "step": 171110 }, { - "epoch": 1.85, - "learning_rate": 2.2514107803074527e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.00017050163714425536, + "loss": 0.0121, "step": 171120 }, { - "epoch": 1.85, - "learning_rate": 2.249789193747162e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017049406945124135, + "loss": 0.0109, "step": 171130 }, { - "epoch": 1.85, - "learning_rate": 2.2481676071868716e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.00017048650175822733, + "loss": 0.0118, "step": 171140 }, { - "epoch": 1.85, - "learning_rate": 2.246546020626581e-05, - "loss": 0.0044, + "epoch": 0.86, + "learning_rate": 0.00017047893406521334, + "loss": 0.0097, "step": 171150 }, { - "epoch": 1.85, - "learning_rate": 2.2449244340662905e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017047136637219932, + "loss": 0.0131, "step": 171160 }, { - "epoch": 1.85, - "learning_rate": 2.2433028475059997e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.0001704637986791853, + "loss": 0.0114, "step": 171170 }, { - "epoch": 1.85, - "learning_rate": 2.241681260945709e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.0001704562309861713, + "loss": 0.01, "step": 171180 }, { - "epoch": 1.85, - "learning_rate": 2.2400596743854186e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.0001704486632931573, + "loss": 0.0127, "step": 171190 }, { - "epoch": 1.85, - "learning_rate": 2.238438087825128e-05, - "loss": 0.0075, + "epoch": 0.86, + "learning_rate": 0.00017044109560014327, + "loss": 0.0152, "step": 171200 }, { - "epoch": 1.85, - "learning_rate": 2.236816501264837e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017043352790712925, + "loss": 0.0144, "step": 171210 }, { - "epoch": 1.85, - "learning_rate": 2.2351949147045468e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017042596021411526, + "loss": 0.0109, "step": 171220 }, { - "epoch": 1.85, - "learning_rate": 2.233573328144256e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017041839252110124, + "loss": 0.0093, "step": 171230 }, { - "epoch": 1.85, - "learning_rate": 2.2319517415839657e-05, - "loss": 0.0083, + "epoch": 0.86, + "learning_rate": 0.00017041082482808722, + "loss": 0.0102, "step": 171240 }, { - "epoch": 1.85, - "learning_rate": 2.230330155023675e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.00017040325713507323, + "loss": 0.0106, "step": 171250 }, { - "epoch": 1.85, - "learning_rate": 2.2287085684633842e-05, - "loss": 0.008, + "epoch": 0.86, + "learning_rate": 0.0001703956894420592, + "loss": 0.012, "step": 171260 }, { - "epoch": 1.85, - "learning_rate": 2.2270869819030938e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.0001703881217490452, + "loss": 0.0092, "step": 171270 }, { - "epoch": 1.85, - "learning_rate": 2.225465395342803e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.0001703805540560312, + "loss": 0.0085, "step": 171280 }, { - "epoch": 1.85, - "learning_rate": 2.2238438087825124e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017037298636301718, + "loss": 0.0103, "step": 171290 }, { - "epoch": 1.85, - "learning_rate": 2.222222222222222e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017036541867000317, + "loss": 0.0119, "step": 171300 }, { - "epoch": 1.85, - "learning_rate": 2.2206006356619313e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017035785097698917, + "loss": 0.0116, "step": 171310 }, { - "epoch": 1.85, - "learning_rate": 2.2189790491016405e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017035028328397516, + "loss": 0.0106, "step": 171320 }, { - "epoch": 1.85, - "learning_rate": 2.21735746254135e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017034271559096114, + "loss": 0.0105, "step": 171330 }, { - "epoch": 1.85, - "learning_rate": 2.2157358759810594e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017033514789794715, + "loss": 0.009, "step": 171340 }, { - "epoch": 1.85, - "learning_rate": 2.214114289420769e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017032758020493313, + "loss": 0.0111, "step": 171350 }, { - "epoch": 1.85, - "learning_rate": 2.2124927028604783e-05, - "loss": 0.0074, + "epoch": 0.86, + "learning_rate": 0.0001703200125119191, + "loss": 0.0101, "step": 171360 }, { - "epoch": 1.85, - "learning_rate": 2.2108711163001876e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.0001703124448189051, + "loss": 0.0129, "step": 171370 }, { - "epoch": 1.85, - "learning_rate": 2.2092495297398975e-05, - "loss": 0.0049, + "epoch": 0.86, + "learning_rate": 0.0001703048771258911, + "loss": 0.0114, "step": 171380 }, { - "epoch": 1.85, - "learning_rate": 2.2076279431796068e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017029730943287708, + "loss": 0.0128, "step": 171390 }, { - "epoch": 1.85, - "learning_rate": 2.2060063566193164e-05, - "loss": 0.0092, + "epoch": 0.86, + "learning_rate": 0.00017028974173986306, + "loss": 0.011, "step": 171400 }, { - "epoch": 1.85, - "learning_rate": 2.2043847700590257e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017028217404684907, + "loss": 0.0086, "step": 171410 }, { - "epoch": 1.85, - "learning_rate": 2.202763183498735e-05, - "loss": 0.0078, + "epoch": 0.86, + "learning_rate": 0.00017027460635383505, + "loss": 0.0116, "step": 171420 }, { - "epoch": 1.85, - "learning_rate": 2.2011415969384446e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017026703866082103, + "loss": 0.012, "step": 171430 }, { - "epoch": 1.85, - "learning_rate": 2.199520010378154e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.00017025947096780704, + "loss": 0.0109, "step": 171440 }, { - "epoch": 1.85, - "learning_rate": 2.1978984238178635e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017025190327479302, + "loss": 0.0098, "step": 171450 }, { - "epoch": 1.85, - "learning_rate": 2.1962768372575728e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.000170244335581779, + "loss": 0.0105, "step": 171460 }, { - "epoch": 1.85, - "learning_rate": 2.194655250697282e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.000170236767888765, + "loss": 0.0107, "step": 171470 }, { - "epoch": 1.85, - "learning_rate": 2.1930336641369916e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.000170229200195751, + "loss": 0.0118, "step": 171480 }, { - "epoch": 1.85, - "learning_rate": 2.191412077576701e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00017022163250273698, + "loss": 0.0116, "step": 171490 }, { - "epoch": 1.85, - "learning_rate": 2.1897904910164102e-05, - "loss": 0.0049, + "epoch": 0.87, + "learning_rate": 0.00017021406480972298, + "loss": 0.0115, "step": 171500 }, { - "epoch": 1.85, - "learning_rate": 2.1881689044561198e-05, - "loss": 0.0075, + "epoch": 0.87, + "learning_rate": 0.00017020649711670897, + "loss": 0.0115, "step": 171510 }, { - "epoch": 1.85, - "learning_rate": 2.186547317895829e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.00017019892942369495, + "loss": 0.01, "step": 171520 }, { - "epoch": 1.85, - "learning_rate": 2.1849257313355387e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00017019136173068093, + "loss": 0.0124, "step": 171530 }, { - "epoch": 1.85, - "learning_rate": 2.183304144775248e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00017018379403766694, + "loss": 0.0118, "step": 171540 }, { - "epoch": 1.85, - "learning_rate": 2.1816825582149572e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00017017622634465292, + "loss": 0.0116, "step": 171550 }, { - "epoch": 1.85, - "learning_rate": 2.180060971654667e-05, - "loss": 0.0081, + "epoch": 0.87, + "learning_rate": 0.0001701686586516389, + "loss": 0.0131, "step": 171560 }, { - "epoch": 1.85, - "learning_rate": 2.178439385094376e-05, - "loss": 0.0031, + "epoch": 0.87, + "learning_rate": 0.00017016109095862488, + "loss": 0.0154, "step": 171570 }, { - "epoch": 1.85, - "learning_rate": 2.1768177985340854e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00017015352326561086, + "loss": 0.0102, "step": 171580 }, { - "epoch": 1.85, - "learning_rate": 2.175196211973795e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.00017014595557259684, + "loss": 0.011, "step": 171590 }, { - "epoch": 1.86, - "learning_rate": 2.1735746254135043e-05, - "loss": 0.005, + "epoch": 0.87, + "learning_rate": 0.00017013838787958283, + "loss": 0.0132, "step": 171600 }, { - "epoch": 1.86, - "learning_rate": 2.1719530388532136e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00017013082018656883, + "loss": 0.0096, "step": 171610 }, { - "epoch": 1.86, - "learning_rate": 2.1703314522929232e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00017012325249355482, + "loss": 0.0092, "step": 171620 }, { - "epoch": 1.86, - "learning_rate": 2.1687098657326324e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.0001701156848005408, + "loss": 0.017, "step": 171630 }, { - "epoch": 1.86, - "learning_rate": 2.167088279172342e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.0001701081171075268, + "loss": 0.0112, "step": 171640 }, { - "epoch": 1.86, - "learning_rate": 2.1654666926120513e-05, - "loss": 0.0076, + "epoch": 0.87, + "learning_rate": 0.0001701005494145128, + "loss": 0.0108, "step": 171650 }, { - "epoch": 1.86, - "learning_rate": 2.1638451060517606e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00017009298172149877, + "loss": 0.0099, "step": 171660 }, { - "epoch": 1.86, - "learning_rate": 2.1622235194914702e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00017008541402848478, + "loss": 0.0111, "step": 171670 }, { - "epoch": 1.86, - "learning_rate": 2.1606019329311795e-05, - "loss": 0.0052, + "epoch": 0.87, + "learning_rate": 0.00017007784633547076, + "loss": 0.0118, "step": 171680 }, { - "epoch": 1.86, - "learning_rate": 2.1589803463708888e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00017007027864245674, + "loss": 0.0108, "step": 171690 }, { - "epoch": 1.86, - "learning_rate": 2.1573587598105984e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00017006271094944275, + "loss": 0.0088, "step": 171700 }, { - "epoch": 1.86, - "learning_rate": 2.1557371732503077e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00017005514325642873, + "loss": 0.0282, "step": 171710 }, { - "epoch": 1.86, - "learning_rate": 2.1541155866900173e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.0001700475755634147, + "loss": 0.0125, "step": 171720 }, { - "epoch": 1.86, - "learning_rate": 2.1524940001297265e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00017004000787040072, + "loss": 0.0127, "step": 171730 }, { - "epoch": 1.86, - "learning_rate": 2.1508724135694365e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.0001700324401773867, + "loss": 0.0111, "step": 171740 }, { - "epoch": 1.86, - "learning_rate": 2.1492508270091458e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00017002487248437268, + "loss": 0.0106, "step": 171750 }, { - "epoch": 1.86, - "learning_rate": 2.147629240448855e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00017001730479135866, + "loss": 0.0117, "step": 171760 }, { - "epoch": 1.86, - "learning_rate": 2.1460076538885647e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.00017000973709834467, + "loss": 0.0125, "step": 171770 }, { - "epoch": 1.86, - "learning_rate": 2.144386067328274e-05, - "loss": 0.0047, + "epoch": 0.87, + "learning_rate": 0.00017000216940533065, + "loss": 0.0092, "step": 171780 }, { - "epoch": 1.86, - "learning_rate": 2.1427644807679832e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016999460171231664, + "loss": 0.0109, "step": 171790 }, { - "epoch": 1.86, - "learning_rate": 2.1411428942076928e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016998703401930264, + "loss": 0.0102, "step": 171800 }, { - "epoch": 1.86, - "learning_rate": 2.139521307647402e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00016997946632628863, + "loss": 0.012, "step": 171810 }, { - "epoch": 1.86, - "learning_rate": 2.1378997210871117e-05, - "loss": 0.0091, + "epoch": 0.87, + "learning_rate": 0.0001699718986332746, + "loss": 0.0099, "step": 171820 }, { - "epoch": 1.86, - "learning_rate": 2.136278134526821e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016996433094026062, + "loss": 0.0109, "step": 171830 }, { - "epoch": 1.86, - "learning_rate": 2.1346565479665303e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.0001699567632472466, + "loss": 0.0103, "step": 171840 }, { - "epoch": 1.86, - "learning_rate": 2.13303496140624e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00016994919555423258, + "loss": 0.0121, "step": 171850 }, { - "epoch": 1.86, - "learning_rate": 2.131413374845949e-05, - "loss": 0.0047, + "epoch": 0.87, + "learning_rate": 0.0001699416278612186, + "loss": 0.0107, "step": 171860 }, { - "epoch": 1.86, - "learning_rate": 2.1297917882856584e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.00016993406016820457, + "loss": 0.0111, "step": 171870 }, { - "epoch": 1.86, - "learning_rate": 2.128170201725368e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00016992649247519055, + "loss": 0.009, "step": 171880 }, { - "epoch": 1.86, - "learning_rate": 2.1265486151650773e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016991892478217656, + "loss": 0.0139, "step": 171890 }, { - "epoch": 1.86, - "learning_rate": 2.124927028604787e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.00016991135708916254, + "loss": 0.009, "step": 171900 }, { - "epoch": 1.86, - "learning_rate": 2.1233054420444962e-05, - "loss": 0.0075, + "epoch": 0.87, + "learning_rate": 0.00016990378939614852, + "loss": 0.0108, "step": 171910 }, { - "epoch": 1.86, - "learning_rate": 2.1216838554842055e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.0001698962217031345, + "loss": 0.011, "step": 171920 }, { - "epoch": 1.86, - "learning_rate": 2.120062268923915e-05, - "loss": 0.009, + "epoch": 0.87, + "learning_rate": 0.0001698886540101205, + "loss": 0.0123, "step": 171930 }, { - "epoch": 1.86, - "learning_rate": 2.1184406823636244e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.0001698810863171065, + "loss": 0.0106, "step": 171940 }, { - "epoch": 1.86, - "learning_rate": 2.1168190958033336e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00016987351862409247, + "loss": 0.0106, "step": 171950 }, { - "epoch": 1.86, - "learning_rate": 2.1151975092430432e-05, - "loss": 0.0084, + "epoch": 0.87, + "learning_rate": 0.00016986595093107848, + "loss": 0.0097, "step": 171960 }, { - "epoch": 1.86, - "learning_rate": 2.1135759226827525e-05, - "loss": 0.0036, + "epoch": 0.87, + "learning_rate": 0.00016985838323806446, + "loss": 0.016, "step": 171970 }, { - "epoch": 1.86, - "learning_rate": 2.1119543361224618e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.00016985081554505045, + "loss": 0.0124, "step": 171980 }, { - "epoch": 1.86, - "learning_rate": 2.1103327495621714e-05, - "loss": 0.0076, + "epoch": 0.87, + "learning_rate": 0.00016984324785203645, + "loss": 0.012, "step": 171990 }, { - "epoch": 1.86, - "learning_rate": 2.1087111630018807e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00016983568015902244, + "loss": 0.011, "step": 172000 }, { - "epoch": 1.86, - "eval_cer": 0.9215199856854233, - "eval_loss": 0.005438223015516996, - "eval_runtime": 121.1016, - "eval_samples_per_second": 16.515, - "eval_steps_per_second": 4.129, + "epoch": 0.87, + "eval_cer": 0.9145003381830497, + "eval_loss": 0.00847652181982994, + "eval_runtime": 116.6974, + "eval_samples_per_second": 17.138, + "eval_steps_per_second": 4.285, "step": 172000 }, { - "epoch": 1.86, - "learning_rate": 2.1070895764415903e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016982811246600842, + "loss": 0.0102, "step": 172010 }, { - "epoch": 1.86, - "learning_rate": 2.1054679898812996e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00016982054477299443, + "loss": 0.0126, "step": 172020 }, { - "epoch": 1.86, - "learning_rate": 2.103846403321009e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.0001698129770799804, + "loss": 0.01, "step": 172030 }, { - "epoch": 1.86, - "learning_rate": 2.1022248167607185e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.0001698054093869664, + "loss": 0.0121, "step": 172040 }, { - "epoch": 1.86, - "learning_rate": 2.1006032302004277e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.0001697978416939524, + "loss": 0.0103, "step": 172050 }, { - "epoch": 1.86, - "learning_rate": 2.098981643640137e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00016979027400093838, + "loss": 0.0138, "step": 172060 }, { - "epoch": 1.86, - "learning_rate": 2.0973600570798466e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00016978270630792436, + "loss": 0.0139, "step": 172070 }, { - "epoch": 1.86, - "learning_rate": 2.095738470519556e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016977513861491037, + "loss": 0.0152, "step": 172080 }, { - "epoch": 1.86, - "learning_rate": 2.0941168839592655e-05, - "loss": 0.0087, + "epoch": 0.87, + "learning_rate": 0.00016976757092189635, + "loss": 0.0113, "step": 172090 }, { - "epoch": 1.86, - "learning_rate": 2.092495297398975e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00016976000322888233, + "loss": 0.0123, "step": 172100 }, { - "epoch": 1.86, - "learning_rate": 2.0908737108386847e-05, - "loss": 0.0055, + "epoch": 0.87, + "learning_rate": 0.0001697524355358683, + "loss": 0.0147, "step": 172110 }, { - "epoch": 1.86, - "learning_rate": 2.089252124278394e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00016974486784285432, + "loss": 0.0077, "step": 172120 }, { - "epoch": 1.86, - "learning_rate": 2.0876305377181033e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.0001697373001498403, + "loss": 0.0108, "step": 172130 }, { - "epoch": 1.86, - "learning_rate": 2.086008951157813e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016972973245682628, + "loss": 0.0153, "step": 172140 }, { - "epoch": 1.86, - "learning_rate": 2.084387364597522e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.0001697221647638123, + "loss": 0.01, "step": 172150 }, { - "epoch": 1.86, - "learning_rate": 2.0827657780372314e-05, - "loss": 0.0041, + "epoch": 0.87, + "learning_rate": 0.00016971459707079827, + "loss": 0.0128, "step": 172160 }, { - "epoch": 1.86, - "learning_rate": 2.081144191476941e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016970702937778426, + "loss": 0.0133, "step": 172170 }, { - "epoch": 1.86, - "learning_rate": 2.0795226049166503e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00016969946168477026, + "loss": 0.013, "step": 172180 }, { - "epoch": 1.86, - "learning_rate": 2.07790101835636e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.00016969189399175625, + "loss": 0.0123, "step": 172190 }, { - "epoch": 1.86, - "learning_rate": 2.0762794317960692e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016968432629874223, + "loss": 0.0142, "step": 172200 }, { - "epoch": 1.86, - "learning_rate": 2.0746578452357785e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00016967675860572824, + "loss": 0.0098, "step": 172210 }, { - "epoch": 1.86, - "learning_rate": 2.073036258675488e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.00016966919091271422, + "loss": 0.0096, "step": 172220 }, { - "epoch": 1.86, - "learning_rate": 2.0714146721151974e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.0001696616232197002, + "loss": 0.0123, "step": 172230 }, { - "epoch": 1.86, - "learning_rate": 2.0697930855549067e-05, - "loss": 0.0052, + "epoch": 0.87, + "learning_rate": 0.0001696540555266862, + "loss": 0.0134, "step": 172240 }, { - "epoch": 1.86, - "learning_rate": 2.0681714989946163e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.0001696464878336722, + "loss": 0.0133, "step": 172250 }, { - "epoch": 1.86, - "learning_rate": 2.0665499124343255e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016963892014065817, + "loss": 0.0122, "step": 172260 }, { - "epoch": 1.86, - "learning_rate": 2.0649283258740348e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016963135244764415, + "loss": 0.0126, "step": 172270 }, { - "epoch": 1.86, - "learning_rate": 2.0633067393137444e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016962378475463016, + "loss": 0.0114, "step": 172280 }, { - "epoch": 1.86, - "learning_rate": 2.0616851527534537e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016961621706161614, + "loss": 0.0126, "step": 172290 }, { - "epoch": 1.86, - "learning_rate": 2.0600635661931633e-05, - "loss": 0.0091, + "epoch": 0.87, + "learning_rate": 0.00016960864936860212, + "loss": 0.0121, "step": 172300 }, { - "epoch": 1.86, - "learning_rate": 2.0584419796328726e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00016960108167558813, + "loss": 0.0157, "step": 172310 }, { - "epoch": 1.86, - "learning_rate": 2.056820393072582e-05, - "loss": 0.008, + "epoch": 0.87, + "learning_rate": 0.0001695935139825741, + "loss": 0.0136, "step": 172320 }, { - "epoch": 1.86, - "learning_rate": 2.0551988065122915e-05, - "loss": 0.0119, + "epoch": 0.87, + "learning_rate": 0.0001695859462895601, + "loss": 0.0127, "step": 172330 }, { - "epoch": 1.86, - "learning_rate": 2.0535772199520008e-05, - "loss": 0.0075, + "epoch": 0.87, + "learning_rate": 0.0001695783785965461, + "loss": 0.0127, "step": 172340 }, { - "epoch": 1.86, - "learning_rate": 2.05195563339171e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016957081090353208, + "loss": 0.0112, "step": 172350 }, { - "epoch": 1.86, - "learning_rate": 2.0503340468314196e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016956324321051807, + "loss": 0.0104, "step": 172360 }, { - "epoch": 1.86, - "learning_rate": 2.048712460271129e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.00016955567551750407, + "loss": 0.0099, "step": 172370 }, { - "epoch": 1.86, - "learning_rate": 2.0470908737108385e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00016954810782449006, + "loss": 0.0114, "step": 172380 }, { - "epoch": 1.86, - "learning_rate": 2.0454692871505478e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00016954054013147604, + "loss": 0.013, "step": 172390 }, { - "epoch": 1.86, - "learning_rate": 2.043847700590257e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016953297243846205, + "loss": 0.0135, "step": 172400 }, { - "epoch": 1.86, - "learning_rate": 2.0422261140299667e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00016952540474544803, + "loss": 0.0131, "step": 172410 }, { - "epoch": 1.86, - "learning_rate": 2.040604527469676e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.000169517837052434, + "loss": 0.0124, "step": 172420 }, { - "epoch": 1.86, - "learning_rate": 2.0389829409093852e-05, - "loss": 0.0073, + "epoch": 0.87, + "learning_rate": 0.00016951026935942, + "loss": 0.0106, "step": 172430 }, { - "epoch": 1.86, - "learning_rate": 2.037361354349095e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.000169502701666406, + "loss": 0.0102, "step": 172440 }, { - "epoch": 1.86, - "learning_rate": 2.035739767788804e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.00016949513397339198, + "loss": 0.0116, "step": 172450 }, { - "epoch": 1.86, - "learning_rate": 2.034118181228514e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00016948756628037796, + "loss": 0.0109, "step": 172460 }, { - "epoch": 1.86, - "learning_rate": 2.0324965946682234e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016947999858736397, + "loss": 0.0129, "step": 172470 }, { - "epoch": 1.86, - "learning_rate": 2.030875008107933e-05, - "loss": 0.0087, + "epoch": 0.87, + "learning_rate": 0.00016947243089434995, + "loss": 0.0124, "step": 172480 }, { - "epoch": 1.86, - "learning_rate": 2.0292534215476422e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016946486320133593, + "loss": 0.0147, "step": 172490 }, { - "epoch": 1.86, - "learning_rate": 2.0276318349873515e-05, - "loss": 0.0045, + "epoch": 0.87, + "learning_rate": 0.00016945729550832194, + "loss": 0.0126, "step": 172500 }, { - "epoch": 1.86, - "learning_rate": 2.026010248427061e-05, - "loss": 0.0052, + "epoch": 0.87, + "learning_rate": 0.00016944972781530792, + "loss": 0.0113, "step": 172510 }, { - "epoch": 1.87, - "learning_rate": 2.0243886618667704e-05, - "loss": 0.0047, + "epoch": 0.87, + "learning_rate": 0.0001694421601222939, + "loss": 0.0116, "step": 172520 }, { - "epoch": 1.87, - "learning_rate": 2.0227670753064797e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.0001694345924292799, + "loss": 0.0178, "step": 172530 }, { - "epoch": 1.87, - "learning_rate": 2.0211454887461893e-05, - "loss": 0.0075, + "epoch": 0.87, + "learning_rate": 0.0001694270247362659, + "loss": 0.0161, "step": 172540 }, { - "epoch": 1.87, - "learning_rate": 2.0195239021858986e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016941945704325188, + "loss": 0.0105, "step": 172550 }, { - "epoch": 1.87, - "learning_rate": 2.017902315625608e-05, - "loss": 0.0049, + "epoch": 0.87, + "learning_rate": 0.00016941188935023788, + "loss": 0.0102, "step": 172560 }, { - "epoch": 1.87, - "learning_rate": 2.0162807290653174e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016940432165722387, + "loss": 0.0096, "step": 172570 }, { - "epoch": 1.87, - "learning_rate": 2.0146591425050267e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00016939675396420985, + "loss": 0.0099, "step": 172580 }, { - "epoch": 1.87, - "learning_rate": 2.0130375559447363e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016938918627119583, + "loss": 0.012, "step": 172590 }, { - "epoch": 1.87, - "learning_rate": 2.0114159693844456e-05, - "loss": 0.005, + "epoch": 0.87, + "learning_rate": 0.00016938161857818184, + "loss": 0.0118, "step": 172600 }, { - "epoch": 1.87, - "learning_rate": 2.009794382824155e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00016937405088516782, + "loss": 0.0129, "step": 172610 }, { - "epoch": 1.87, - "learning_rate": 2.0081727962638645e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.0001693664831921538, + "loss": 0.0124, "step": 172620 }, { - "epoch": 1.87, - "learning_rate": 2.0065512097035738e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.0001693589154991398, + "loss": 0.0109, "step": 172630 }, { - "epoch": 1.87, - "learning_rate": 2.004929623143283e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.0001693513478061258, + "loss": 0.0111, "step": 172640 }, { - "epoch": 1.87, - "learning_rate": 2.0033080365829927e-05, - "loss": 0.0073, + "epoch": 0.87, + "learning_rate": 0.00016934378011311177, + "loss": 0.0121, "step": 172650 }, { - "epoch": 1.87, - "learning_rate": 2.001686450022702e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016933621242009778, + "loss": 0.0125, "step": 172660 }, { - "epoch": 1.87, - "learning_rate": 2.0000648634624115e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00016932864472708376, + "loss": 0.0118, "step": 172670 }, { - "epoch": 1.87, - "learning_rate": 1.9984432769021208e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016932107703406974, + "loss": 0.0128, "step": 172680 }, { - "epoch": 1.87, - "learning_rate": 1.99682169034183e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016931350934105575, + "loss": 0.0122, "step": 172690 }, { - "epoch": 1.87, - "learning_rate": 1.9952001037815397e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00016930594164804173, + "loss": 0.012, "step": 172700 }, { - "epoch": 1.87, - "learning_rate": 1.993578517221249e-05, - "loss": 0.0112, + "epoch": 0.87, + "learning_rate": 0.00016929837395502771, + "loss": 0.0111, "step": 172710 }, { - "epoch": 1.87, - "learning_rate": 1.9919569306609583e-05, - "loss": 0.0088, + "epoch": 0.87, + "learning_rate": 0.00016929080626201372, + "loss": 0.012, "step": 172720 }, { - "epoch": 1.87, - "learning_rate": 1.990335344100668e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.0001692832385689997, + "loss": 0.0109, "step": 172730 }, { - "epoch": 1.87, - "learning_rate": 1.988713757540377e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016927567087598569, + "loss": 0.0133, "step": 172740 }, { - "epoch": 1.87, - "learning_rate": 1.9870921709800868e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.0001692681031829717, + "loss": 0.0126, "step": 172750 }, { - "epoch": 1.87, - "learning_rate": 1.985470584419796e-05, - "loss": 0.005, + "epoch": 0.87, + "learning_rate": 0.00016926053548995768, + "loss": 0.0131, "step": 172760 }, { - "epoch": 1.87, - "learning_rate": 1.9838489978595053e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016925296779694366, + "loss": 0.0128, "step": 172770 }, { - "epoch": 1.87, - "learning_rate": 1.982227411299215e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.00016924540010392964, + "loss": 0.0091, "step": 172780 }, { - "epoch": 1.87, - "learning_rate": 1.9806058247389242e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.00016923783241091565, + "loss": 0.0085, "step": 172790 }, { - "epoch": 1.87, - "learning_rate": 1.9789842381786335e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00016923026471790163, + "loss": 0.0116, "step": 172800 }, { - "epoch": 1.87, - "learning_rate": 1.977362651618343e-05, - "loss": 0.0085, + "epoch": 0.87, + "learning_rate": 0.0001692226970248876, + "loss": 0.0147, "step": 172810 }, { - "epoch": 1.87, - "learning_rate": 1.9757410650580527e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016921512933187362, + "loss": 0.0115, "step": 172820 }, { - "epoch": 1.87, - "learning_rate": 1.9741194784977623e-05, - "loss": 0.0046, + "epoch": 0.87, + "learning_rate": 0.00016920756163885957, + "loss": 0.0095, "step": 172830 }, { - "epoch": 1.87, - "learning_rate": 1.9724978919374716e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00016919999394584555, + "loss": 0.012, "step": 172840 }, { - "epoch": 1.87, - "learning_rate": 1.970876305377181e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00016919242625283154, + "loss": 0.0104, "step": 172850 }, { - "epoch": 1.87, - "learning_rate": 1.9692547188168905e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.00016918485855981754, + "loss": 0.011, "step": 172860 }, { - "epoch": 1.87, - "learning_rate": 1.9676331322565997e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016917729086680353, + "loss": 0.0128, "step": 172870 }, { - "epoch": 1.87, - "learning_rate": 1.9660115456963094e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.0001691697231737895, + "loss": 0.0164, "step": 172880 }, { - "epoch": 1.87, - "learning_rate": 1.9643899591360186e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016916215548077552, + "loss": 0.0117, "step": 172890 }, { - "epoch": 1.87, - "learning_rate": 1.962768372575728e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.0001691545877877615, + "loss": 0.012, "step": 172900 }, { - "epoch": 1.87, - "learning_rate": 1.9611467860154375e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00016914702009474748, + "loss": 0.014, "step": 172910 }, { - "epoch": 1.87, - "learning_rate": 1.9595251994551468e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.0001691394524017335, + "loss": 0.0113, "step": 172920 }, { - "epoch": 1.87, - "learning_rate": 1.957903612894856e-05, - "loss": 0.0114, + "epoch": 0.87, + "learning_rate": 0.00016913188470871947, + "loss": 0.0157, "step": 172930 }, { - "epoch": 1.87, - "learning_rate": 1.9562820263345657e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.00016912431701570545, + "loss": 0.0115, "step": 172940 }, { - "epoch": 1.87, - "learning_rate": 1.954660439774275e-05, - "loss": 0.0048, + "epoch": 0.87, + "learning_rate": 0.00016911674932269146, + "loss": 0.0128, "step": 172950 }, { - "epoch": 1.87, - "learning_rate": 1.9530388532139846e-05, - "loss": 0.0073, + "epoch": 0.87, + "learning_rate": 0.00016910918162967744, + "loss": 0.0118, "step": 172960 }, { - "epoch": 1.87, - "learning_rate": 1.951417266653694e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.00016910161393666342, + "loss": 0.0147, "step": 172970 }, { - "epoch": 1.87, - "learning_rate": 1.949795680093403e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016909404624364943, + "loss": 0.0104, "step": 172980 }, { - "epoch": 1.87, - "learning_rate": 1.9481740935331127e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.0001690864785506354, + "loss": 0.0115, "step": 172990 }, { - "epoch": 1.87, - "learning_rate": 1.946552506972822e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.0001690789108576214, + "loss": 0.0146, "step": 173000 }, { - "epoch": 1.87, - "eval_cer": 0.921521722891336, - "eval_loss": 0.00535942055284977, - "eval_runtime": 121.276, - "eval_samples_per_second": 16.491, - "eval_steps_per_second": 4.123, + "epoch": 0.87, + "eval_cer": 0.9145003381830497, + "eval_loss": 0.008254943415522575, + "eval_runtime": 116.8302, + "eval_samples_per_second": 17.119, + "eval_steps_per_second": 4.28, "step": 173000 }, { - "epoch": 1.87, - "learning_rate": 1.9449309204125313e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016907134316460737, + "loss": 0.0116, "step": 173010 }, { - "epoch": 1.87, - "learning_rate": 1.943309333852241e-05, - "loss": 0.005, + "epoch": 0.87, + "learning_rate": 0.00016906377547159338, + "loss": 0.0118, "step": 173020 }, { - "epoch": 1.87, - "learning_rate": 1.94168774729195e-05, - "loss": 0.0049, + "epoch": 0.87, + "learning_rate": 0.00016905620777857936, + "loss": 0.0114, "step": 173030 }, { - "epoch": 1.87, - "learning_rate": 1.9400661607316598e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016904864008556535, + "loss": 0.0126, "step": 173040 }, { - "epoch": 1.87, - "learning_rate": 1.938444574171369e-05, - "loss": 0.0047, + "epoch": 0.87, + "learning_rate": 0.00016904107239255135, + "loss": 0.0095, "step": 173050 }, { - "epoch": 1.87, - "learning_rate": 1.9368229876110783e-05, - "loss": 0.0048, + "epoch": 0.87, + "learning_rate": 0.00016903350469953734, + "loss": 0.0099, "step": 173060 }, { - "epoch": 1.87, - "learning_rate": 1.935201401050788e-05, - "loss": 0.0075, + "epoch": 0.87, + "learning_rate": 0.00016902593700652332, + "loss": 0.0109, "step": 173070 }, { - "epoch": 1.87, - "learning_rate": 1.9335798144904972e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016901836931350933, + "loss": 0.0124, "step": 173080 }, { - "epoch": 1.87, - "learning_rate": 1.9319582279302065e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.0001690108016204953, + "loss": 0.0124, "step": 173090 }, { - "epoch": 1.87, - "learning_rate": 1.930336641369916e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.0001690032339274813, + "loss": 0.0123, "step": 173100 }, { - "epoch": 1.87, - "learning_rate": 1.9287150548096254e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.0001689956662344673, + "loss": 0.0135, "step": 173110 }, { - "epoch": 1.87, - "learning_rate": 1.927093468249335e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016898809854145328, + "loss": 0.0114, "step": 173120 }, { - "epoch": 1.87, - "learning_rate": 1.9254718816890443e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.00016898053084843926, + "loss": 0.0131, "step": 173130 }, { - "epoch": 1.87, - "learning_rate": 1.9238502951287535e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.00016897296315542527, + "loss": 0.0121, "step": 173140 }, { - "epoch": 1.87, - "learning_rate": 1.922228708568463e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.00016896539546241125, + "loss": 0.0107, "step": 173150 }, { - "epoch": 1.87, - "learning_rate": 1.9206071220081724e-05, - "loss": 0.005, + "epoch": 0.87, + "learning_rate": 0.00016895782776939723, + "loss": 0.0147, "step": 173160 }, { - "epoch": 1.87, - "learning_rate": 1.9189855354478817e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.0001689502600763832, + "loss": 0.0129, "step": 173170 }, { - "epoch": 1.87, - "learning_rate": 1.9173639488875917e-05, - "loss": 0.005, + "epoch": 0.87, + "learning_rate": 0.00016894269238336922, + "loss": 0.0115, "step": 173180 }, { - "epoch": 1.87, - "learning_rate": 1.915742362327301e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.0001689351246903552, + "loss": 0.0149, "step": 173190 }, { - "epoch": 1.87, - "learning_rate": 1.9141207757670105e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.00016892755699734118, + "loss": 0.0107, "step": 173200 }, { - "epoch": 1.87, - "learning_rate": 1.9124991892067198e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.0001689199893043272, + "loss": 0.0116, "step": 173210 }, { - "epoch": 1.87, - "learning_rate": 1.910877602646429e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016891242161131317, + "loss": 0.0092, "step": 173220 }, { - "epoch": 1.87, - "learning_rate": 1.9092560160861387e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.00016890485391829916, + "loss": 0.0112, "step": 173230 }, { - "epoch": 1.87, - "learning_rate": 1.907634429525848e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016889728622528516, + "loss": 0.0091, "step": 173240 }, { - "epoch": 1.87, - "learning_rate": 1.9060128429655576e-05, - "loss": 0.005, + "epoch": 0.87, + "learning_rate": 0.00016888971853227115, + "loss": 0.0133, "step": 173250 }, { - "epoch": 1.87, - "learning_rate": 1.904391256405267e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00016888215083925713, + "loss": 0.0127, "step": 173260 }, { - "epoch": 1.87, - "learning_rate": 1.902769669844976e-05, - "loss": 0.0052, + "epoch": 0.87, + "learning_rate": 0.00016887458314624314, + "loss": 0.0124, "step": 173270 }, { - "epoch": 1.87, - "learning_rate": 1.9011480832846858e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016886701545322912, + "loss": 0.0125, "step": 173280 }, { - "epoch": 1.87, - "learning_rate": 1.899526496724395e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.0001688594477602151, + "loss": 0.0104, "step": 173290 }, { - "epoch": 1.87, - "learning_rate": 1.8979049101641043e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.0001688518800672011, + "loss": 0.0155, "step": 173300 }, { - "epoch": 1.87, - "learning_rate": 1.896283323603814e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.0001688443123741871, + "loss": 0.0156, "step": 173310 }, { - "epoch": 1.87, - "learning_rate": 1.8946617370435232e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016883674468117307, + "loss": 0.0135, "step": 173320 }, { - "epoch": 1.87, - "learning_rate": 1.8930401504832328e-05, - "loss": 0.0081, + "epoch": 0.87, + "learning_rate": 0.00016882917698815905, + "loss": 0.0126, "step": 173330 }, { - "epoch": 1.87, - "learning_rate": 1.891418563922942e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016882160929514506, + "loss": 0.0139, "step": 173340 }, { - "epoch": 1.87, - "learning_rate": 1.8897969773626514e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016881404160213104, + "loss": 0.0113, "step": 173350 }, { - "epoch": 1.87, - "learning_rate": 1.888175390802361e-05, - "loss": 0.0076, + "epoch": 0.87, + "learning_rate": 0.00016880647390911702, + "loss": 0.0099, "step": 173360 }, { - "epoch": 1.87, - "learning_rate": 1.8865538042420702e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016879890621610303, + "loss": 0.0102, "step": 173370 }, { - "epoch": 1.87, - "learning_rate": 1.8849322176817795e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.000168791338523089, + "loss": 0.01, "step": 173380 }, { - "epoch": 1.87, - "learning_rate": 1.883310631121489e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.000168783770830075, + "loss": 0.0125, "step": 173390 }, { - "epoch": 1.87, - "learning_rate": 1.8816890445611984e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.000168776203137061, + "loss": 0.0106, "step": 173400 }, { - "epoch": 1.87, - "learning_rate": 1.880067458000908e-05, - "loss": 0.0122, + "epoch": 0.87, + "learning_rate": 0.00016876863544404698, + "loss": 0.0115, "step": 173410 }, { - "epoch": 1.87, - "learning_rate": 1.8784458714406173e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00016876106775103297, + "loss": 0.0119, "step": 173420 }, { - "epoch": 1.87, - "learning_rate": 1.8768242848803266e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016875350005801897, + "loss": 0.013, "step": 173430 }, { - "epoch": 1.87, - "learning_rate": 1.8752026983200362e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016874593236500496, + "loss": 0.013, "step": 173440 }, { - "epoch": 1.88, - "learning_rate": 1.8735811117597458e-05, - "loss": 0.009, + "epoch": 0.88, + "learning_rate": 0.00016873836467199094, + "loss": 0.012, "step": 173450 }, { - "epoch": 1.88, - "learning_rate": 1.871959525199455e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016873079697897695, + "loss": 0.0103, "step": 173460 }, { - "epoch": 1.88, - "learning_rate": 1.8703379386391643e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016872322928596293, + "loss": 0.0123, "step": 173470 }, { - "epoch": 1.88, - "learning_rate": 1.868716352078874e-05, - "loss": 0.0081, + "epoch": 0.88, + "learning_rate": 0.0001687156615929489, + "loss": 0.0134, "step": 173480 }, { - "epoch": 1.88, - "learning_rate": 1.8670947655185832e-05, - "loss": 0.0079, + "epoch": 0.88, + "learning_rate": 0.0001687080938999349, + "loss": 0.0126, "step": 173490 }, { - "epoch": 1.88, - "learning_rate": 1.8654731789582925e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.0001687005262069209, + "loss": 0.0122, "step": 173500 }, { - "epoch": 1.88, - "learning_rate": 1.863851592398002e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016869295851390688, + "loss": 0.0121, "step": 173510 }, { - "epoch": 1.88, - "learning_rate": 1.8622300058377114e-05, - "loss": 0.0085, + "epoch": 0.88, + "learning_rate": 0.00016868539082089286, + "loss": 0.0143, "step": 173520 }, { - "epoch": 1.88, - "learning_rate": 1.860608419277421e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.00016867782312787887, + "loss": 0.0112, "step": 173530 }, { - "epoch": 1.88, - "learning_rate": 1.8589868327171303e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016867025543486485, + "loss": 0.0152, "step": 173540 }, { - "epoch": 1.88, - "learning_rate": 1.8573652461568395e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016866268774185083, + "loss": 0.0105, "step": 173550 }, { - "epoch": 1.88, - "learning_rate": 1.855743659596549e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016865512004883684, + "loss": 0.0091, "step": 173560 }, { - "epoch": 1.88, - "learning_rate": 1.8541220730362584e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.00016864755235582282, + "loss": 0.01, "step": 173570 }, { - "epoch": 1.88, - "learning_rate": 1.8525004864759677e-05, - "loss": 0.0071, + "epoch": 0.88, + "learning_rate": 0.0001686399846628088, + "loss": 0.0158, "step": 173580 }, { - "epoch": 1.88, - "learning_rate": 1.8508788999156773e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.0001686324169697948, + "loss": 0.01, "step": 173590 }, { - "epoch": 1.88, - "learning_rate": 1.8492573133553866e-05, - "loss": 0.0048, + "epoch": 0.88, + "learning_rate": 0.0001686248492767808, + "loss": 0.0135, "step": 173600 }, { - "epoch": 1.88, - "learning_rate": 1.8476357267950962e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.00016861728158376678, + "loss": 0.0092, "step": 173610 }, { - "epoch": 1.88, - "learning_rate": 1.8460141402348055e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016860971389075278, + "loss": 0.0101, "step": 173620 }, { - "epoch": 1.88, - "learning_rate": 1.844392553674515e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016860214619773877, + "loss": 0.013, "step": 173630 }, { - "epoch": 1.88, - "learning_rate": 1.8427709671142244e-05, - "loss": 0.0077, + "epoch": 0.88, + "learning_rate": 0.00016859457850472475, + "loss": 0.0092, "step": 173640 }, { - "epoch": 1.88, - "learning_rate": 1.841149380553934e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.00016858701081171076, + "loss": 0.0128, "step": 173650 }, { - "epoch": 1.88, - "learning_rate": 1.8395277939936433e-05, - "loss": 0.0074, + "epoch": 0.88, + "learning_rate": 0.00016857944311869674, + "loss": 0.0123, "step": 173660 }, { - "epoch": 1.88, - "learning_rate": 1.8379062074333525e-05, - "loss": 0.0088, + "epoch": 0.88, + "learning_rate": 0.00016857187542568272, + "loss": 0.0131, "step": 173670 }, { - "epoch": 1.88, - "learning_rate": 1.836284620873062e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.0001685643077326687, + "loss": 0.012, "step": 173680 }, { - "epoch": 1.88, - "learning_rate": 1.8346630343127714e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.0001685567400396547, + "loss": 0.0117, "step": 173690 }, { - "epoch": 1.88, - "learning_rate": 1.833041447752481e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.0001685491723466407, + "loss": 0.0113, "step": 173700 }, { - "epoch": 1.88, - "learning_rate": 1.8314198611921903e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.00016854160465362667, + "loss": 0.0143, "step": 173710 }, { - "epoch": 1.88, - "learning_rate": 1.8297982746318996e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016853403696061268, + "loss": 0.0109, "step": 173720 }, { - "epoch": 1.88, - "learning_rate": 1.8281766880716092e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016852646926759866, + "loss": 0.0139, "step": 173730 }, { - "epoch": 1.88, - "learning_rate": 1.8265551015113185e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016851890157458464, + "loss": 0.0117, "step": 173740 }, { - "epoch": 1.88, - "learning_rate": 1.8249335149510277e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016851133388157065, + "loss": 0.0112, "step": 173750 }, { - "epoch": 1.88, - "learning_rate": 1.8233119283907374e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016850376618855663, + "loss": 0.0101, "step": 173760 }, { - "epoch": 1.88, - "learning_rate": 1.8216903418304466e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016849619849554261, + "loss": 0.0126, "step": 173770 }, { - "epoch": 1.88, - "learning_rate": 1.8200687552701562e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016848863080252862, + "loss": 0.0122, "step": 173780 }, { - "epoch": 1.88, - "learning_rate": 1.8184471687098655e-05, - "loss": 0.0045, + "epoch": 0.88, + "learning_rate": 0.0001684810631095146, + "loss": 0.0147, "step": 173790 }, { - "epoch": 1.88, - "learning_rate": 1.8168255821495748e-05, - "loss": 0.0086, + "epoch": 0.88, + "learning_rate": 0.00016847349541650059, + "loss": 0.0124, "step": 173800 }, { - "epoch": 1.88, - "learning_rate": 1.8152039955892844e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.0001684659277234866, + "loss": 0.0127, "step": 173810 }, { - "epoch": 1.88, - "learning_rate": 1.813582409028994e-05, - "loss": 0.0081, + "epoch": 0.88, + "learning_rate": 0.00016845836003047258, + "loss": 0.0084, "step": 173820 }, { - "epoch": 1.88, - "learning_rate": 1.8119608224687033e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.00016845079233745856, + "loss": 0.0099, "step": 173830 }, { - "epoch": 1.88, - "learning_rate": 1.8103392359084126e-05, - "loss": 0.0047, + "epoch": 0.88, + "learning_rate": 0.00016844322464444454, + "loss": 0.0115, "step": 173840 }, { - "epoch": 1.88, - "learning_rate": 1.8087176493481222e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016843565695143055, + "loss": 0.0107, "step": 173850 }, { - "epoch": 1.88, - "learning_rate": 1.8070960627878315e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016842808925841653, + "loss": 0.0147, "step": 173860 }, { - "epoch": 1.88, - "learning_rate": 1.8054744762275407e-05, - "loss": 0.0056, + "epoch": 0.88, + "learning_rate": 0.0001684205215654025, + "loss": 0.0123, "step": 173870 }, { - "epoch": 1.88, - "learning_rate": 1.8038528896672503e-05, - "loss": 0.0056, + "epoch": 0.88, + "learning_rate": 0.00016841295387238852, + "loss": 0.0131, "step": 173880 }, { - "epoch": 1.88, - "learning_rate": 1.8022313031069596e-05, - "loss": 0.0082, + "epoch": 0.88, + "learning_rate": 0.0001684053861793745, + "loss": 0.0166, "step": 173890 }, { - "epoch": 1.88, - "learning_rate": 1.8006097165466692e-05, - "loss": 0.0076, + "epoch": 0.88, + "learning_rate": 0.00016839781848636048, + "loss": 0.0117, "step": 173900 }, { - "epoch": 1.88, - "learning_rate": 1.7989881299863785e-05, - "loss": 0.0071, + "epoch": 0.88, + "learning_rate": 0.0001683902507933465, + "loss": 0.0117, "step": 173910 }, { - "epoch": 1.88, - "learning_rate": 1.7973665434260878e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016838268310033247, + "loss": 0.0101, "step": 173920 }, { - "epoch": 1.88, - "learning_rate": 1.7957449568657974e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016837511540731845, + "loss": 0.0107, "step": 173930 }, { - "epoch": 1.88, - "learning_rate": 1.7941233703055067e-05, - "loss": 0.0049, + "epoch": 0.88, + "learning_rate": 0.00016836754771430446, + "loss": 0.0134, "step": 173940 }, { - "epoch": 1.88, - "learning_rate": 1.792501783745216e-05, - "loss": 0.0082, + "epoch": 0.88, + "learning_rate": 0.00016835998002129044, + "loss": 0.0124, "step": 173950 }, { - "epoch": 1.88, - "learning_rate": 1.7908801971849256e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016835241232827643, + "loss": 0.0116, "step": 173960 }, { - "epoch": 1.88, - "learning_rate": 1.789258610624635e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.00016834484463526243, + "loss": 0.01, "step": 173970 }, { - "epoch": 1.88, - "learning_rate": 1.7876370240643444e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016833727694224842, + "loss": 0.012, "step": 173980 }, { - "epoch": 1.88, - "learning_rate": 1.786015437504054e-05, - "loss": 0.0045, + "epoch": 0.88, + "learning_rate": 0.0001683297092492344, + "loss": 0.012, "step": 173990 }, { - "epoch": 1.88, - "learning_rate": 1.7843938509437633e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016832214155622038, + "loss": 0.0158, "step": 174000 }, { - "epoch": 1.88, - "eval_cer": 0.9215086938469904, - "eval_loss": 0.005281680729240179, - "eval_runtime": 121.3681, - "eval_samples_per_second": 16.479, - "eval_steps_per_second": 4.12, + "epoch": 0.88, + "eval_cer": 0.9144935454101719, + "eval_loss": 0.008368046954274178, + "eval_runtime": 116.7718, + "eval_samples_per_second": 17.127, + "eval_steps_per_second": 4.282, "step": 174000 }, { - "epoch": 1.88, - "learning_rate": 1.7827722643834726e-05, - "loss": 0.0084, + "epoch": 0.88, + "learning_rate": 0.0001683145738632064, + "loss": 0.0139, "step": 174010 }, { - "epoch": 1.88, - "learning_rate": 1.7811506778231822e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016830700617019237, + "loss": 0.0124, "step": 174020 }, { - "epoch": 1.88, - "learning_rate": 1.7795290912628915e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016829943847717835, + "loss": 0.0109, "step": 174030 }, { - "epoch": 1.88, - "learning_rate": 1.7779075047026008e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.00016829187078416436, + "loss": 0.0119, "step": 174040 }, { - "epoch": 1.88, - "learning_rate": 1.7762859181423104e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.00016828430309115034, + "loss": 0.0109, "step": 174050 }, { - "epoch": 1.88, - "learning_rate": 1.7746643315820197e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016827673539813632, + "loss": 0.0111, "step": 174060 }, { - "epoch": 1.88, - "learning_rate": 1.7730427450217293e-05, - "loss": 0.0083, + "epoch": 0.88, + "learning_rate": 0.00016826916770512233, + "loss": 0.0111, "step": 174070 }, { - "epoch": 1.88, - "learning_rate": 1.7714211584614385e-05, - "loss": 0.0115, + "epoch": 0.88, + "learning_rate": 0.00016826160001210828, + "loss": 0.0125, "step": 174080 }, { - "epoch": 1.88, - "learning_rate": 1.7697995719011478e-05, - "loss": 0.0049, + "epoch": 0.88, + "learning_rate": 0.00016825403231909427, + "loss": 0.0105, "step": 174090 }, { - "epoch": 1.88, - "learning_rate": 1.7681779853408574e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016824646462608025, + "loss": 0.0113, "step": 174100 }, { - "epoch": 1.88, - "learning_rate": 1.7665563987805667e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.00016823889693306626, + "loss": 0.01, "step": 174110 }, { - "epoch": 1.88, - "learning_rate": 1.764934812220276e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016823132924005224, + "loss": 0.0127, "step": 174120 }, { - "epoch": 1.88, - "learning_rate": 1.7633132256599856e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016822376154703822, + "loss": 0.0127, "step": 174130 }, { - "epoch": 1.88, - "learning_rate": 1.761691639099695e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016821619385402423, + "loss": 0.0132, "step": 174140 }, { - "epoch": 1.88, - "learning_rate": 1.760070052539404e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.0001682086261610102, + "loss": 0.0115, "step": 174150 }, { - "epoch": 1.88, - "learning_rate": 1.7584484659791138e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.0001682010584679962, + "loss": 0.016, "step": 174160 }, { - "epoch": 1.88, - "learning_rate": 1.7568268794188234e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.0001681934907749822, + "loss": 0.0159, "step": 174170 }, { - "epoch": 1.88, - "learning_rate": 1.7552052928585326e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016818592308196818, + "loss": 0.0128, "step": 174180 }, { - "epoch": 1.88, - "learning_rate": 1.7535837062982423e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016817835538895416, + "loss": 0.0096, "step": 174190 }, { - "epoch": 1.88, - "learning_rate": 1.7519621197379515e-05, - "loss": 0.0091, + "epoch": 0.88, + "learning_rate": 0.00016817078769594017, + "loss": 0.0148, "step": 174200 }, { - "epoch": 1.88, - "learning_rate": 1.7503405331776608e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016816322000292615, + "loss": 0.0113, "step": 174210 }, { - "epoch": 1.88, - "learning_rate": 1.7487189466173704e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016815565230991213, + "loss": 0.0112, "step": 174220 }, { - "epoch": 1.88, - "learning_rate": 1.7470973600570797e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016814808461689811, + "loss": 0.0109, "step": 174230 }, { - "epoch": 1.88, - "learning_rate": 1.745475773496789e-05, - "loss": 0.0071, + "epoch": 0.88, + "learning_rate": 0.00016814051692388412, + "loss": 0.0105, "step": 174240 }, { - "epoch": 1.88, - "learning_rate": 1.7438541869364986e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.0001681329492308701, + "loss": 0.0129, "step": 174250 }, { - "epoch": 1.88, - "learning_rate": 1.742232600376208e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016812538153785609, + "loss": 0.0125, "step": 174260 }, { - "epoch": 1.88, - "learning_rate": 1.7406110138159175e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.0001681178138448421, + "loss": 0.01, "step": 174270 }, { - "epoch": 1.88, - "learning_rate": 1.7389894272556267e-05, - "loss": 0.0044, + "epoch": 0.88, + "learning_rate": 0.00016811024615182808, + "loss": 0.0126, "step": 174280 }, { - "epoch": 1.88, - "learning_rate": 1.737367840695336e-05, - "loss": 0.0084, + "epoch": 0.88, + "learning_rate": 0.00016810267845881406, + "loss": 0.0113, "step": 174290 }, { - "epoch": 1.88, - "learning_rate": 1.7357462541350456e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.00016809511076580007, + "loss": 0.0104, "step": 174300 }, { - "epoch": 1.88, - "learning_rate": 1.734124667574755e-05, - "loss": 0.0085, + "epoch": 0.88, + "learning_rate": 0.00016808754307278605, + "loss": 0.0091, "step": 174310 }, { - "epoch": 1.88, - "learning_rate": 1.7325030810144642e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016807997537977203, + "loss": 0.0122, "step": 174320 }, { - "epoch": 1.88, - "learning_rate": 1.7308814944541738e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.00016807240768675804, + "loss": 0.0118, "step": 174330 }, { - "epoch": 1.88, - "learning_rate": 1.729259907893883e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016806483999374402, + "loss": 0.0109, "step": 174340 }, { - "epoch": 1.88, - "learning_rate": 1.7276383213335927e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.00016805727230073, + "loss": 0.0142, "step": 174350 }, { - "epoch": 1.88, - "learning_rate": 1.7260167347733023e-05, - "loss": 0.0084, + "epoch": 0.88, + "learning_rate": 0.000168049704607716, + "loss": 0.0124, "step": 174360 }, { - "epoch": 1.89, - "learning_rate": 1.7243951482130116e-05, - "loss": 0.0056, + "epoch": 0.88, + "learning_rate": 0.000168042136914702, + "loss": 0.0108, "step": 174370 }, { - "epoch": 1.89, - "learning_rate": 1.722773561652721e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016803456922168797, + "loss": 0.0127, "step": 174380 }, { - "epoch": 1.89, - "learning_rate": 1.7211519750924305e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.00016802700152867395, + "loss": 0.0171, "step": 174390 }, { - "epoch": 1.89, - "learning_rate": 1.7195303885321397e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016801943383565996, + "loss": 0.0124, "step": 174400 }, { - "epoch": 1.89, - "learning_rate": 1.717908801971849e-05, - "loss": 0.0078, + "epoch": 0.88, + "learning_rate": 0.00016801186614264594, + "loss": 0.012, "step": 174410 }, { - "epoch": 1.89, - "learning_rate": 1.7162872154115586e-05, - "loss": 0.0071, + "epoch": 0.88, + "learning_rate": 0.00016800429844963192, + "loss": 0.0125, "step": 174420 }, { - "epoch": 1.89, - "learning_rate": 1.714665628851268e-05, - "loss": 0.0049, + "epoch": 0.88, + "learning_rate": 0.00016799673075661793, + "loss": 0.0132, "step": 174430 }, { - "epoch": 1.89, - "learning_rate": 1.713044042290977e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.00016798916306360391, + "loss": 0.0117, "step": 174440 }, { - "epoch": 1.89, - "learning_rate": 1.7114224557306868e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.0001679815953705899, + "loss": 0.0106, "step": 174450 }, { - "epoch": 1.89, - "learning_rate": 1.709800869170396e-05, - "loss": 0.0086, + "epoch": 0.88, + "learning_rate": 0.0001679740276775759, + "loss": 0.0155, "step": 174460 }, { - "epoch": 1.89, - "learning_rate": 1.7081792826101057e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.00016796645998456189, + "loss": 0.0109, "step": 174470 }, { - "epoch": 1.89, - "learning_rate": 1.706557696049815e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016795889229154787, + "loss": 0.0123, "step": 174480 }, { - "epoch": 1.89, - "learning_rate": 1.7049361094895242e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016795132459853388, + "loss": 0.0099, "step": 174490 }, { - "epoch": 1.89, - "learning_rate": 1.7033145229292338e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016794375690551986, + "loss": 0.0129, "step": 174500 }, { - "epoch": 1.89, - "learning_rate": 1.701692936368943e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.00016793618921250584, + "loss": 0.0128, "step": 174510 }, { - "epoch": 1.89, - "learning_rate": 1.7000713498086524e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016792862151949185, + "loss": 0.0121, "step": 174520 }, { - "epoch": 1.89, - "learning_rate": 1.698449763248362e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016792105382647783, + "loss": 0.0142, "step": 174530 }, { - "epoch": 1.89, - "learning_rate": 1.6968281766880716e-05, - "loss": 0.0086, + "epoch": 0.88, + "learning_rate": 0.0001679134861334638, + "loss": 0.0112, "step": 174540 }, { - "epoch": 1.89, - "learning_rate": 1.695206590127781e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016790591844044982, + "loss": 0.0118, "step": 174550 }, { - "epoch": 1.89, - "learning_rate": 1.6935850035674905e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.0001678983507474358, + "loss": 0.0131, "step": 174560 }, { - "epoch": 1.89, - "learning_rate": 1.6919634170071998e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016789078305442178, + "loss": 0.0134, "step": 174570 }, { - "epoch": 1.89, - "learning_rate": 1.690341830446909e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016788321536140776, + "loss": 0.0129, "step": 174580 }, { - "epoch": 1.89, - "learning_rate": 1.6887202438866187e-05, - "loss": 0.0077, + "epoch": 0.88, + "learning_rate": 0.00016787564766839377, + "loss": 0.0142, "step": 174590 }, { - "epoch": 1.89, - "learning_rate": 1.687098657326328e-05, - "loss": 0.0076, + "epoch": 0.88, + "learning_rate": 0.00016786807997537975, + "loss": 0.0105, "step": 174600 }, { - "epoch": 1.89, - "learning_rate": 1.6854770707660372e-05, - "loss": 0.004, + "epoch": 0.88, + "learning_rate": 0.00016786051228236573, + "loss": 0.0125, "step": 174610 }, { - "epoch": 1.89, - "learning_rate": 1.6838554842057468e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016785294458935174, + "loss": 0.0111, "step": 174620 }, { - "epoch": 1.89, - "learning_rate": 1.682233897645456e-05, - "loss": 0.0075, + "epoch": 0.88, + "learning_rate": 0.00016784537689633772, + "loss": 0.0116, "step": 174630 }, { - "epoch": 1.89, - "learning_rate": 1.6806123110851657e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.0001678378092033237, + "loss": 0.0102, "step": 174640 }, { - "epoch": 1.89, - "learning_rate": 1.678990724524875e-05, - "loss": 0.0075, + "epoch": 0.88, + "learning_rate": 0.00016783024151030971, + "loss": 0.012, "step": 174650 }, { - "epoch": 1.89, - "learning_rate": 1.6773691379645842e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.0001678226738172957, + "loss": 0.0114, "step": 174660 }, { - "epoch": 1.89, - "learning_rate": 1.675747551404294e-05, - "loss": 0.007, + "epoch": 0.88, + "learning_rate": 0.00016781510612428168, + "loss": 0.0125, "step": 174670 }, { - "epoch": 1.89, - "learning_rate": 1.674125964844003e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.00016780753843126769, + "loss": 0.0111, "step": 174680 }, { - "epoch": 1.89, - "learning_rate": 1.6725043782837124e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.00016779997073825367, + "loss": 0.0131, "step": 174690 }, { - "epoch": 1.89, - "learning_rate": 1.670882791723422e-05, - "loss": 0.0075, + "epoch": 0.88, + "learning_rate": 0.00016779240304523965, + "loss": 0.0107, "step": 174700 }, { - "epoch": 1.89, - "learning_rate": 1.6692612051631316e-05, - "loss": 0.007, + "epoch": 0.88, + "learning_rate": 0.00016778483535222566, + "loss": 0.0114, "step": 174710 }, { - "epoch": 1.89, - "learning_rate": 1.667639618602841e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016777726765921164, + "loss": 0.0112, "step": 174720 }, { - "epoch": 1.89, - "learning_rate": 1.6660180320425505e-05, - "loss": 0.007, + "epoch": 0.88, + "learning_rate": 0.00016776969996619762, + "loss": 0.0146, "step": 174730 }, { - "epoch": 1.89, - "learning_rate": 1.6643964454822598e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.0001677621322731836, + "loss": 0.0094, "step": 174740 }, { - "epoch": 1.89, - "learning_rate": 1.662774858921969e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.0001677545645801696, + "loss": 0.0108, "step": 174750 }, { - "epoch": 1.89, - "learning_rate": 1.6611532723616787e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.0001677469968871556, + "loss": 0.0112, "step": 174760 }, { - "epoch": 1.89, - "learning_rate": 1.659531685801388e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016773942919414157, + "loss": 0.0125, "step": 174770 }, { - "epoch": 1.89, - "learning_rate": 1.6579100992410972e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016773186150112758, + "loss": 0.0134, "step": 174780 }, { - "epoch": 1.89, - "learning_rate": 1.656288512680807e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016772429380811356, + "loss": 0.0144, "step": 174790 }, { - "epoch": 1.89, - "learning_rate": 1.654666926120516e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016771672611509954, + "loss": 0.0119, "step": 174800 }, { - "epoch": 1.89, - "learning_rate": 1.6530453395602254e-05, - "loss": 0.0038, + "epoch": 0.88, + "learning_rate": 0.00016770915842208555, + "loss": 0.0101, "step": 174810 }, { - "epoch": 1.89, - "learning_rate": 1.651423752999935e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016770159072907153, + "loss": 0.0094, "step": 174820 }, { - "epoch": 1.89, - "learning_rate": 1.6498021664396443e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016769402303605752, + "loss": 0.0108, "step": 174830 }, { - "epoch": 1.89, - "learning_rate": 1.648180579879354e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.00016768645534304352, + "loss": 0.0135, "step": 174840 }, { - "epoch": 1.89, - "learning_rate": 1.6465589933190632e-05, - "loss": 0.0083, + "epoch": 0.88, + "learning_rate": 0.0001676788876500295, + "loss": 0.012, "step": 174850 }, { - "epoch": 1.89, - "learning_rate": 1.6449374067587724e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.0001676713199570155, + "loss": 0.0097, "step": 174860 }, { - "epoch": 1.89, - "learning_rate": 1.643315820198482e-05, - "loss": 0.0047, + "epoch": 0.88, + "learning_rate": 0.0001676637522640015, + "loss": 0.0116, "step": 174870 }, { - "epoch": 1.89, - "learning_rate": 1.6416942336381917e-05, - "loss": 0.004, + "epoch": 0.88, + "learning_rate": 0.00016765618457098748, + "loss": 0.0154, "step": 174880 }, { - "epoch": 1.89, - "learning_rate": 1.640072647077901e-05, - "loss": 0.0085, + "epoch": 0.88, + "learning_rate": 0.00016764861687797346, + "loss": 0.0117, "step": 174890 }, { - "epoch": 1.89, - "learning_rate": 1.6384510605176102e-05, - "loss": 0.0047, + "epoch": 0.88, + "learning_rate": 0.00016764104918495944, + "loss": 0.0136, "step": 174900 }, { - "epoch": 1.89, - "learning_rate": 1.63682947395732e-05, - "loss": 0.0077, + "epoch": 0.88, + "learning_rate": 0.00016763348149194545, + "loss": 0.0115, "step": 174910 }, { - "epoch": 1.89, - "learning_rate": 1.635207887397029e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.00016762591379893143, + "loss": 0.0115, "step": 174920 }, { - "epoch": 1.89, - "learning_rate": 1.6335863008367387e-05, - "loss": 0.0075, + "epoch": 0.88, + "learning_rate": 0.0001676183461059174, + "loss": 0.0157, "step": 174930 }, { - "epoch": 1.89, - "learning_rate": 1.631964714276448e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.00016761077841290342, + "loss": 0.0141, "step": 174940 }, { - "epoch": 1.89, - "learning_rate": 1.6303431277161573e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.0001676032107198894, + "loss": 0.0148, "step": 174950 }, { - "epoch": 1.89, - "learning_rate": 1.628721541155867e-05, - "loss": 0.0086, + "epoch": 0.88, + "learning_rate": 0.00016759564302687538, + "loss": 0.0887, "step": 174960 }, { - "epoch": 1.89, - "learning_rate": 1.627099954595576e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.0001675880753338614, + "loss": 0.0107, "step": 174970 }, { - "epoch": 1.89, - "learning_rate": 1.6254783680352854e-05, - "loss": 0.007, + "epoch": 0.88, + "learning_rate": 0.00016758050764084737, + "loss": 0.0109, "step": 174980 }, { - "epoch": 1.89, - "learning_rate": 1.623856781474995e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.00016757293994783335, + "loss": 0.0149, "step": 174990 }, { - "epoch": 1.89, - "learning_rate": 1.6222351949147043e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.00016756537225481936, + "loss": 0.0152, "step": 175000 }, { - "epoch": 1.89, - "eval_cer": 0.9215121682588159, - "eval_loss": 0.005301313009113073, - "eval_runtime": 121.5762, - "eval_samples_per_second": 16.451, - "eval_steps_per_second": 4.113, + "epoch": 0.88, + "eval_cer": 0.9144993677869243, + "eval_loss": 0.008513858541846275, + "eval_runtime": 116.6209, + "eval_samples_per_second": 17.15, + "eval_steps_per_second": 4.287, "step": 175000 }, { - "epoch": 1.89, - "learning_rate": 1.620613608354414e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016755780456180534, + "loss": 0.011, "step": 175010 }, { - "epoch": 1.89, - "learning_rate": 1.6189920217941232e-05, - "loss": 0.0077, + "epoch": 0.88, + "learning_rate": 0.00016755023686879133, + "loss": 0.0107, "step": 175020 }, { - "epoch": 1.89, - "learning_rate": 1.6173704352338325e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.00016754266917577733, + "loss": 0.0094, "step": 175030 }, { - "epoch": 1.89, - "learning_rate": 1.615748848673542e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016753510148276332, + "loss": 0.0135, "step": 175040 }, { - "epoch": 1.89, - "learning_rate": 1.6141272621132514e-05, - "loss": 0.0046, + "epoch": 0.88, + "learning_rate": 0.0001675275337897493, + "loss": 0.0135, "step": 175050 }, { - "epoch": 1.89, - "learning_rate": 1.612505675552961e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.0001675199660967353, + "loss": 0.0105, "step": 175060 }, { - "epoch": 1.89, - "learning_rate": 1.6108840889926703e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.0001675123984037213, + "loss": 0.0112, "step": 175070 }, { - "epoch": 1.89, - "learning_rate": 1.60926250243238e-05, - "loss": 0.0083, + "epoch": 0.88, + "learning_rate": 0.00016750483071070727, + "loss": 0.0127, "step": 175080 }, { - "epoch": 1.89, - "learning_rate": 1.607640915872089e-05, - "loss": 0.0074, + "epoch": 0.88, + "learning_rate": 0.00016749726301769325, + "loss": 0.0088, "step": 175090 }, { - "epoch": 1.89, - "learning_rate": 1.6060193293117984e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016748969532467926, + "loss": 0.013, "step": 175100 }, { - "epoch": 1.89, - "learning_rate": 1.604397742751508e-05, - "loss": 0.0108, + "epoch": 0.88, + "learning_rate": 0.00016748212763166524, + "loss": 0.0099, "step": 175110 }, { - "epoch": 1.89, - "learning_rate": 1.6027761561912173e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016747455993865122, + "loss": 0.0102, "step": 175120 }, { - "epoch": 1.89, - "learning_rate": 1.601154569630927e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016746699224563723, + "loss": 0.0136, "step": 175130 }, { - "epoch": 1.89, - "learning_rate": 1.5995329830706362e-05, - "loss": 0.0056, + "epoch": 0.88, + "learning_rate": 0.0001674594245526232, + "loss": 0.01, "step": 175140 }, { - "epoch": 1.89, - "learning_rate": 1.5979113965103455e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.0001674518568596092, + "loss": 0.0104, "step": 175150 }, { - "epoch": 1.89, - "learning_rate": 1.596289809950055e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.0001674442891665952, + "loss": 0.0131, "step": 175160 }, { - "epoch": 1.89, - "learning_rate": 1.5946682233897644e-05, - "loss": 0.0082, + "epoch": 0.88, + "learning_rate": 0.00016743672147358118, + "loss": 0.0118, "step": 175170 }, { - "epoch": 1.89, - "learning_rate": 1.5930466368294736e-05, - "loss": 0.0071, + "epoch": 0.88, + "learning_rate": 0.00016742915378056716, + "loss": 0.0116, "step": 175180 }, { - "epoch": 1.89, - "learning_rate": 1.5914250502691832e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016742158608755317, + "loss": 0.0102, "step": 175190 }, { - "epoch": 1.89, - "learning_rate": 1.5898034637088925e-05, - "loss": 0.0081, + "epoch": 0.88, + "learning_rate": 0.00016741401839453915, + "loss": 0.0098, "step": 175200 }, { - "epoch": 1.89, - "learning_rate": 1.588181877148602e-05, - "loss": 0.0079, + "epoch": 0.88, + "learning_rate": 0.00016740645070152514, + "loss": 0.0161, "step": 175210 }, { - "epoch": 1.89, - "learning_rate": 1.5865602905883114e-05, - "loss": 0.0079, + "epoch": 0.88, + "learning_rate": 0.00016739888300851114, + "loss": 0.0142, "step": 175220 }, { - "epoch": 1.89, - "learning_rate": 1.5849387040280207e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.00016739131531549713, + "loss": 0.0103, "step": 175230 }, { - "epoch": 1.89, - "learning_rate": 1.5833171174677303e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.0001673837476224831, + "loss": 0.0101, "step": 175240 }, { - "epoch": 1.89, - "learning_rate": 1.58169553090744e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.0001673761799294691, + "loss": 0.0103, "step": 175250 }, { - "epoch": 1.89, - "learning_rate": 1.5800739443471492e-05, - "loss": 0.0075, + "epoch": 0.88, + "learning_rate": 0.0001673686122364551, + "loss": 0.0115, "step": 175260 }, { - "epoch": 1.89, - "learning_rate": 1.5784523577868585e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016736104454344108, + "loss": 0.0131, "step": 175270 }, { - "epoch": 1.89, - "learning_rate": 1.576830771226568e-05, - "loss": 0.008, + "epoch": 0.88, + "learning_rate": 0.00016735347685042706, + "loss": 0.0109, "step": 175280 }, { - "epoch": 1.89, - "learning_rate": 1.5752091846662773e-05, - "loss": 0.009, + "epoch": 0.88, + "learning_rate": 0.00016734590915741307, + "loss": 0.0166, "step": 175290 }, { - "epoch": 1.9, - "learning_rate": 1.573587598105987e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.00016733834146439905, + "loss": 0.0112, "step": 175300 }, { - "epoch": 1.9, - "learning_rate": 1.5719660115456962e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.00016733077377138503, + "loss": 0.0108, "step": 175310 }, { - "epoch": 1.9, - "learning_rate": 1.5703444249854055e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016732320607837104, + "loss": 0.0121, "step": 175320 }, { - "epoch": 1.9, - "learning_rate": 1.568722838425115e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016731563838535702, + "loss": 0.0146, "step": 175330 }, { - "epoch": 1.9, - "learning_rate": 1.5671012518648244e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016730807069234298, + "loss": 0.0115, "step": 175340 }, { - "epoch": 1.9, - "learning_rate": 1.5654796653045337e-05, - "loss": 0.0086, + "epoch": 0.88, + "learning_rate": 0.00016730050299932896, + "loss": 0.01, "step": 175350 }, { - "epoch": 1.9, - "learning_rate": 1.5638580787442433e-05, - "loss": 0.0076, + "epoch": 0.88, + "learning_rate": 0.00016729293530631497, + "loss": 0.0127, "step": 175360 }, { - "epoch": 1.9, - "learning_rate": 1.5622364921839526e-05, - "loss": 0.0082, + "epoch": 0.88, + "learning_rate": 0.00016728536761330095, + "loss": 0.0126, "step": 175370 }, { - "epoch": 1.9, - "learning_rate": 1.5606149056236618e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016727779992028693, + "loss": 0.0124, "step": 175380 }, { - "epoch": 1.9, - "learning_rate": 1.5589933190633714e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016727023222727294, + "loss": 0.0123, "step": 175390 }, { - "epoch": 1.9, - "learning_rate": 1.5573717325030807e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016726266453425892, + "loss": 0.0139, "step": 175400 }, { - "epoch": 1.9, - "learning_rate": 1.5557501459427903e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.0001672550968412449, + "loss": 0.0119, "step": 175410 }, { - "epoch": 1.9, - "learning_rate": 1.5541285593825e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.0001672475291482309, + "loss": 0.0114, "step": 175420 }, { - "epoch": 1.9, - "learning_rate": 1.5525069728222092e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.0001672399614552169, + "loss": 0.0104, "step": 175430 }, { - "epoch": 1.9, - "learning_rate": 1.5508853862619185e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016723239376220287, + "loss": 0.0096, "step": 175440 }, { - "epoch": 1.9, - "learning_rate": 1.549263799701628e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016722482606918888, + "loss": 0.0138, "step": 175450 }, { - "epoch": 1.9, - "learning_rate": 1.5476422131413374e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016721725837617486, + "loss": 0.0134, "step": 175460 }, { - "epoch": 1.9, - "learning_rate": 1.5460206265810467e-05, - "loss": 0.008, + "epoch": 0.89, + "learning_rate": 0.00016720969068316084, + "loss": 0.01, "step": 175470 }, { - "epoch": 1.9, - "learning_rate": 1.5443990400207563e-05, - "loss": 0.0045, + "epoch": 0.89, + "learning_rate": 0.00016720212299014682, + "loss": 0.0178, "step": 175480 }, { - "epoch": 1.9, - "learning_rate": 1.5427774534604655e-05, - "loss": 0.0078, + "epoch": 0.89, + "learning_rate": 0.00016719455529713283, + "loss": 0.0152, "step": 175490 }, { - "epoch": 1.9, - "learning_rate": 1.541155866900175e-05, - "loss": 0.0044, + "epoch": 0.89, + "learning_rate": 0.00016718698760411881, + "loss": 0.0124, "step": 175500 }, { - "epoch": 1.9, - "learning_rate": 1.5395342803398844e-05, - "loss": 0.0089, + "epoch": 0.89, + "learning_rate": 0.0001671794199111048, + "loss": 0.0128, "step": 175510 }, { - "epoch": 1.9, - "learning_rate": 1.5379126937795937e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.0001671718522180908, + "loss": 0.0107, "step": 175520 }, { - "epoch": 1.9, - "learning_rate": 1.5362911072193033e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016716428452507679, + "loss": 0.0123, "step": 175530 }, { - "epoch": 1.9, - "learning_rate": 1.5346695206590126e-05, - "loss": 0.007, + "epoch": 0.89, + "learning_rate": 0.00016715671683206277, + "loss": 0.0117, "step": 175540 }, { - "epoch": 1.9, - "learning_rate": 1.533047934098722e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016714914913904878, + "loss": 0.0108, "step": 175550 }, { - "epoch": 1.9, - "learning_rate": 1.5314263475384315e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016714158144603476, + "loss": 0.0101, "step": 175560 }, { - "epoch": 1.9, - "learning_rate": 1.5298047609781407e-05, - "loss": 0.0081, + "epoch": 0.89, + "learning_rate": 0.00016713401375302074, + "loss": 0.0141, "step": 175570 }, { - "epoch": 1.9, - "learning_rate": 1.5281831744178504e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.00016712644606000675, + "loss": 0.012, "step": 175580 }, { - "epoch": 1.9, - "learning_rate": 1.5265615878575596e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016711887836699273, + "loss": 0.0092, "step": 175590 }, { - "epoch": 1.9, - "learning_rate": 1.5249400012972693e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.0001671113106739787, + "loss": 0.0102, "step": 175600 }, { - "epoch": 1.9, - "learning_rate": 1.5233184147369787e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016710374298096472, + "loss": 0.0124, "step": 175610 }, { - "epoch": 1.9, - "learning_rate": 1.521696828176688e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.0001670961752879507, + "loss": 0.0137, "step": 175620 }, { - "epoch": 1.9, - "learning_rate": 1.5200752416163974e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016708860759493668, + "loss": 0.0117, "step": 175630 }, { - "epoch": 1.9, - "learning_rate": 1.5184536550561069e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016708103990192266, + "loss": 0.015, "step": 175640 }, { - "epoch": 1.9, - "learning_rate": 1.5168320684958163e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016707347220890867, + "loss": 0.0104, "step": 175650 }, { - "epoch": 1.9, - "learning_rate": 1.5152104819355256e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016706590451589465, + "loss": 0.0118, "step": 175660 }, { - "epoch": 1.9, - "learning_rate": 1.513588895375235e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016705833682288063, + "loss": 0.0121, "step": 175670 }, { - "epoch": 1.9, - "learning_rate": 1.5119673088149445e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.00016705076912986664, + "loss": 0.012, "step": 175680 }, { - "epoch": 1.9, - "learning_rate": 1.5103457222546537e-05, - "loss": 0.0077, + "epoch": 0.89, + "learning_rate": 0.00016704320143685262, + "loss": 0.0092, "step": 175690 }, { - "epoch": 1.9, - "learning_rate": 1.5087241356943632e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.0001670356337438386, + "loss": 0.0102, "step": 175700 }, { - "epoch": 1.9, - "learning_rate": 1.5071025491340726e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016702806605082461, + "loss": 0.0163, "step": 175710 }, { - "epoch": 1.9, - "learning_rate": 1.505480962573782e-05, - "loss": 0.0045, + "epoch": 0.89, + "learning_rate": 0.0001670204983578106, + "loss": 0.011, "step": 175720 }, { - "epoch": 1.9, - "learning_rate": 1.5038593760134913e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016701293066479658, + "loss": 0.011, "step": 175730 }, { - "epoch": 1.9, - "learning_rate": 1.5022377894532008e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016700536297178259, + "loss": 0.0099, "step": 175740 }, { - "epoch": 1.9, - "learning_rate": 1.5006162028929102e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016699779527876857, + "loss": 0.0122, "step": 175750 }, { - "epoch": 1.9, - "learning_rate": 1.4989946163326197e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.00016699022758575455, + "loss": 0.0118, "step": 175760 }, { - "epoch": 1.9, - "learning_rate": 1.497373029772329e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016698265989274056, + "loss": 0.0109, "step": 175770 }, { - "epoch": 1.9, - "learning_rate": 1.4957514432120386e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.00016697509219972654, + "loss": 0.0132, "step": 175780 }, { - "epoch": 1.9, - "learning_rate": 1.494129856651748e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016696752450671252, + "loss": 0.0105, "step": 175790 }, { - "epoch": 1.9, - "learning_rate": 1.4925082700914574e-05, - "loss": 0.0081, + "epoch": 0.89, + "learning_rate": 0.0001669599568136985, + "loss": 0.0131, "step": 175800 }, { - "epoch": 1.9, - "learning_rate": 1.4908866835311669e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.0001669523891206845, + "loss": 0.0215, "step": 175810 }, { - "epoch": 1.9, - "learning_rate": 1.4892650969708762e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.0001669448214276705, + "loss": 0.0096, "step": 175820 }, { - "epoch": 1.9, - "learning_rate": 1.4876435104105856e-05, - "loss": 0.005, + "epoch": 0.89, + "learning_rate": 0.00016693725373465647, + "loss": 0.0115, "step": 175830 }, { - "epoch": 1.9, - "learning_rate": 1.486021923850295e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016692968604164248, + "loss": 0.0108, "step": 175840 }, { - "epoch": 1.9, - "learning_rate": 1.4844003372900045e-05, - "loss": 0.0081, + "epoch": 0.89, + "learning_rate": 0.00016692211834862846, + "loss": 0.0099, "step": 175850 }, { - "epoch": 1.9, - "learning_rate": 1.4827787507297138e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016691455065561444, + "loss": 0.0117, "step": 175860 }, { - "epoch": 1.9, - "learning_rate": 1.4811571641694232e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016690698296260045, + "loss": 0.0157, "step": 175870 }, { - "epoch": 1.9, - "learning_rate": 1.4795355776091327e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016689941526958643, + "loss": 0.0113, "step": 175880 }, { - "epoch": 1.9, - "learning_rate": 1.4779139910488421e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016689184757657242, + "loss": 0.0156, "step": 175890 }, { - "epoch": 1.9, - "learning_rate": 1.4762924044885514e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016688427988355842, + "loss": 0.0122, "step": 175900 }, { - "epoch": 1.9, - "learning_rate": 1.4746708179282608e-05, - "loss": 0.0073, + "epoch": 0.89, + "learning_rate": 0.0001668767121905444, + "loss": 0.0163, "step": 175910 }, { - "epoch": 1.9, - "learning_rate": 1.4730492313679703e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.0001668691444975304, + "loss": 0.0128, "step": 175920 }, { - "epoch": 1.9, - "learning_rate": 1.4714276448076797e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.0001668615768045164, + "loss": 0.0168, "step": 175930 }, { - "epoch": 1.9, - "learning_rate": 1.469806058247389e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.00016685400911150238, + "loss": 0.0131, "step": 175940 }, { - "epoch": 1.9, - "learning_rate": 1.4681844716870984e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016684644141848836, + "loss": 0.0127, "step": 175950 }, { - "epoch": 1.9, - "learning_rate": 1.466562885126808e-05, - "loss": 0.0047, + "epoch": 0.89, + "learning_rate": 0.00016683887372547437, + "loss": 0.0095, "step": 175960 }, { - "epoch": 1.9, - "learning_rate": 1.4649412985665175e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016683130603246035, + "loss": 0.011, "step": 175970 }, { - "epoch": 1.9, - "learning_rate": 1.463319712006227e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016682373833944633, + "loss": 0.0107, "step": 175980 }, { - "epoch": 1.9, - "learning_rate": 1.4616981254459362e-05, - "loss": 0.005, + "epoch": 0.89, + "learning_rate": 0.0001668161706464323, + "loss": 0.0119, "step": 175990 }, { - "epoch": 1.9, - "learning_rate": 1.4600765388856456e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016680860295341832, + "loss": 0.0114, "step": 176000 }, { - "epoch": 1.9, - "eval_cer": 0.9215026136262957, - "eval_loss": 0.005302069243043661, - "eval_runtime": 121.5231, - "eval_samples_per_second": 16.458, - "eval_steps_per_second": 4.114, + "epoch": 0.89, + "eval_cer": 0.9145032493714259, + "eval_loss": 0.008152415975928307, + "eval_runtime": 116.6203, + "eval_samples_per_second": 17.15, + "eval_steps_per_second": 4.287, "step": 176000 }, { - "epoch": 1.9, - "learning_rate": 1.4584549523253551e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.0001668010352604043, + "loss": 0.012, "step": 176010 }, { - "epoch": 1.9, - "learning_rate": 1.4568333657650644e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016679346756739028, + "loss": 0.0134, "step": 176020 }, { - "epoch": 1.9, - "learning_rate": 1.4552117792047738e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.0001667858998743763, + "loss": 0.0097, "step": 176030 }, { - "epoch": 1.9, - "learning_rate": 1.4535901926444833e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016677833218136227, + "loss": 0.0114, "step": 176040 }, { - "epoch": 1.9, - "learning_rate": 1.4519686060841927e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016677076448834825, + "loss": 0.0141, "step": 176050 }, { - "epoch": 1.9, - "learning_rate": 1.450347019523902e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016676319679533426, + "loss": 0.0126, "step": 176060 }, { - "epoch": 1.9, - "learning_rate": 1.4487254329636114e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016675562910232024, + "loss": 0.0097, "step": 176070 }, { - "epoch": 1.9, - "learning_rate": 1.4471038464033209e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016674806140930623, + "loss": 0.0143, "step": 176080 }, { - "epoch": 1.9, - "learning_rate": 1.4454822598430303e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016674049371629223, + "loss": 0.0112, "step": 176090 }, { - "epoch": 1.9, - "learning_rate": 1.4438606732827396e-05, - "loss": 0.0044, + "epoch": 0.89, + "learning_rate": 0.00016673292602327822, + "loss": 0.0103, "step": 176100 }, { - "epoch": 1.9, - "learning_rate": 1.442239086722449e-05, - "loss": 0.0049, + "epoch": 0.89, + "learning_rate": 0.0001667253583302642, + "loss": 0.0131, "step": 176110 }, { - "epoch": 1.9, - "learning_rate": 1.4406175001621585e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.0001667177906372502, + "loss": 0.0111, "step": 176120 }, { - "epoch": 1.9, - "learning_rate": 1.4389959136018679e-05, - "loss": 0.0049, + "epoch": 0.89, + "learning_rate": 0.0001667102229442362, + "loss": 0.0116, "step": 176130 }, { - "epoch": 1.9, - "learning_rate": 1.4373743270415775e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016670265525122217, + "loss": 0.0107, "step": 176140 }, { - "epoch": 1.9, - "learning_rate": 1.4357527404812868e-05, - "loss": 0.0085, + "epoch": 0.89, + "learning_rate": 0.00016669508755820815, + "loss": 0.0139, "step": 176150 }, { - "epoch": 1.9, - "learning_rate": 1.4341311539209962e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016668751986519416, + "loss": 0.0087, "step": 176160 }, { - "epoch": 1.9, - "learning_rate": 1.4325095673607057e-05, - "loss": 0.0073, + "epoch": 0.89, + "learning_rate": 0.00016667995217218014, + "loss": 0.0136, "step": 176170 }, { - "epoch": 1.9, - "learning_rate": 1.4308879808004151e-05, - "loss": 0.0047, + "epoch": 0.89, + "learning_rate": 0.00016667238447916612, + "loss": 0.0155, "step": 176180 }, { - "epoch": 1.9, - "learning_rate": 1.4292663942401244e-05, - "loss": 0.0086, + "epoch": 0.89, + "learning_rate": 0.00016666481678615213, + "loss": 0.0128, "step": 176190 }, { - "epoch": 1.9, - "learning_rate": 1.4276448076798338e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.0001666572490931381, + "loss": 0.0107, "step": 176200 }, { - "epoch": 1.9, - "learning_rate": 1.4260232211195433e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.0001666496814001241, + "loss": 0.0107, "step": 176210 }, { - "epoch": 1.91, - "learning_rate": 1.4244016345592527e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.0001666421137071101, + "loss": 0.0126, "step": 176220 }, { - "epoch": 1.91, - "learning_rate": 1.422780047998962e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016663454601409608, + "loss": 0.0119, "step": 176230 }, { - "epoch": 1.91, - "learning_rate": 1.4211584614386714e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016662697832108206, + "loss": 0.0121, "step": 176240 }, { - "epoch": 1.91, - "learning_rate": 1.4195368748783809e-05, - "loss": 0.007, + "epoch": 0.89, + "learning_rate": 0.00016661941062806807, + "loss": 0.0124, "step": 176250 }, { - "epoch": 1.91, - "learning_rate": 1.4179152883180903e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016661184293505405, + "loss": 0.0137, "step": 176260 }, { - "epoch": 1.91, - "learning_rate": 1.4162937017577996e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.00016660427524204004, + "loss": 0.009, "step": 176270 }, { - "epoch": 1.91, - "learning_rate": 1.414672115197509e-05, - "loss": 0.008, + "epoch": 0.89, + "learning_rate": 0.00016659670754902604, + "loss": 0.0101, "step": 176280 }, { - "epoch": 1.91, - "learning_rate": 1.4130505286372185e-05, - "loss": 0.007, + "epoch": 0.89, + "learning_rate": 0.00016658913985601203, + "loss": 0.0126, "step": 176290 }, { - "epoch": 1.91, - "learning_rate": 1.411428942076928e-05, - "loss": 0.0073, + "epoch": 0.89, + "learning_rate": 0.000166581572162998, + "loss": 0.0102, "step": 176300 }, { - "epoch": 1.91, - "learning_rate": 1.4098073555166372e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.000166574004469984, + "loss": 0.0139, "step": 176310 }, { - "epoch": 1.91, - "learning_rate": 1.4081857689563468e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016656643677697, + "loss": 0.0113, "step": 176320 }, { - "epoch": 1.91, - "learning_rate": 1.4065641823960563e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.00016655886908395598, + "loss": 0.0105, "step": 176330 }, { - "epoch": 1.91, - "learning_rate": 1.4049425958357657e-05, - "loss": 0.0088, + "epoch": 0.89, + "learning_rate": 0.00016655130139094196, + "loss": 0.0149, "step": 176340 }, { - "epoch": 1.91, - "learning_rate": 1.403321009275475e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016654373369792797, + "loss": 0.0111, "step": 176350 }, { - "epoch": 1.91, - "learning_rate": 1.4016994227151844e-05, - "loss": 0.008, + "epoch": 0.89, + "learning_rate": 0.00016653616600491395, + "loss": 0.0099, "step": 176360 }, { - "epoch": 1.91, - "learning_rate": 1.4000778361548939e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016652859831189993, + "loss": 0.0152, "step": 176370 }, { - "epoch": 1.91, - "learning_rate": 1.3984562495946033e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016652103061888594, + "loss": 0.0116, "step": 176380 }, { - "epoch": 1.91, - "learning_rate": 1.3968346630343126e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016651346292587192, + "loss": 0.0129, "step": 176390 }, { - "epoch": 1.91, - "learning_rate": 1.395213076474022e-05, - "loss": 0.0101, + "epoch": 0.89, + "learning_rate": 0.0001665058952328579, + "loss": 0.0108, "step": 176400 }, { - "epoch": 1.91, - "learning_rate": 1.3935914899137315e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.0001664983275398439, + "loss": 0.0099, "step": 176410 }, { - "epoch": 1.91, - "learning_rate": 1.391969903353441e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.0001664907598468299, + "loss": 0.0125, "step": 176420 }, { - "epoch": 1.91, - "learning_rate": 1.3903483167931502e-05, - "loss": 0.0079, + "epoch": 0.89, + "learning_rate": 0.00016648319215381587, + "loss": 0.0105, "step": 176430 }, { - "epoch": 1.91, - "learning_rate": 1.3887267302328596e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016647562446080188, + "loss": 0.0093, "step": 176440 }, { - "epoch": 1.91, - "learning_rate": 1.3871051436725691e-05, - "loss": 0.0041, + "epoch": 0.89, + "learning_rate": 0.00016646805676778786, + "loss": 0.0127, "step": 176450 }, { - "epoch": 1.91, - "learning_rate": 1.3854835571122785e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016646048907477385, + "loss": 0.0106, "step": 176460 }, { - "epoch": 1.91, - "learning_rate": 1.3838619705519878e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016645292138175983, + "loss": 0.0101, "step": 176470 }, { - "epoch": 1.91, - "learning_rate": 1.3822403839916973e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016644535368874584, + "loss": 0.0106, "step": 176480 }, { - "epoch": 1.91, - "learning_rate": 1.3806187974314067e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016643778599573182, + "loss": 0.0145, "step": 176490 }, { - "epoch": 1.91, - "learning_rate": 1.3789972108711163e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.0001664302183027178, + "loss": 0.011, "step": 176500 }, { - "epoch": 1.91, - "learning_rate": 1.3773756243108258e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.0001664226506097038, + "loss": 0.0113, "step": 176510 }, { - "epoch": 1.91, - "learning_rate": 1.375754037750535e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.0001664150829166898, + "loss": 0.0117, "step": 176520 }, { - "epoch": 1.91, - "learning_rate": 1.3741324511902445e-05, - "loss": 0.0091, + "epoch": 0.89, + "learning_rate": 0.00016640751522367577, + "loss": 0.0112, "step": 176530 }, { - "epoch": 1.91, - "learning_rate": 1.3725108646299539e-05, - "loss": 0.0087, + "epoch": 0.89, + "learning_rate": 0.00016639994753066178, + "loss": 0.0115, "step": 176540 }, { - "epoch": 1.91, - "learning_rate": 1.3708892780696634e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016639237983764776, + "loss": 0.0113, "step": 176550 }, { - "epoch": 1.91, - "learning_rate": 1.3692676915093726e-05, - "loss": 0.0074, + "epoch": 0.89, + "learning_rate": 0.00016638481214463374, + "loss": 0.0119, "step": 176560 }, { - "epoch": 1.91, - "learning_rate": 1.367646104949082e-05, - "loss": 0.0073, + "epoch": 0.89, + "learning_rate": 0.00016637724445161975, + "loss": 0.0118, "step": 176570 }, { - "epoch": 1.91, - "learning_rate": 1.3660245183887915e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016636967675860573, + "loss": 0.0123, "step": 176580 }, { - "epoch": 1.91, - "learning_rate": 1.364402931828501e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.0001663621090655917, + "loss": 0.0141, "step": 176590 }, { - "epoch": 1.91, - "learning_rate": 1.3627813452682102e-05, - "loss": 0.0076, + "epoch": 0.89, + "learning_rate": 0.00016635454137257767, + "loss": 0.0099, "step": 176600 }, { - "epoch": 1.91, - "learning_rate": 1.3611597587079197e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016634697367956368, + "loss": 0.014, "step": 176610 }, { - "epoch": 1.91, - "learning_rate": 1.3595381721476291e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016633940598654966, + "loss": 0.0104, "step": 176620 }, { - "epoch": 1.91, - "learning_rate": 1.3579165855873386e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.00016633183829353564, + "loss": 0.0137, "step": 176630 }, { - "epoch": 1.91, - "learning_rate": 1.3562949990270478e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.00016632427060052165, + "loss": 0.0104, "step": 176640 }, { - "epoch": 1.91, - "learning_rate": 1.3546734124667573e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016631670290750763, + "loss": 0.0122, "step": 176650 }, { - "epoch": 1.91, - "learning_rate": 1.3530518259064667e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.0001663091352144936, + "loss": 0.0109, "step": 176660 }, { - "epoch": 1.91, - "learning_rate": 1.351430239346176e-05, - "loss": 0.0049, + "epoch": 0.89, + "learning_rate": 0.00016630156752147962, + "loss": 0.0146, "step": 176670 }, { - "epoch": 1.91, - "learning_rate": 1.3498086527858856e-05, - "loss": 0.0081, + "epoch": 0.89, + "learning_rate": 0.0001662939998284656, + "loss": 0.0109, "step": 176680 }, { - "epoch": 1.91, - "learning_rate": 1.348187066225595e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016628643213545158, + "loss": 0.0111, "step": 176690 }, { - "epoch": 1.91, - "learning_rate": 1.3465654796653045e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016627886444243756, + "loss": 0.0116, "step": 176700 }, { - "epoch": 1.91, - "learning_rate": 1.344943893105014e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016627129674942357, + "loss": 0.0106, "step": 176710 }, { - "epoch": 1.91, - "learning_rate": 1.3433223065447232e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.00016626372905640955, + "loss": 0.0113, "step": 176720 }, { - "epoch": 1.91, - "learning_rate": 1.3417007199844327e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016625616136339553, + "loss": 0.0096, "step": 176730 }, { - "epoch": 1.91, - "learning_rate": 1.3400791334241421e-05, - "loss": 0.0078, + "epoch": 0.89, + "learning_rate": 0.00016624859367038154, + "loss": 0.0116, "step": 176740 }, { - "epoch": 1.91, - "learning_rate": 1.3384575468638516e-05, - "loss": 0.008, + "epoch": 0.89, + "learning_rate": 0.00016624102597736752, + "loss": 0.0119, "step": 176750 }, { - "epoch": 1.91, - "learning_rate": 1.3368359603035608e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.0001662334582843535, + "loss": 0.0125, "step": 176760 }, { - "epoch": 1.91, - "learning_rate": 1.3352143737432703e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016622589059133951, + "loss": 0.0121, "step": 176770 }, { - "epoch": 1.91, - "learning_rate": 1.3335927871829797e-05, - "loss": 0.0052, + "epoch": 0.89, + "learning_rate": 0.0001662183228983255, + "loss": 0.0131, "step": 176780 }, { - "epoch": 1.91, - "learning_rate": 1.3319712006226892e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016621075520531148, + "loss": 0.0092, "step": 176790 }, { - "epoch": 1.91, - "learning_rate": 1.3303496140623984e-05, - "loss": 0.0073, + "epoch": 0.89, + "learning_rate": 0.00016620318751229749, + "loss": 0.0084, "step": 176800 }, { - "epoch": 1.91, - "learning_rate": 1.3287280275021079e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016619561981928347, + "loss": 0.0123, "step": 176810 }, { - "epoch": 1.91, - "learning_rate": 1.3271064409418173e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016618805212626945, + "loss": 0.0105, "step": 176820 }, { - "epoch": 1.91, - "learning_rate": 1.3254848543815268e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.00016618048443325546, + "loss": 0.0109, "step": 176830 }, { - "epoch": 1.91, - "learning_rate": 1.323863267821236e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016617291674024144, + "loss": 0.0094, "step": 176840 }, { - "epoch": 1.91, - "learning_rate": 1.3222416812609455e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016616534904722742, + "loss": 0.012, "step": 176850 }, { - "epoch": 1.91, - "learning_rate": 1.3206200947006551e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016615778135421343, + "loss": 0.012, "step": 176860 }, { - "epoch": 1.91, - "learning_rate": 1.3189985081403645e-05, - "loss": 0.0086, + "epoch": 0.89, + "learning_rate": 0.0001661502136611994, + "loss": 0.0131, "step": 176870 }, { - "epoch": 1.91, - "learning_rate": 1.317376921580074e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.0001661426459681854, + "loss": 0.0097, "step": 176880 }, { - "epoch": 1.91, - "learning_rate": 1.3157553350197833e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.00016613507827517137, + "loss": 0.0148, "step": 176890 }, { - "epoch": 1.91, - "learning_rate": 1.3141337484594927e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016612751058215738, + "loss": 0.0123, "step": 176900 }, { - "epoch": 1.91, - "learning_rate": 1.3125121618992021e-05, - "loss": 0.0082, + "epoch": 0.89, + "learning_rate": 0.00016611994288914336, + "loss": 0.0119, "step": 176910 }, { - "epoch": 1.91, - "learning_rate": 1.3108905753389116e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016611237519612934, + "loss": 0.0106, "step": 176920 }, { - "epoch": 1.91, - "learning_rate": 1.3092689887786209e-05, - "loss": 0.0052, + "epoch": 0.89, + "learning_rate": 0.00016610480750311535, + "loss": 0.0088, "step": 176930 }, { - "epoch": 1.91, - "learning_rate": 1.3076474022183303e-05, - "loss": 0.005, + "epoch": 0.89, + "learning_rate": 0.00016609723981010133, + "loss": 0.0113, "step": 176940 }, { - "epoch": 1.91, - "learning_rate": 1.3060258156580398e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016608967211708732, + "loss": 0.0096, "step": 176950 }, { - "epoch": 1.91, - "learning_rate": 1.304404229097749e-05, - "loss": 0.004, + "epoch": 0.89, + "learning_rate": 0.00016608210442407332, + "loss": 0.0113, "step": 176960 }, { - "epoch": 1.91, - "learning_rate": 1.3027826425374585e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.0001660745367310593, + "loss": 0.0123, "step": 176970 }, { - "epoch": 1.91, - "learning_rate": 1.3011610559771679e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.0001660669690380453, + "loss": 0.0134, "step": 176980 }, { - "epoch": 1.91, - "learning_rate": 1.2995394694168774e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.0001660594013450313, + "loss": 0.0113, "step": 176990 }, { - "epoch": 1.91, - "learning_rate": 1.2979178828565866e-05, - "loss": 0.0084, + "epoch": 0.89, + "learning_rate": 0.00016605183365201728, + "loss": 0.0093, "step": 177000 }, { - "epoch": 1.91, - "eval_cer": 0.9214921903908192, - "eval_loss": 0.005274078343063593, - "eval_runtime": 121.1903, - "eval_samples_per_second": 16.503, - "eval_steps_per_second": 4.126, + "epoch": 0.89, + "eval_cer": 0.9144896638256703, + "eval_loss": 0.00848294422030449, + "eval_runtime": 116.4993, + "eval_samples_per_second": 17.167, + "eval_steps_per_second": 4.292, "step": 177000 }, { - "epoch": 1.91, - "learning_rate": 1.296296296296296e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016604426595900326, + "loss": 0.0126, "step": 177010 }, { - "epoch": 1.91, - "learning_rate": 1.2946747097360055e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016603669826598927, + "loss": 0.0146, "step": 177020 }, { - "epoch": 1.91, - "learning_rate": 1.293053123175715e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016602913057297525, + "loss": 0.013, "step": 177030 }, { - "epoch": 1.91, - "learning_rate": 1.2914315366154246e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.00016602156287996123, + "loss": 0.0131, "step": 177040 }, { - "epoch": 1.91, - "learning_rate": 1.2898099500551339e-05, - "loss": 0.0076, + "epoch": 0.89, + "learning_rate": 0.0001660139951869472, + "loss": 0.0125, "step": 177050 }, { - "epoch": 1.91, - "learning_rate": 1.2881883634948433e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016600642749393322, + "loss": 0.0099, "step": 177060 }, { - "epoch": 1.91, - "learning_rate": 1.2865667769345527e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.0001659988598009192, + "loss": 0.0114, "step": 177070 }, { - "epoch": 1.91, - "learning_rate": 1.2849451903742622e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.00016599129210790518, + "loss": 0.0134, "step": 177080 }, { - "epoch": 1.91, - "learning_rate": 1.2833236038139715e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.0001659837244148912, + "loss": 0.018, "step": 177090 }, { - "epoch": 1.91, - "learning_rate": 1.2817020172536809e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016597615672187717, + "loss": 0.0149, "step": 177100 }, { - "epoch": 1.91, - "learning_rate": 1.2800804306933903e-05, - "loss": 0.0075, + "epoch": 0.89, + "learning_rate": 0.00016596858902886315, + "loss": 0.0111, "step": 177110 }, { - "epoch": 1.91, - "learning_rate": 1.2784588441330998e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016596102133584916, + "loss": 0.0115, "step": 177120 }, { - "epoch": 1.91, - "learning_rate": 1.276837257572809e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016595345364283514, + "loss": 0.0112, "step": 177130 }, { - "epoch": 1.91, - "learning_rate": 1.2752156710125185e-05, - "loss": 0.0083, + "epoch": 0.89, + "learning_rate": 0.00016594588594982113, + "loss": 0.0123, "step": 177140 }, { - "epoch": 1.92, - "learning_rate": 1.273594084452228e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016593831825680713, + "loss": 0.0109, "step": 177150 }, { - "epoch": 1.92, - "learning_rate": 1.2719724978919374e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016593075056379312, + "loss": 0.0133, "step": 177160 }, { - "epoch": 1.92, - "learning_rate": 1.2703509113316467e-05, - "loss": 0.0081, + "epoch": 0.89, + "learning_rate": 0.0001659231828707791, + "loss": 0.012, "step": 177170 }, { - "epoch": 1.92, - "learning_rate": 1.2687293247713561e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.0001659156151777651, + "loss": 0.0112, "step": 177180 }, { - "epoch": 1.92, - "learning_rate": 1.2671077382110656e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.0001659080474847511, + "loss": 0.011, "step": 177190 }, { - "epoch": 1.92, - "learning_rate": 1.265486151650775e-05, - "loss": 0.0079, + "epoch": 0.89, + "learning_rate": 0.00016590047979173707, + "loss": 0.0091, "step": 177200 }, { - "epoch": 1.92, - "learning_rate": 1.2638645650904843e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016589291209872305, + "loss": 0.0114, "step": 177210 }, { - "epoch": 1.92, - "learning_rate": 1.2622429785301939e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016588534440570906, + "loss": 0.0109, "step": 177220 }, { - "epoch": 1.92, - "learning_rate": 1.2606213919699033e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016587777671269504, + "loss": 0.0131, "step": 177230 }, { - "epoch": 1.92, - "learning_rate": 1.2589998054096128e-05, - "loss": 0.0092, + "epoch": 0.89, + "learning_rate": 0.00016587020901968102, + "loss": 0.0106, "step": 177240 }, { - "epoch": 1.92, - "learning_rate": 1.2573782188493222e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.00016586264132666703, + "loss": 0.0126, "step": 177250 }, { - "epoch": 1.92, - "learning_rate": 1.2557566322890315e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.000165855073633653, + "loss": 0.011, "step": 177260 }, { - "epoch": 1.92, - "learning_rate": 1.254135045728741e-05, - "loss": 0.0044, + "epoch": 0.89, + "learning_rate": 0.000165847505940639, + "loss": 0.0116, "step": 177270 }, { - "epoch": 1.92, - "learning_rate": 1.2525134591684504e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.000165839938247625, + "loss": 0.0139, "step": 177280 }, { - "epoch": 1.92, - "learning_rate": 1.2508918726081597e-05, - "loss": 0.0042, + "epoch": 0.89, + "learning_rate": 0.00016583237055461098, + "loss": 0.0102, "step": 177290 }, { - "epoch": 1.92, - "learning_rate": 1.2492702860478691e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016582480286159696, + "loss": 0.0112, "step": 177300 }, { - "epoch": 1.92, - "learning_rate": 1.2476486994875785e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016581723516858297, + "loss": 0.013, "step": 177310 }, { - "epoch": 1.92, - "learning_rate": 1.246027112927288e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016580966747556895, + "loss": 0.0123, "step": 177320 }, { - "epoch": 1.92, - "learning_rate": 1.2444055263669973e-05, - "loss": 0.0102, + "epoch": 0.89, + "learning_rate": 0.00016580209978255494, + "loss": 0.0143, "step": 177330 }, { - "epoch": 1.92, - "learning_rate": 1.2427839398067067e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016579453208954094, + "loss": 0.0107, "step": 177340 }, { - "epoch": 1.92, - "learning_rate": 1.2411623532464161e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016578696439652693, + "loss": 0.0089, "step": 177350 }, { - "epoch": 1.92, - "learning_rate": 1.2395407666861256e-05, - "loss": 0.0073, + "epoch": 0.89, + "learning_rate": 0.0001657793967035129, + "loss": 0.0101, "step": 177360 }, { - "epoch": 1.92, - "learning_rate": 1.2379191801258349e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.0001657718290104989, + "loss": 0.0096, "step": 177370 }, { - "epoch": 1.92, - "learning_rate": 1.2362975935655443e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.0001657642613174849, + "loss": 0.0106, "step": 177380 }, { - "epoch": 1.92, - "learning_rate": 1.2346760070052538e-05, + "epoch": 0.89, + "learning_rate": 0.00016575669362447088, "loss": 0.0082, "step": 177390 }, { - "epoch": 1.92, - "learning_rate": 1.2330544204449634e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016574912593145686, + "loss": 0.0158, "step": 177400 }, { - "epoch": 1.92, - "learning_rate": 1.2314328338846728e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.00016574155823844287, + "loss": 0.0124, "step": 177410 }, { - "epoch": 1.92, - "learning_rate": 1.229811247324382e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016573399054542885, + "loss": 0.0128, "step": 177420 }, { - "epoch": 1.92, - "learning_rate": 1.2281896607640915e-05, - "loss": 0.0077, + "epoch": 0.9, + "learning_rate": 0.00016572642285241483, + "loss": 0.0123, "step": 177430 }, { - "epoch": 1.92, - "learning_rate": 1.226568074203801e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016571885515940084, + "loss": 0.0099, "step": 177440 }, { - "epoch": 1.92, - "learning_rate": 1.2249464876435104e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016571128746638682, + "loss": 0.0121, "step": 177450 }, { - "epoch": 1.92, - "learning_rate": 1.2233249010832197e-05, - "loss": 0.0077, + "epoch": 0.9, + "learning_rate": 0.0001657037197733728, + "loss": 0.0099, "step": 177460 }, { - "epoch": 1.92, - "learning_rate": 1.2217033145229291e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.0001656961520803588, + "loss": 0.0106, "step": 177470 }, { - "epoch": 1.92, - "learning_rate": 1.2200817279626386e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001656885843873448, + "loss": 0.0113, "step": 177480 }, { - "epoch": 1.92, - "learning_rate": 1.218460141402348e-05, - "loss": 0.0073, + "epoch": 0.9, + "learning_rate": 0.00016568101669433077, + "loss": 0.0092, "step": 177490 }, { - "epoch": 1.92, - "learning_rate": 1.2168385548420573e-05, - "loss": 0.0073, + "epoch": 0.9, + "learning_rate": 0.00016567344900131678, + "loss": 0.0106, "step": 177500 }, { - "epoch": 1.92, - "learning_rate": 1.2152169682817667e-05, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.00016566588130830276, + "loss": 0.0098, "step": 177510 }, { - "epoch": 1.92, - "learning_rate": 1.2135953817214762e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016565831361528875, + "loss": 0.0162, "step": 177520 }, { - "epoch": 1.92, - "learning_rate": 1.2119737951611856e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016565074592227475, + "loss": 0.0133, "step": 177530 }, { - "epoch": 1.92, - "learning_rate": 1.2103522086008949e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016564317822926074, + "loss": 0.0104, "step": 177540 }, { - "epoch": 1.92, - "learning_rate": 1.2087306220406043e-05, - "loss": 0.008, + "epoch": 0.9, + "learning_rate": 0.00016563561053624672, + "loss": 0.0091, "step": 177550 }, { - "epoch": 1.92, - "learning_rate": 1.2071090354803138e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.0001656280428432327, + "loss": 0.0135, "step": 177560 }, { - "epoch": 1.92, - "learning_rate": 1.2054874489200232e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.0001656204751502187, + "loss": 0.0117, "step": 177570 }, { - "epoch": 1.92, - "learning_rate": 1.2038658623597327e-05, - "loss": 0.0073, + "epoch": 0.9, + "learning_rate": 0.0001656129074572047, + "loss": 0.01, "step": 177580 }, { - "epoch": 1.92, - "learning_rate": 1.2022442757994421e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.00016560533976419067, + "loss": 0.0166, "step": 177590 }, { - "epoch": 1.92, - "learning_rate": 1.2006226892391516e-05, - "loss": 0.0044, + "epoch": 0.9, + "learning_rate": 0.00016559777207117668, + "loss": 0.0102, "step": 177600 }, { - "epoch": 1.92, - "learning_rate": 1.199001102678861e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016559020437816266, + "loss": 0.0112, "step": 177610 }, { - "epoch": 1.92, - "learning_rate": 1.1973795161185703e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.00016558263668514864, + "loss": 0.0122, "step": 177620 }, { - "epoch": 1.92, - "learning_rate": 1.1957579295582797e-05, - "loss": 0.0078, + "epoch": 0.9, + "learning_rate": 0.00016557506899213465, + "loss": 0.0108, "step": 177630 }, { - "epoch": 1.92, - "learning_rate": 1.1941363429979892e-05, - "loss": 0.0046, + "epoch": 0.9, + "learning_rate": 0.00016556750129912063, + "loss": 0.0107, "step": 177640 }, { - "epoch": 1.92, - "learning_rate": 1.1925147564376986e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.0001655599336061066, + "loss": 0.0129, "step": 177650 }, { - "epoch": 1.92, - "learning_rate": 1.1908931698774079e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.00016555236591309262, + "loss": 0.0106, "step": 177660 }, { - "epoch": 1.92, - "learning_rate": 1.1892715833171173e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.0001655447982200786, + "loss": 0.0116, "step": 177670 }, { - "epoch": 1.92, - "learning_rate": 1.1876499967568268e-05, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.00016553723052706458, + "loss": 0.0121, "step": 177680 }, { - "epoch": 1.92, - "learning_rate": 1.1860284101965362e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.0001655296628340506, + "loss": 0.0112, "step": 177690 }, { - "epoch": 1.92, - "learning_rate": 1.1844068236362455e-05, - "loss": 0.009, + "epoch": 0.9, + "learning_rate": 0.00016552209514103657, + "loss": 0.0124, "step": 177700 }, { - "epoch": 1.92, - "learning_rate": 1.182785237075955e-05, - "loss": 0.0049, + "epoch": 0.9, + "learning_rate": 0.00016551452744802256, + "loss": 0.0113, "step": 177710 }, { - "epoch": 1.92, - "learning_rate": 1.1811636505156644e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.00016550695975500854, + "loss": 0.0122, "step": 177720 }, { - "epoch": 1.92, - "learning_rate": 1.1795420639553738e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016549939206199455, + "loss": 0.0115, "step": 177730 }, { - "epoch": 1.92, - "learning_rate": 1.1779204773950831e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016549182436898053, + "loss": 0.0121, "step": 177740 }, { - "epoch": 1.92, - "learning_rate": 1.1762988908347925e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.0001654842566759665, + "loss": 0.0118, "step": 177750 }, { - "epoch": 1.92, - "learning_rate": 1.1746773042745022e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016547668898295252, + "loss": 0.0126, "step": 177760 }, { - "epoch": 1.92, - "learning_rate": 1.1730557177142116e-05, - "loss": 0.008, + "epoch": 0.9, + "learning_rate": 0.0001654691212899385, + "loss": 0.0077, "step": 177770 }, { - "epoch": 1.92, - "learning_rate": 1.171434131153921e-05, - "loss": 0.0079, + "epoch": 0.9, + "learning_rate": 0.00016546155359692448, + "loss": 0.0153, "step": 177780 }, { - "epoch": 1.92, - "learning_rate": 1.1698125445936303e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.0001654539859039105, + "loss": 0.012, "step": 177790 }, { - "epoch": 1.92, - "learning_rate": 1.1681909580333398e-05, - "loss": 0.0104, + "epoch": 0.9, + "learning_rate": 0.00016544641821089647, + "loss": 0.0099, "step": 177800 }, { - "epoch": 1.92, - "learning_rate": 1.1665693714730492e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.00016543885051788245, + "loss": 0.0112, "step": 177810 }, { - "epoch": 1.92, - "learning_rate": 1.1649477849127586e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016543128282486846, + "loss": 0.0144, "step": 177820 }, { - "epoch": 1.92, - "learning_rate": 1.163326198352468e-05, - "loss": 0.0049, + "epoch": 0.9, + "learning_rate": 0.00016542371513185444, + "loss": 0.0089, "step": 177830 }, { - "epoch": 1.92, - "learning_rate": 1.1617046117921774e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016541614743884042, + "loss": 0.0104, "step": 177840 }, { - "epoch": 1.92, - "learning_rate": 1.1600830252318868e-05, - "loss": 0.0089, + "epoch": 0.9, + "learning_rate": 0.00016540857974582638, + "loss": 0.0141, "step": 177850 }, { - "epoch": 1.92, - "learning_rate": 1.1584614386715963e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016540101205281239, + "loss": 0.0095, "step": 177860 }, { - "epoch": 1.92, - "learning_rate": 1.1568398521113055e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016539344435979837, + "loss": 0.0119, "step": 177870 }, { - "epoch": 1.92, - "learning_rate": 1.155218265551015e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016538587666678435, + "loss": 0.0143, "step": 177880 }, { - "epoch": 1.92, - "learning_rate": 1.1535966789907244e-05, - "loss": 0.0082, + "epoch": 0.9, + "learning_rate": 0.00016537830897377036, + "loss": 0.0156, "step": 177890 }, { - "epoch": 1.92, - "learning_rate": 1.1519750924304337e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016537074128075634, + "loss": 0.0145, "step": 177900 }, { - "epoch": 1.92, - "learning_rate": 1.1503535058701431e-05, - "loss": 0.0083, + "epoch": 0.9, + "learning_rate": 0.00016536317358774232, + "loss": 0.0121, "step": 177910 }, { - "epoch": 1.92, - "learning_rate": 1.1487319193098526e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016535560589472833, + "loss": 0.0112, "step": 177920 }, { - "epoch": 1.92, - "learning_rate": 1.147110332749562e-05, - "loss": 0.0071, + "epoch": 0.9, + "learning_rate": 0.0001653480382017143, + "loss": 0.0126, "step": 177930 }, { - "epoch": 1.92, - "learning_rate": 1.1454887461892716e-05, - "loss": 0.0045, + "epoch": 0.9, + "learning_rate": 0.0001653404705087003, + "loss": 0.0139, "step": 177940 }, { - "epoch": 1.92, - "learning_rate": 1.1438671596289809e-05, - "loss": 0.0051, + "epoch": 0.9, + "learning_rate": 0.00016533290281568627, + "loss": 0.0114, "step": 177950 }, { - "epoch": 1.92, - "learning_rate": 1.1422455730686904e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016532533512267228, + "loss": 0.0107, "step": 177960 }, { - "epoch": 1.92, - "learning_rate": 1.1406239865083998e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016531776742965826, + "loss": 0.014, "step": 177970 }, { - "epoch": 1.92, - "learning_rate": 1.1390023999481092e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.00016531019973664424, + "loss": 0.0126, "step": 177980 }, { - "epoch": 1.92, - "learning_rate": 1.1373808133878185e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016530263204363025, + "loss": 0.0126, "step": 177990 }, { - "epoch": 1.92, - "learning_rate": 1.135759226827528e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016529506435061623, + "loss": 0.0134, "step": 178000 }, { - "epoch": 1.92, - "eval_cer": 0.9214965334056011, - "eval_loss": 0.005222100764513016, - "eval_runtime": 121.1363, - "eval_samples_per_second": 16.51, - "eval_steps_per_second": 4.128, + "epoch": 0.9, + "eval_cer": 0.9144828710527925, + "eval_loss": 0.008248904719948769, + "eval_runtime": 116.6185, + "eval_samples_per_second": 17.15, + "eval_steps_per_second": 4.287, "step": 178000 }, { - "epoch": 1.92, - "learning_rate": 1.1341376402672374e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016528749665760222, + "loss": 0.0122, "step": 178010 }, { - "epoch": 1.92, - "learning_rate": 1.1325160537069468e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.00016527992896458822, + "loss": 0.0117, "step": 178020 }, { - "epoch": 1.92, - "learning_rate": 1.1308944671466561e-05, - "loss": 0.0081, + "epoch": 0.9, + "learning_rate": 0.0001652723612715742, + "loss": 0.0117, "step": 178030 }, { - "epoch": 1.92, - "learning_rate": 1.1292728805863656e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.0001652647935785602, + "loss": 0.0159, "step": 178040 }, { - "epoch": 1.92, - "learning_rate": 1.127651294026075e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.0001652572258855462, + "loss": 0.0093, "step": 178050 }, { - "epoch": 1.92, - "learning_rate": 1.1260297074657845e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016524965819253218, + "loss": 0.0128, "step": 178060 }, { - "epoch": 1.93, - "learning_rate": 1.1244081209054937e-05, - "loss": 0.004, + "epoch": 0.9, + "learning_rate": 0.00016524209049951816, + "loss": 0.0107, "step": 178070 }, { - "epoch": 1.93, - "learning_rate": 1.1227865343452032e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016523452280650417, + "loss": 0.011, "step": 178080 }, { - "epoch": 1.93, - "learning_rate": 1.1211649477849126e-05, - "loss": 0.0041, + "epoch": 0.9, + "learning_rate": 0.00016522695511349015, + "loss": 0.0162, "step": 178090 }, { - "epoch": 1.93, - "learning_rate": 1.119543361224622e-05, - "loss": 0.0051, + "epoch": 0.9, + "learning_rate": 0.00016521938742047613, + "loss": 0.0101, "step": 178100 }, { - "epoch": 1.93, - "learning_rate": 1.1179217746643313e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.0001652118197274621, + "loss": 0.0091, "step": 178110 }, { - "epoch": 1.93, - "learning_rate": 1.116300188104041e-05, - "loss": 0.0071, + "epoch": 0.9, + "learning_rate": 0.00016520425203444812, + "loss": 0.013, "step": 178120 }, { - "epoch": 1.93, - "learning_rate": 1.1146786015437504e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.0001651966843414341, + "loss": 0.0117, "step": 178130 }, { - "epoch": 1.93, - "learning_rate": 1.1130570149834598e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.00016518911664842008, + "loss": 0.0081, "step": 178140 }, { - "epoch": 1.93, - "learning_rate": 1.1114354284231693e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.0001651815489554061, + "loss": 0.0124, "step": 178150 }, { - "epoch": 1.93, - "learning_rate": 1.1098138418628785e-05, - "loss": 0.0049, + "epoch": 0.9, + "learning_rate": 0.00016517398126239207, + "loss": 0.0127, "step": 178160 }, { - "epoch": 1.93, - "learning_rate": 1.108192255302588e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016516641356937805, + "loss": 0.0122, "step": 178170 }, { - "epoch": 1.93, - "learning_rate": 1.1065706687422974e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016515884587636406, + "loss": 0.0115, "step": 178180 }, { - "epoch": 1.93, - "learning_rate": 1.1049490821820069e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016515127818335004, + "loss": 0.0107, "step": 178190 }, { - "epoch": 1.93, - "learning_rate": 1.1033274956217162e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016514371049033603, + "loss": 0.0114, "step": 178200 }, { - "epoch": 1.93, - "learning_rate": 1.1017059090614256e-05, - "loss": 0.0051, + "epoch": 0.9, + "learning_rate": 0.00016513614279732203, + "loss": 0.0128, "step": 178210 }, { - "epoch": 1.93, - "learning_rate": 1.100084322501135e-05, - "loss": 0.0037, + "epoch": 0.9, + "learning_rate": 0.00016512857510430802, + "loss": 0.0123, "step": 178220 }, { - "epoch": 1.93, - "learning_rate": 1.0984627359408443e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.000165121007411294, + "loss": 0.0114, "step": 178230 }, { - "epoch": 1.93, - "learning_rate": 1.0968411493805538e-05, - "loss": 0.007, + "epoch": 0.9, + "learning_rate": 0.00016511343971828, + "loss": 0.0152, "step": 178240 }, { - "epoch": 1.93, - "learning_rate": 1.0952195628202632e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.000165105872025266, + "loss": 0.0131, "step": 178250 }, { - "epoch": 1.93, - "learning_rate": 1.0935979762599726e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.00016509830433225197, + "loss": 0.0113, "step": 178260 }, { - "epoch": 1.93, - "learning_rate": 1.091976389699682e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.00016509073663923795, + "loss": 0.0172, "step": 178270 }, { - "epoch": 1.93, - "learning_rate": 1.0903548031393914e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016508316894622396, + "loss": 0.0128, "step": 178280 }, { - "epoch": 1.93, - "learning_rate": 1.0887332165791008e-05, - "loss": 0.0082, + "epoch": 0.9, + "learning_rate": 0.00016507560125320994, + "loss": 0.013, "step": 178290 }, { - "epoch": 1.93, - "learning_rate": 1.0871116300188104e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016506803356019592, + "loss": 0.0119, "step": 178300 }, { - "epoch": 1.93, - "learning_rate": 1.0854900434585199e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016506046586718193, + "loss": 0.0099, "step": 178310 }, { - "epoch": 1.93, - "learning_rate": 1.0838684568982291e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.0001650528981741679, + "loss": 0.0118, "step": 178320 }, { - "epoch": 1.93, - "learning_rate": 1.0822468703379386e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.0001650453304811539, + "loss": 0.0095, "step": 178330 }, { - "epoch": 1.93, - "learning_rate": 1.080625283777648e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.0001650377627881399, + "loss": 0.0099, "step": 178340 }, { - "epoch": 1.93, - "learning_rate": 1.0790036972173575e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016503019509512588, + "loss": 0.0137, "step": 178350 }, { - "epoch": 1.93, - "learning_rate": 1.0773821106570667e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016502262740211186, + "loss": 0.011, "step": 178360 }, { - "epoch": 1.93, - "learning_rate": 1.0757605240967762e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016501505970909787, + "loss": 0.0138, "step": 178370 }, { - "epoch": 1.93, - "learning_rate": 1.0741389375364856e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.00016500749201608385, + "loss": 0.0089, "step": 178380 }, { - "epoch": 1.93, - "learning_rate": 1.072517350976195e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016499992432306984, + "loss": 0.0141, "step": 178390 }, { - "epoch": 1.93, - "learning_rate": 1.0708957644159044e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016499235663005584, + "loss": 0.0121, "step": 178400 }, { - "epoch": 1.93, - "learning_rate": 1.0692741778556138e-05, - "loss": 0.008, + "epoch": 0.9, + "learning_rate": 0.00016498478893704183, + "loss": 0.013, "step": 178410 }, { - "epoch": 1.93, - "learning_rate": 1.0676525912953232e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.0001649772212440278, + "loss": 0.0124, "step": 178420 }, { - "epoch": 1.93, - "learning_rate": 1.0660310047350327e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016496965355101382, + "loss": 0.0107, "step": 178430 }, { - "epoch": 1.93, - "learning_rate": 1.064409418174742e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.0001649620858579998, + "loss": 0.0146, "step": 178440 }, { - "epoch": 1.93, - "learning_rate": 1.0627878316144514e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016495451816498578, + "loss": 0.0133, "step": 178450 }, { - "epoch": 1.93, - "learning_rate": 1.0611662450541608e-05, - "loss": 0.0047, + "epoch": 0.9, + "learning_rate": 0.00016494695047197176, + "loss": 0.0119, "step": 178460 }, { - "epoch": 1.93, - "learning_rate": 1.0595446584938703e-05, - "loss": 0.0078, + "epoch": 0.9, + "learning_rate": 0.00016493938277895777, + "loss": 0.0093, "step": 178470 }, { - "epoch": 1.93, - "learning_rate": 1.0579230719335799e-05, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.00016493181508594375, + "loss": 0.0112, "step": 178480 }, { - "epoch": 1.93, - "learning_rate": 1.0563014853732892e-05, - "loss": 0.0042, + "epoch": 0.9, + "learning_rate": 0.00016492424739292973, + "loss": 0.0208, "step": 178490 }, { - "epoch": 1.93, - "learning_rate": 1.0546798988129986e-05, - "loss": 0.0086, + "epoch": 0.9, + "learning_rate": 0.00016491667969991574, + "loss": 0.0219, "step": 178500 }, { - "epoch": 1.93, - "learning_rate": 1.053058312252708e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.00016490911200690172, + "loss": 0.0107, "step": 178510 }, { - "epoch": 1.93, - "learning_rate": 1.0514367256924173e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.0001649015443138877, + "loss": 0.0267, "step": 178520 }, { - "epoch": 1.93, - "learning_rate": 1.0498151391321268e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001648939766208737, + "loss": 0.0128, "step": 178530 }, { - "epoch": 1.93, - "learning_rate": 1.0481935525718362e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.0001648864089278597, + "loss": 0.0128, "step": 178540 }, { - "epoch": 1.93, - "learning_rate": 1.0465719660115457e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016487884123484567, + "loss": 0.0115, "step": 178550 }, { - "epoch": 1.93, - "learning_rate": 1.044950379451255e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016487127354183168, + "loss": 0.0133, "step": 178560 }, { - "epoch": 1.93, - "learning_rate": 1.0433287928909644e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016486370584881766, + "loss": 0.0131, "step": 178570 }, { - "epoch": 1.93, - "learning_rate": 1.0417072063306738e-05, - "loss": 0.0071, + "epoch": 0.9, + "learning_rate": 0.00016485613815580365, + "loss": 0.0102, "step": 178580 }, { - "epoch": 1.93, - "learning_rate": 1.0400856197703833e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016484857046278965, + "loss": 0.0105, "step": 178590 }, { - "epoch": 1.93, - "learning_rate": 1.0384640332100926e-05, - "loss": 0.0073, + "epoch": 0.9, + "learning_rate": 0.00016484100276977564, + "loss": 0.0111, "step": 178600 }, { - "epoch": 1.93, - "learning_rate": 1.036842446649802e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016483343507676162, + "loss": 0.012, "step": 178610 }, { - "epoch": 1.93, - "learning_rate": 1.0352208600895114e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.0001648258673837476, + "loss": 0.0086, "step": 178620 }, { - "epoch": 1.93, - "learning_rate": 1.0335992735292209e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.0001648182996907336, + "loss": 0.0113, "step": 178630 }, { - "epoch": 1.93, - "learning_rate": 1.0319776869689302e-05, - "loss": 0.0079, + "epoch": 0.9, + "learning_rate": 0.0001648107319977196, + "loss": 0.0101, "step": 178640 }, { - "epoch": 1.93, - "learning_rate": 1.0303561004086396e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016480316430470557, + "loss": 0.0119, "step": 178650 }, { - "epoch": 1.93, - "learning_rate": 1.0287345138483492e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016479559661169158, + "loss": 0.0107, "step": 178660 }, { - "epoch": 1.93, - "learning_rate": 1.0271129272880587e-05, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.00016478802891867756, + "loss": 0.0094, "step": 178670 }, { - "epoch": 1.93, - "learning_rate": 1.0254913407277681e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.00016478046122566354, + "loss": 0.0101, "step": 178680 }, { - "epoch": 1.93, - "learning_rate": 1.0238697541674774e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016477289353264955, + "loss": 0.0115, "step": 178690 }, { - "epoch": 1.93, - "learning_rate": 1.0222481676071868e-05, - "loss": 0.0051, + "epoch": 0.9, + "learning_rate": 0.00016476532583963553, + "loss": 0.01, "step": 178700 }, { - "epoch": 1.93, - "learning_rate": 1.0206265810468963e-05, - "loss": 0.0049, + "epoch": 0.9, + "learning_rate": 0.0001647577581466215, + "loss": 0.0104, "step": 178710 }, { - "epoch": 1.93, - "learning_rate": 1.0190049944866057e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016475019045360752, + "loss": 0.0112, "step": 178720 }, { - "epoch": 1.93, - "learning_rate": 1.017383407926315e-05, - "loss": 0.0088, + "epoch": 0.9, + "learning_rate": 0.0001647426227605935, + "loss": 0.0117, "step": 178730 }, { - "epoch": 1.93, - "learning_rate": 1.0157618213660244e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016473505506757948, + "loss": 0.0123, "step": 178740 }, { - "epoch": 1.93, - "learning_rate": 1.0141402348057339e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.0001647274873745655, + "loss": 0.0158, "step": 178750 }, { - "epoch": 1.93, - "learning_rate": 1.0125186482454433e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016471991968155147, + "loss": 0.0112, "step": 178760 }, { - "epoch": 1.93, - "learning_rate": 1.0108970616851526e-05, - "loss": 0.0092, + "epoch": 0.9, + "learning_rate": 0.00016471235198853746, + "loss": 0.0115, "step": 178770 }, { - "epoch": 1.93, - "learning_rate": 1.009275475124862e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016470478429552344, + "loss": 0.0109, "step": 178780 }, { - "epoch": 1.93, - "learning_rate": 1.0076538885645715e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.00016469721660250945, + "loss": 0.0146, "step": 178790 }, { - "epoch": 1.93, - "learning_rate": 1.006032302004281e-05, - "loss": 0.0072, + "epoch": 0.9, + "learning_rate": 0.00016468964890949543, + "loss": 0.0112, "step": 178800 }, { - "epoch": 1.93, - "learning_rate": 1.0044107154439902e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.0001646820812164814, + "loss": 0.0119, "step": 178810 }, { - "epoch": 1.93, - "learning_rate": 1.0027891288836996e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016467451352346742, + "loss": 0.0112, "step": 178820 }, { - "epoch": 1.93, - "learning_rate": 1.001167542323409e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.0001646669458304534, + "loss": 0.0146, "step": 178830 }, { - "epoch": 1.93, - "learning_rate": 9.995459557631187e-06, - "loss": 0.0082, + "epoch": 0.9, + "learning_rate": 0.00016465937813743938, + "loss": 0.0134, "step": 178840 }, { - "epoch": 1.93, - "learning_rate": 9.97924369202828e-06, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.0001646518104444254, + "loss": 0.012, "step": 178850 }, { - "epoch": 1.93, - "learning_rate": 9.963027826425374e-06, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016464424275141137, + "loss": 0.0108, "step": 178860 }, { - "epoch": 1.93, - "learning_rate": 9.946811960822469e-06, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016463667505839735, + "loss": 0.0084, "step": 178870 }, { - "epoch": 1.93, - "learning_rate": 9.930596095219563e-06, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016462910736538336, + "loss": 0.0092, "step": 178880 }, { - "epoch": 1.93, - "learning_rate": 9.914380229616656e-06, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016462153967236934, + "loss": 0.0154, "step": 178890 }, { - "epoch": 1.93, - "learning_rate": 9.89816436401375e-06, - "loss": 0.004, + "epoch": 0.9, + "learning_rate": 0.00016461397197935532, + "loss": 0.0109, "step": 178900 }, { - "epoch": 1.93, - "learning_rate": 9.881948498410845e-06, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016460640428634133, + "loss": 0.0132, "step": 178910 }, { - "epoch": 1.93, - "learning_rate": 9.865732632807939e-06, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.0001645988365933273, + "loss": 0.0105, "step": 178920 }, { - "epoch": 1.93, - "learning_rate": 9.849516767205032e-06, - "loss": 0.007, + "epoch": 0.9, + "learning_rate": 0.0001645912689003133, + "loss": 0.0105, "step": 178930 }, { - "epoch": 1.93, - "learning_rate": 9.833300901602126e-06, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.0001645837012072993, + "loss": 0.0108, "step": 178940 }, { - "epoch": 1.93, - "learning_rate": 9.81708503599922e-06, - "loss": 0.0076, + "epoch": 0.9, + "learning_rate": 0.00016457613351428528, + "loss": 0.0109, "step": 178950 }, { - "epoch": 1.93, - "learning_rate": 9.800869170396315e-06, - "loss": 0.0081, + "epoch": 0.9, + "learning_rate": 0.00016456856582127127, + "loss": 0.0113, "step": 178960 }, { - "epoch": 1.93, - "learning_rate": 9.784653304793408e-06, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.00016456099812825725, + "loss": 0.0142, "step": 178970 }, { - "epoch": 1.93, - "learning_rate": 9.768437439190502e-06, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016455343043524326, + "loss": 0.0113, "step": 178980 }, { - "epoch": 1.93, - "learning_rate": 9.752221573587597e-06, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.00016454586274222924, + "loss": 0.0103, "step": 178990 }, { - "epoch": 1.94, - "learning_rate": 9.736005707984691e-06, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016453829504921522, + "loss": 0.0116, "step": 179000 }, { - "epoch": 1.94, - "eval_cer": 0.9215199856854233, - "eval_loss": 0.005271059460937977, - "eval_runtime": 121.1797, - "eval_samples_per_second": 16.504, - "eval_steps_per_second": 4.126, + "epoch": 0.9, + "eval_cer": 0.914462492734159, + "eval_loss": 0.008126331493258476, + "eval_runtime": 116.7985, + "eval_samples_per_second": 17.124, + "eval_steps_per_second": 4.281, "step": 179000 }, { - "epoch": 1.94, - "learning_rate": 9.719789842381784e-06, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016453072735620123, + "loss": 0.0122, "step": 179010 }, { - "epoch": 1.94, - "learning_rate": 9.70357397677888e-06, - "loss": 0.0077, + "epoch": 0.9, + "learning_rate": 0.0001645231596631872, + "loss": 0.0112, "step": 179020 }, { - "epoch": 1.94, - "learning_rate": 9.687358111175974e-06, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.0001645155919701732, + "loss": 0.0103, "step": 179030 }, { - "epoch": 1.94, - "learning_rate": 9.671142245573069e-06, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.0001645080242771592, + "loss": 0.0118, "step": 179040 }, { - "epoch": 1.94, - "learning_rate": 9.654926379970163e-06, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016450045658414518, + "loss": 0.0124, "step": 179050 }, { - "epoch": 1.94, - "learning_rate": 9.638710514367256e-06, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016449288889113116, + "loss": 0.0115, "step": 179060 }, { - "epoch": 1.94, - "learning_rate": 9.62249464876435e-06, - "loss": 0.0045, + "epoch": 0.9, + "learning_rate": 0.00016448532119811717, + "loss": 0.0093, "step": 179070 }, { - "epoch": 1.94, - "learning_rate": 9.606278783161445e-06, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016447775350510315, + "loss": 0.0099, "step": 179080 }, { - "epoch": 1.94, - "learning_rate": 9.59006291755854e-06, - "loss": 0.0073, + "epoch": 0.9, + "learning_rate": 0.00016447018581208913, + "loss": 0.0112, "step": 179090 }, { - "epoch": 1.94, - "learning_rate": 9.573847051955632e-06, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.00016446261811907514, + "loss": 0.011, "step": 179100 }, { - "epoch": 1.94, - "learning_rate": 9.557631186352727e-06, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.0001644550504260611, + "loss": 0.0172, "step": 179110 }, { - "epoch": 1.94, - "learning_rate": 9.541415320749821e-06, - "loss": 0.0045, + "epoch": 0.9, + "learning_rate": 0.00016444748273304708, + "loss": 0.0158, "step": 179120 }, { - "epoch": 1.94, - "learning_rate": 9.525199455146915e-06, - "loss": 0.0071, + "epoch": 0.9, + "learning_rate": 0.00016443991504003306, + "loss": 0.0119, "step": 179130 }, { - "epoch": 1.94, - "learning_rate": 9.508983589544008e-06, - "loss": 0.008, + "epoch": 0.9, + "learning_rate": 0.00016443234734701907, + "loss": 0.0134, "step": 179140 }, { - "epoch": 1.94, - "learning_rate": 9.492767723941103e-06, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.00016442477965400505, + "loss": 0.0099, "step": 179150 }, { - "epoch": 1.94, - "learning_rate": 9.476551858338197e-06, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016441721196099103, + "loss": 0.0115, "step": 179160 }, { - "epoch": 1.94, - "learning_rate": 9.46033599273529e-06, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.000164409644267977, + "loss": 0.0117, "step": 179170 }, { - "epoch": 1.94, - "learning_rate": 9.444120127132384e-06, - "loss": 0.0076, + "epoch": 0.9, + "learning_rate": 0.00016440207657496302, + "loss": 0.0097, "step": 179180 }, { - "epoch": 1.94, - "learning_rate": 9.427904261529479e-06, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.000164394508881949, + "loss": 0.0103, "step": 179190 }, { - "epoch": 1.94, - "learning_rate": 9.411688395926575e-06, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016438694118893498, + "loss": 0.0105, "step": 179200 }, { - "epoch": 1.94, - "learning_rate": 9.39547253032367e-06, - "loss": 0.0081, + "epoch": 0.9, + "learning_rate": 0.000164379373495921, + "loss": 0.0112, "step": 179210 }, { - "epoch": 1.94, - "learning_rate": 9.379256664720762e-06, - "loss": 0.007, + "epoch": 0.9, + "learning_rate": 0.00016437180580290697, + "loss": 0.0147, "step": 179220 }, { - "epoch": 1.94, - "learning_rate": 9.363040799117856e-06, - "loss": 0.0116, + "epoch": 0.9, + "learning_rate": 0.00016436423810989295, + "loss": 0.0154, "step": 179230 }, { - "epoch": 1.94, - "learning_rate": 9.34682493351495e-06, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016435667041687896, + "loss": 0.0091, "step": 179240 }, { - "epoch": 1.94, - "learning_rate": 9.330609067912045e-06, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016434910272386494, + "loss": 0.0099, "step": 179250 }, { - "epoch": 1.94, - "learning_rate": 9.314393202309138e-06, - "loss": 0.0046, + "epoch": 0.9, + "learning_rate": 0.00016434153503085093, + "loss": 0.0115, "step": 179260 }, { - "epoch": 1.94, - "learning_rate": 9.298177336706232e-06, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016433396733783693, + "loss": 0.0138, "step": 179270 }, { - "epoch": 1.94, - "learning_rate": 9.281961471103327e-06, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016432639964482292, + "loss": 0.0116, "step": 179280 }, { - "epoch": 1.94, - "learning_rate": 9.265745605500421e-06, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.0001643188319518089, + "loss": 0.0104, "step": 179290 }, { - "epoch": 1.94, - "learning_rate": 9.249529739897514e-06, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.0001643112642587949, + "loss": 0.0115, "step": 179300 }, { - "epoch": 1.94, - "learning_rate": 9.233313874294609e-06, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.0001643036965657809, + "loss": 0.0136, "step": 179310 }, { - "epoch": 1.94, - "learning_rate": 9.217098008691703e-06, - "loss": 0.0078, + "epoch": 0.9, + "learning_rate": 0.00016429612887276687, + "loss": 0.0123, "step": 179320 }, { - "epoch": 1.94, - "learning_rate": 9.200882143088797e-06, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.00016428856117975288, + "loss": 0.0089, "step": 179330 }, { - "epoch": 1.94, - "learning_rate": 9.184666277485892e-06, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016428099348673886, + "loss": 0.0113, "step": 179340 }, { - "epoch": 1.94, - "learning_rate": 9.168450411882986e-06, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016427342579372484, + "loss": 0.0096, "step": 179350 }, { - "epoch": 1.94, - "learning_rate": 9.152234546280079e-06, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.00016426585810071082, + "loss": 0.0138, "step": 179360 }, { - "epoch": 1.94, - "learning_rate": 9.136018680677173e-06, - "loss": 0.0071, + "epoch": 0.9, + "learning_rate": 0.00016425829040769683, + "loss": 0.0143, "step": 179370 }, { - "epoch": 1.94, - "learning_rate": 9.119802815074268e-06, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.0001642507227146828, + "loss": 0.011, "step": 179380 }, { - "epoch": 1.94, - "learning_rate": 9.103586949471362e-06, - "loss": 0.0082, + "epoch": 0.91, + "learning_rate": 0.0001642431550216688, + "loss": 0.016, "step": 179390 }, { - "epoch": 1.94, - "learning_rate": 9.087371083868455e-06, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.0001642355873286548, + "loss": 0.0085, "step": 179400 }, { - "epoch": 1.94, - "learning_rate": 9.07115521826555e-06, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016422801963564078, + "loss": 0.0114, "step": 179410 }, { - "epoch": 1.94, - "learning_rate": 9.054939352662644e-06, - "loss": 0.0077, + "epoch": 0.91, + "learning_rate": 0.00016422045194262676, + "loss": 0.0136, "step": 179420 }, { - "epoch": 1.94, - "learning_rate": 9.038723487059738e-06, - "loss": 0.0086, + "epoch": 0.91, + "learning_rate": 0.00016421288424961277, + "loss": 0.0112, "step": 179430 }, { - "epoch": 1.94, - "learning_rate": 9.022507621456833e-06, - "loss": 0.0078, + "epoch": 0.91, + "learning_rate": 0.00016420531655659875, + "loss": 0.0095, "step": 179440 }, { - "epoch": 1.94, - "learning_rate": 9.006291755853927e-06, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.00016419774886358474, + "loss": 0.0133, "step": 179450 }, { - "epoch": 1.94, - "learning_rate": 8.990075890251022e-06, - "loss": 0.0092, + "epoch": 0.91, + "learning_rate": 0.00016419018117057074, + "loss": 0.0114, "step": 179460 }, { - "epoch": 1.94, - "learning_rate": 8.973860024648114e-06, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.00016418261347755673, + "loss": 0.0114, "step": 179470 }, { - "epoch": 1.94, - "learning_rate": 8.957644159045209e-06, - "loss": 0.0078, + "epoch": 0.91, + "learning_rate": 0.0001641750457845427, + "loss": 0.0123, "step": 179480 }, { - "epoch": 1.94, - "learning_rate": 8.941428293442303e-06, - "loss": 0.0079, + "epoch": 0.91, + "learning_rate": 0.00016416747809152872, + "loss": 0.0099, "step": 179490 }, { - "epoch": 1.94, - "learning_rate": 8.925212427839396e-06, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.0001641599103985147, + "loss": 0.0091, "step": 179500 }, { - "epoch": 1.94, - "learning_rate": 8.90899656223649e-06, - "loss": 0.0081, + "epoch": 0.91, + "learning_rate": 0.00016415234270550068, + "loss": 0.0111, "step": 179510 }, { - "epoch": 1.94, - "learning_rate": 8.892780696633587e-06, - "loss": 0.0069, + "epoch": 0.91, + "learning_rate": 0.00016414477501248666, + "loss": 0.0107, "step": 179520 }, { - "epoch": 1.94, - "learning_rate": 8.87656483103068e-06, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.00016413720731947267, + "loss": 0.0132, "step": 179530 }, { - "epoch": 1.94, - "learning_rate": 8.860348965427774e-06, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.00016412963962645865, + "loss": 0.013, "step": 179540 }, { - "epoch": 1.94, - "learning_rate": 8.844133099824868e-06, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.00016412207193344463, + "loss": 0.0153, "step": 179550 }, { - "epoch": 1.94, - "learning_rate": 8.827917234221963e-06, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016411450424043064, + "loss": 0.0129, "step": 179560 }, { - "epoch": 1.94, - "learning_rate": 8.811701368619055e-06, - "loss": 0.0078, + "epoch": 0.91, + "learning_rate": 0.00016410693654741662, + "loss": 0.0094, "step": 179570 }, { - "epoch": 1.94, - "learning_rate": 8.79548550301615e-06, - "loss": 0.007, + "epoch": 0.91, + "learning_rate": 0.0001640993688544026, + "loss": 0.0216, "step": 179580 }, { - "epoch": 1.94, - "learning_rate": 8.779269637413244e-06, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.0001640918011613886, + "loss": 0.0112, "step": 179590 }, { - "epoch": 1.94, - "learning_rate": 8.763053771810339e-06, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.0001640842334683746, + "loss": 0.0135, "step": 179600 }, { - "epoch": 1.94, - "learning_rate": 8.746837906207433e-06, - "loss": 0.0044, + "epoch": 0.91, + "learning_rate": 0.00016407666577536058, + "loss": 0.0111, "step": 179610 }, { - "epoch": 1.94, - "learning_rate": 8.730622040604528e-06, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016406909808234658, + "loss": 0.0102, "step": 179620 }, { - "epoch": 1.94, - "learning_rate": 8.71440617500162e-06, - "loss": 0.0042, + "epoch": 0.91, + "learning_rate": 0.00016406153038933257, + "loss": 0.0128, "step": 179630 }, { - "epoch": 1.94, - "learning_rate": 8.698190309398715e-06, - "loss": 0.0079, + "epoch": 0.91, + "learning_rate": 0.00016405396269631855, + "loss": 0.0116, "step": 179640 }, { - "epoch": 1.94, - "learning_rate": 8.68197444379581e-06, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.00016404639500330455, + "loss": 0.0101, "step": 179650 }, { - "epoch": 1.94, - "learning_rate": 8.665758578192904e-06, - "loss": 0.0086, + "epoch": 0.91, + "learning_rate": 0.00016403882731029054, + "loss": 0.0109, "step": 179660 }, { - "epoch": 1.94, - "learning_rate": 8.649542712589996e-06, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.00016403125961727652, + "loss": 0.0108, "step": 179670 }, { - "epoch": 1.94, - "learning_rate": 8.633326846987091e-06, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.0001640236919242625, + "loss": 0.0129, "step": 179680 }, { - "epoch": 1.94, - "learning_rate": 8.617110981384185e-06, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.0001640161242312485, + "loss": 0.017, "step": 179690 }, { - "epoch": 1.94, - "learning_rate": 8.60089511578128e-06, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.0001640085565382345, + "loss": 0.0116, "step": 179700 }, { - "epoch": 1.94, - "learning_rate": 8.584679250178374e-06, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016400098884522047, + "loss": 0.0136, "step": 179710 }, { - "epoch": 1.94, - "learning_rate": 8.568463384575469e-06, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016399342115220648, + "loss": 0.0121, "step": 179720 }, { - "epoch": 1.94, - "learning_rate": 8.552247518972561e-06, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016398585345919246, + "loss": 0.0084, "step": 179730 }, { - "epoch": 1.94, - "learning_rate": 8.536031653369656e-06, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.00016397828576617844, + "loss": 0.0114, "step": 179740 }, { - "epoch": 1.94, - "learning_rate": 8.51981578776675e-06, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016397071807316445, + "loss": 0.0114, "step": 179750 }, { - "epoch": 1.94, - "learning_rate": 8.503599922163845e-06, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016396315038015043, + "loss": 0.0088, "step": 179760 }, { - "epoch": 1.94, - "learning_rate": 8.487384056560937e-06, - "loss": 0.0075, + "epoch": 0.91, + "learning_rate": 0.00016395558268713641, + "loss": 0.0116, "step": 179770 }, { - "epoch": 1.94, - "learning_rate": 8.471168190958032e-06, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016394801499412242, + "loss": 0.0152, "step": 179780 }, { - "epoch": 1.94, - "learning_rate": 8.454952325355126e-06, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.0001639404473011084, + "loss": 0.0115, "step": 179790 }, { - "epoch": 1.94, - "learning_rate": 8.43873645975222e-06, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016393287960809439, + "loss": 0.0113, "step": 179800 }, { - "epoch": 1.94, - "learning_rate": 8.422520594149315e-06, - "loss": 0.0073, + "epoch": 0.91, + "learning_rate": 0.0001639253119150804, + "loss": 0.0165, "step": 179810 }, { - "epoch": 1.94, - "learning_rate": 8.40630472854641e-06, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016391774422206638, + "loss": 0.0098, "step": 179820 }, { - "epoch": 1.94, - "learning_rate": 8.390088862943502e-06, - "loss": 0.0066, + "epoch": 0.91, + "learning_rate": 0.00016391017652905236, + "loss": 0.0113, "step": 179830 }, { - "epoch": 1.94, - "learning_rate": 8.373872997340597e-06, - "loss": 0.0069, + "epoch": 0.91, + "learning_rate": 0.00016390260883603837, + "loss": 0.0115, "step": 179840 }, { - "epoch": 1.94, - "learning_rate": 8.357657131737691e-06, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.00016389504114302435, + "loss": 0.0126, "step": 179850 }, { - "epoch": 1.94, - "learning_rate": 8.341441266134786e-06, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.00016388747345001033, + "loss": 0.0115, "step": 179860 }, { - "epoch": 1.94, - "learning_rate": 8.32522540053188e-06, - "loss": 0.0071, + "epoch": 0.91, + "learning_rate": 0.0001638799057569963, + "loss": 0.0117, "step": 179870 }, { - "epoch": 1.94, - "learning_rate": 8.309009534928975e-06, - "loss": 0.0073, + "epoch": 0.91, + "learning_rate": 0.00016387233806398232, + "loss": 0.0093, "step": 179880 }, { - "epoch": 1.94, - "learning_rate": 8.292793669326069e-06, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.0001638647703709683, + "loss": 0.0101, "step": 179890 }, { - "epoch": 1.94, - "learning_rate": 8.276577803723162e-06, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.00016385720267795428, + "loss": 0.0081, "step": 179900 }, { - "epoch": 1.94, - "learning_rate": 8.260361938120256e-06, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.0001638496349849403, + "loss": 0.0092, "step": 179910 }, { - "epoch": 1.95, - "learning_rate": 8.24414607251735e-06, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016384206729192627, + "loss": 0.01, "step": 179920 }, { - "epoch": 1.95, - "learning_rate": 8.227930206914445e-06, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.00016383449959891225, + "loss": 0.0094, "step": 179930 }, { - "epoch": 1.95, - "learning_rate": 8.211714341311538e-06, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016382693190589826, + "loss": 0.0129, "step": 179940 }, { - "epoch": 1.95, - "learning_rate": 8.195498475708632e-06, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016381936421288424, + "loss": 0.0149, "step": 179950 }, { - "epoch": 1.95, - "learning_rate": 8.179282610105727e-06, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.00016381179651987022, + "loss": 0.0094, "step": 179960 }, { - "epoch": 1.95, - "learning_rate": 8.163066744502821e-06, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016380422882685623, + "loss": 0.0134, "step": 179970 }, { - "epoch": 1.95, - "learning_rate": 8.146850878899916e-06, - "loss": 0.0101, + "epoch": 0.91, + "learning_rate": 0.00016379666113384221, + "loss": 0.0091, "step": 179980 }, { - "epoch": 1.95, - "learning_rate": 8.13063501329701e-06, - "loss": 0.0077, + "epoch": 0.91, + "learning_rate": 0.0001637890934408282, + "loss": 0.0098, "step": 179990 }, { - "epoch": 1.95, - "learning_rate": 8.114419147694103e-06, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.0001637815257478142, + "loss": 0.0102, "step": 180000 }, { - "epoch": 1.95, - "eval_cer": 0.9215034822292522, - "eval_loss": 0.005232350900769234, - "eval_runtime": 121.4858, - "eval_samples_per_second": 16.463, - "eval_steps_per_second": 4.116, + "epoch": 0.91, + "eval_cer": 0.9144857822411687, + "eval_loss": 0.008224265649914742, + "eval_runtime": 116.6551, + "eval_samples_per_second": 17.145, + "eval_steps_per_second": 4.286, "step": 180000 }, { - "epoch": 1.95, - "learning_rate": 8.098203282091197e-06, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016377395805480019, + "loss": 0.0104, "step": 180010 }, { - "epoch": 1.95, - "learning_rate": 8.081987416488292e-06, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016376639036178617, + "loss": 0.009, "step": 180020 }, { - "epoch": 1.95, - "learning_rate": 8.065771550885386e-06, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016375882266877215, + "loss": 0.0138, "step": 180030 }, { - "epoch": 1.95, - "learning_rate": 8.049555685282479e-06, - "loss": 0.0043, + "epoch": 0.91, + "learning_rate": 0.00016375125497575816, + "loss": 0.0099, "step": 180040 }, { - "epoch": 1.95, - "learning_rate": 8.033339819679575e-06, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.00016374368728274414, + "loss": 0.0122, "step": 180050 }, { - "epoch": 1.95, - "learning_rate": 8.017123954076668e-06, - "loss": 0.007, + "epoch": 0.91, + "learning_rate": 0.00016373611958973012, + "loss": 0.0136, "step": 180060 }, { - "epoch": 1.95, - "learning_rate": 8.000908088473762e-06, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016372855189671613, + "loss": 0.0124, "step": 180070 }, { - "epoch": 1.95, - "learning_rate": 7.984692222870857e-06, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.0001637209842037021, + "loss": 0.012, "step": 180080 }, { - "epoch": 1.95, - "learning_rate": 7.968476357267951e-06, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.0001637134165106881, + "loss": 0.0144, "step": 180090 }, { - "epoch": 1.95, - "learning_rate": 7.952260491665044e-06, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.0001637058488176741, + "loss": 0.0098, "step": 180100 }, { - "epoch": 1.95, - "learning_rate": 7.936044626062138e-06, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016369828112466008, + "loss": 0.0116, "step": 180110 }, { - "epoch": 1.95, - "learning_rate": 7.919828760459233e-06, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016369071343164606, + "loss": 0.0117, "step": 180120 }, { - "epoch": 1.95, - "learning_rate": 7.903612894856327e-06, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016368314573863207, + "loss": 0.0141, "step": 180130 }, { - "epoch": 1.95, - "learning_rate": 7.887397029253421e-06, - "loss": 0.0056, + "epoch": 0.91, + "learning_rate": 0.00016367557804561805, + "loss": 0.0137, "step": 180140 }, { - "epoch": 1.95, - "learning_rate": 7.871181163650516e-06, - "loss": 0.0092, + "epoch": 0.91, + "learning_rate": 0.00016366801035260403, + "loss": 0.0102, "step": 180150 }, { - "epoch": 1.95, - "learning_rate": 7.854965298047609e-06, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016366044265959004, + "loss": 0.01, "step": 180160 }, { - "epoch": 1.95, - "learning_rate": 7.838749432444703e-06, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016365287496657602, + "loss": 0.0135, "step": 180170 }, { - "epoch": 1.95, - "learning_rate": 7.822533566841798e-06, - "loss": 0.0092, + "epoch": 0.91, + "learning_rate": 0.000163645307273562, + "loss": 0.0099, "step": 180180 }, { - "epoch": 1.95, - "learning_rate": 7.806317701238892e-06, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.000163637739580548, + "loss": 0.0117, "step": 180190 }, { - "epoch": 1.95, - "learning_rate": 7.790101835635985e-06, - "loss": 0.0077, + "epoch": 0.91, + "learning_rate": 0.000163630171887534, + "loss": 0.0101, "step": 180200 }, { - "epoch": 1.95, - "learning_rate": 7.773885970033079e-06, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016362260419451998, + "loss": 0.0106, "step": 180210 }, { - "epoch": 1.95, - "learning_rate": 7.757670104430174e-06, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016361503650150596, + "loss": 0.0133, "step": 180220 }, { - "epoch": 1.95, - "learning_rate": 7.741454238827268e-06, - "loss": 0.0056, + "epoch": 0.91, + "learning_rate": 0.00016360746880849197, + "loss": 0.0111, "step": 180230 }, { - "epoch": 1.95, - "learning_rate": 7.725238373224362e-06, - "loss": 0.004, + "epoch": 0.91, + "learning_rate": 0.00016359990111547795, + "loss": 0.0166, "step": 180240 }, { - "epoch": 1.95, - "learning_rate": 7.709022507621457e-06, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016359233342246393, + "loss": 0.0103, "step": 180250 }, { - "epoch": 1.95, - "learning_rate": 7.69280664201855e-06, - "loss": 0.0066, + "epoch": 0.91, + "learning_rate": 0.00016358476572944994, + "loss": 0.012, "step": 180260 }, { - "epoch": 1.95, - "learning_rate": 7.676590776415644e-06, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.00016357719803643592, + "loss": 0.0113, "step": 180270 }, { - "epoch": 1.95, - "learning_rate": 7.660374910812738e-06, - "loss": 0.0069, + "epoch": 0.91, + "learning_rate": 0.0001635696303434219, + "loss": 0.0109, "step": 180280 }, { - "epoch": 1.95, - "learning_rate": 7.644159045209833e-06, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.0001635620626504079, + "loss": 0.0108, "step": 180290 }, { - "epoch": 1.95, - "learning_rate": 7.6279431796069265e-06, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.0001635544949573939, + "loss": 0.0105, "step": 180300 }, { - "epoch": 1.95, - "learning_rate": 7.61172731400402e-06, - "loss": 0.0071, + "epoch": 0.91, + "learning_rate": 0.00016354692726437987, + "loss": 0.0112, "step": 180310 }, { - "epoch": 1.95, - "learning_rate": 7.595511448401115e-06, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.00016353935957136588, + "loss": 0.0114, "step": 180320 }, { - "epoch": 1.95, - "learning_rate": 7.57929558279821e-06, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016353179187835186, + "loss": 0.0118, "step": 180330 }, { - "epoch": 1.95, - "learning_rate": 7.563079717195303e-06, - "loss": 0.0077, + "epoch": 0.91, + "learning_rate": 0.00016352422418533784, + "loss": 0.009, "step": 180340 }, { - "epoch": 1.95, - "learning_rate": 7.546863851592398e-06, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016351665649232383, + "loss": 0.0114, "step": 180350 }, { - "epoch": 1.95, - "learning_rate": 7.5306479859894914e-06, - "loss": 0.0044, + "epoch": 0.91, + "learning_rate": 0.00016350908879930983, + "loss": 0.0112, "step": 180360 }, { - "epoch": 1.95, - "learning_rate": 7.514432120386586e-06, - "loss": 0.0073, + "epoch": 0.91, + "learning_rate": 0.0001635015211062958, + "loss": 0.0081, "step": 180370 }, { - "epoch": 1.95, - "learning_rate": 7.4982162547836795e-06, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.00016349395341328177, + "loss": 0.0107, "step": 180380 }, { - "epoch": 1.95, - "learning_rate": 7.482000389180774e-06, - "loss": 0.0094, + "epoch": 0.91, + "learning_rate": 0.00016348638572026778, + "loss": 0.0115, "step": 180390 }, { - "epoch": 1.95, - "learning_rate": 7.4657845235778675e-06, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016347881802725376, + "loss": 0.0102, "step": 180400 }, { - "epoch": 1.95, - "learning_rate": 7.449568657974963e-06, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016347125033423974, + "loss": 0.0083, "step": 180410 }, { - "epoch": 1.95, - "learning_rate": 7.433352792372056e-06, - "loss": 0.0066, + "epoch": 0.91, + "learning_rate": 0.00016346368264122572, + "loss": 0.0111, "step": 180420 }, { - "epoch": 1.95, - "learning_rate": 7.417136926769151e-06, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016345611494821173, + "loss": 0.0124, "step": 180430 }, { - "epoch": 1.95, - "learning_rate": 7.400921061166244e-06, - "loss": 0.0075, + "epoch": 0.91, + "learning_rate": 0.0001634485472551977, + "loss": 0.0153, "step": 180440 }, { - "epoch": 1.95, - "learning_rate": 7.384705195563339e-06, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.0001634409795621837, + "loss": 0.0101, "step": 180450 }, { - "epoch": 1.95, - "learning_rate": 7.3684893299604324e-06, - "loss": 0.0041, + "epoch": 0.91, + "learning_rate": 0.0001634334118691697, + "loss": 0.0124, "step": 180460 }, { - "epoch": 1.95, - "learning_rate": 7.352273464357527e-06, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016342584417615568, + "loss": 0.0147, "step": 180470 }, { - "epoch": 1.95, - "learning_rate": 7.3360575987546205e-06, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.00016341827648314167, + "loss": 0.0126, "step": 180480 }, { - "epoch": 1.95, - "learning_rate": 7.319841733151715e-06, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.00016341070879012767, + "loss": 0.0176, "step": 180490 }, { - "epoch": 1.95, - "learning_rate": 7.303625867548809e-06, - "loss": 0.0096, + "epoch": 0.91, + "learning_rate": 0.00016340314109711366, + "loss": 0.0105, "step": 180500 }, { - "epoch": 1.95, - "learning_rate": 7.287410001945904e-06, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.00016339557340409964, + "loss": 0.0094, "step": 180510 }, { - "epoch": 1.95, - "learning_rate": 7.271194136342997e-06, - "loss": 0.0042, + "epoch": 0.91, + "learning_rate": 0.00016338800571108565, + "loss": 0.011, "step": 180520 }, { - "epoch": 1.95, - "learning_rate": 7.254978270740092e-06, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.00016338043801807163, + "loss": 0.014, "step": 180530 }, { - "epoch": 1.95, - "learning_rate": 7.238762405137185e-06, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.0001633728703250576, + "loss": 0.0174, "step": 180540 }, { - "epoch": 1.95, - "learning_rate": 7.22254653953428e-06, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.00016336530263204362, + "loss": 0.0089, "step": 180550 }, { - "epoch": 1.95, - "learning_rate": 7.206330673931373e-06, - "loss": 0.0071, + "epoch": 0.91, + "learning_rate": 0.0001633577349390296, + "loss": 0.0105, "step": 180560 }, { - "epoch": 1.95, - "learning_rate": 7.190114808328468e-06, - "loss": 0.0093, + "epoch": 0.91, + "learning_rate": 0.00016335016724601558, + "loss": 0.0146, "step": 180570 }, { - "epoch": 1.95, - "learning_rate": 7.1738989427255615e-06, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.00016334259955300156, + "loss": 0.0176, "step": 180580 }, { - "epoch": 1.95, - "learning_rate": 7.157683077122657e-06, - "loss": 0.008, + "epoch": 0.91, + "learning_rate": 0.00016333503185998757, + "loss": 0.0107, "step": 180590 }, { - "epoch": 1.95, - "learning_rate": 7.14146721151975e-06, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016332746416697355, + "loss": 0.0103, "step": 180600 }, { - "epoch": 1.95, - "learning_rate": 7.125251345916845e-06, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.00016331989647395953, + "loss": 0.0107, "step": 180610 }, { - "epoch": 1.95, - "learning_rate": 7.109035480313938e-06, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016331232878094554, + "loss": 0.0107, "step": 180620 }, { - "epoch": 1.95, - "learning_rate": 7.092819614711033e-06, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.00016330476108793152, + "loss": 0.0095, "step": 180630 }, { - "epoch": 1.95, - "learning_rate": 7.076603749108126e-06, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.0001632971933949175, + "loss": 0.0116, "step": 180640 }, { - "epoch": 1.95, - "learning_rate": 7.060387883505221e-06, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.0001632896257019035, + "loss": 0.0131, "step": 180650 }, { - "epoch": 1.95, - "learning_rate": 7.044172017902314e-06, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.0001632820580088895, + "loss": 0.0107, "step": 180660 }, { - "epoch": 1.95, - "learning_rate": 7.027956152299409e-06, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016327449031587548, + "loss": 0.01, "step": 180670 }, { - "epoch": 1.95, - "learning_rate": 7.011740286696504e-06, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016326692262286148, + "loss": 0.0089, "step": 180680 }, { - "epoch": 1.95, - "learning_rate": 6.995524421093598e-06, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.00016325935492984747, + "loss": 0.0114, "step": 180690 }, { - "epoch": 1.95, - "learning_rate": 6.979308555490692e-06, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016325178723683345, + "loss": 0.0102, "step": 180700 }, { - "epoch": 1.95, - "learning_rate": 6.963092689887786e-06, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.00016324421954381946, + "loss": 0.0129, "step": 180710 }, { - "epoch": 1.95, - "learning_rate": 6.94687682428488e-06, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.00016323665185080544, + "loss": 0.01, "step": 180720 }, { - "epoch": 1.95, - "learning_rate": 6.930660958681974e-06, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.00016322908415779142, + "loss": 0.011, "step": 180730 }, { - "epoch": 1.95, - "learning_rate": 6.914445093079067e-06, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016322151646477743, + "loss": 0.0117, "step": 180740 }, { - "epoch": 1.95, - "learning_rate": 6.898229227476162e-06, - "loss": 0.0066, + "epoch": 0.91, + "learning_rate": 0.0001632139487717634, + "loss": 0.0103, "step": 180750 }, { - "epoch": 1.95, - "learning_rate": 6.882013361873255e-06, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.0001632063810787494, + "loss": 0.0158, "step": 180760 }, { - "epoch": 1.95, - "learning_rate": 6.865797496270351e-06, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016319881338573537, + "loss": 0.0128, "step": 180770 }, { - "epoch": 1.95, - "learning_rate": 6.849581630667445e-06, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016319124569272138, + "loss": 0.01, "step": 180780 }, { - "epoch": 1.95, - "learning_rate": 6.833365765064539e-06, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016318367799970736, + "loss": 0.0094, "step": 180790 }, { - "epoch": 1.95, - "learning_rate": 6.817149899461633e-06, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016317611030669334, + "loss": 0.0103, "step": 180800 }, { - "epoch": 1.95, - "learning_rate": 6.800934033858727e-06, - "loss": 0.0071, + "epoch": 0.91, + "learning_rate": 0.00016316854261367935, + "loss": 0.0106, "step": 180810 }, { - "epoch": 1.95, - "learning_rate": 6.784718168255821e-06, - "loss": 0.0075, + "epoch": 0.91, + "learning_rate": 0.00016316097492066533, + "loss": 0.0114, "step": 180820 }, { - "epoch": 1.95, - "learning_rate": 6.768502302652915e-06, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.00016315340722765131, + "loss": 0.0127, "step": 180830 }, { - "epoch": 1.95, - "learning_rate": 6.752286437050009e-06, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.00016314583953463732, + "loss": 0.0129, "step": 180840 }, { - "epoch": 1.96, - "learning_rate": 6.736070571447103e-06, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.0001631382718416233, + "loss": 0.0116, "step": 180850 }, { - "epoch": 1.96, - "learning_rate": 6.719854705844198e-06, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016313070414860929, + "loss": 0.0113, "step": 180860 }, { - "epoch": 1.96, - "learning_rate": 6.703638840241292e-06, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001631231364555953, + "loss": 0.0112, "step": 180870 }, { - "epoch": 1.96, - "learning_rate": 6.687422974638386e-06, - "loss": 0.0042, + "epoch": 0.91, + "learning_rate": 0.00016311556876258128, + "loss": 0.0123, "step": 180880 }, { - "epoch": 1.96, - "learning_rate": 6.67120710903548e-06, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016310800106956726, + "loss": 0.0102, "step": 180890 }, { - "epoch": 1.96, - "learning_rate": 6.654991243432574e-06, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016310043337655327, + "loss": 0.0144, "step": 180900 }, { - "epoch": 1.96, - "learning_rate": 6.638775377829668e-06, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.00016309286568353925, + "loss": 0.0112, "step": 180910 }, { - "epoch": 1.96, - "learning_rate": 6.622559512226762e-06, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016308529799052523, + "loss": 0.0092, "step": 180920 }, { - "epoch": 1.96, - "learning_rate": 6.606343646623856e-06, - "loss": 0.0052, + "epoch": 0.91, + "learning_rate": 0.0001630777302975112, + "loss": 0.0096, "step": 180930 }, { - "epoch": 1.96, - "learning_rate": 6.59012778102095e-06, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.00016307016260449722, + "loss": 0.0115, "step": 180940 }, { - "epoch": 1.96, - "learning_rate": 6.573911915418045e-06, - "loss": 0.0101, + "epoch": 0.91, + "learning_rate": 0.0001630625949114832, + "loss": 0.0128, "step": 180950 }, { - "epoch": 1.96, - "learning_rate": 6.557696049815139e-06, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016305502721846918, + "loss": 0.0105, "step": 180960 }, { - "epoch": 1.96, - "learning_rate": 6.541480184212233e-06, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.0001630474595254552, + "loss": 0.0122, "step": 180970 }, { - "epoch": 1.96, - "learning_rate": 6.525264318609327e-06, - "loss": 0.0043, + "epoch": 0.91, + "learning_rate": 0.00016303989183244117, + "loss": 0.0095, "step": 180980 }, { - "epoch": 1.96, - "learning_rate": 6.509048453006421e-06, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016303232413942715, + "loss": 0.011, "step": 180990 }, { - "epoch": 1.96, - "learning_rate": 6.492832587403515e-06, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016302475644641316, + "loss": 0.0117, "step": 181000 }, { - "epoch": 1.96, - "eval_cer": 0.921500876420383, - "eval_loss": 0.005276523530483246, - "eval_runtime": 121.2902, - "eval_samples_per_second": 16.489, - "eval_steps_per_second": 4.122, + "epoch": 0.91, + "eval_cer": 0.9144751078837893, + "eval_loss": 0.008274085819721222, + "eval_runtime": 116.712, + "eval_samples_per_second": 17.136, + "eval_steps_per_second": 4.284, "step": 181000 }, { - "epoch": 1.96, - "learning_rate": 6.476616721800609e-06, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016301718875339914, + "loss": 0.0135, "step": 181010 }, { - "epoch": 1.96, - "learning_rate": 6.460400856197703e-06, - "loss": 0.0084, + "epoch": 0.91, + "learning_rate": 0.00016300962106038512, + "loss": 0.0104, "step": 181020 }, { - "epoch": 1.96, - "learning_rate": 6.444184990594797e-06, - "loss": 0.0088, + "epoch": 0.91, + "learning_rate": 0.00016300205336737113, + "loss": 0.0161, "step": 181030 }, { - "epoch": 1.96, - "learning_rate": 6.427969124991892e-06, - "loss": 0.0085, + "epoch": 0.91, + "learning_rate": 0.00016299448567435711, + "loss": 0.0133, "step": 181040 }, { - "epoch": 1.96, - "learning_rate": 6.411753259388986e-06, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.0001629869179813431, + "loss": 0.0125, "step": 181050 }, { - "epoch": 1.96, - "learning_rate": 6.39553739378608e-06, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.0001629793502883291, + "loss": 0.01, "step": 181060 }, { - "epoch": 1.96, - "learning_rate": 6.379321528183174e-06, - "loss": 0.0084, + "epoch": 0.91, + "learning_rate": 0.00016297178259531509, + "loss": 0.011, "step": 181070 }, { - "epoch": 1.96, - "learning_rate": 6.363105662580268e-06, - "loss": 0.0073, + "epoch": 0.91, + "learning_rate": 0.00016296421490230107, + "loss": 0.012, "step": 181080 }, { - "epoch": 1.96, - "learning_rate": 6.346889796977362e-06, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.00016295664720928705, + "loss": 0.0172, "step": 181090 }, { - "epoch": 1.96, - "learning_rate": 6.330673931374456e-06, - "loss": 0.0077, + "epoch": 0.91, + "learning_rate": 0.00016294907951627306, + "loss": 0.0121, "step": 181100 }, { - "epoch": 1.96, - "learning_rate": 6.31445806577155e-06, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016294151182325904, + "loss": 0.0132, "step": 181110 }, { - "epoch": 1.96, - "learning_rate": 6.298242200168644e-06, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016293394413024502, + "loss": 0.0124, "step": 181120 }, { - "epoch": 1.96, - "learning_rate": 6.282026334565739e-06, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016292637643723103, + "loss": 0.0106, "step": 181130 }, { - "epoch": 1.96, - "learning_rate": 6.265810468962833e-06, - "loss": 0.0069, + "epoch": 0.91, + "learning_rate": 0.000162918808744217, + "loss": 0.0103, "step": 181140 }, { - "epoch": 1.96, - "learning_rate": 6.2495946033599274e-06, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.000162911241051203, + "loss": 0.0125, "step": 181150 }, { - "epoch": 1.96, - "learning_rate": 6.233378737757021e-06, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.000162903673358189, + "loss": 0.0085, "step": 181160 }, { - "epoch": 1.96, - "learning_rate": 6.2171628721541155e-06, - "loss": 0.0052, + "epoch": 0.91, + "learning_rate": 0.00016289610566517498, + "loss": 0.0128, "step": 181170 }, { - "epoch": 1.96, - "learning_rate": 6.200947006551209e-06, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.00016288853797216096, + "loss": 0.0177, "step": 181180 }, { - "epoch": 1.96, - "learning_rate": 6.1847311409483035e-06, - "loss": 0.0082, + "epoch": 0.91, + "learning_rate": 0.00016288097027914697, + "loss": 0.0123, "step": 181190 }, { - "epoch": 1.96, - "learning_rate": 6.168515275345397e-06, - "loss": 0.0044, + "epoch": 0.91, + "learning_rate": 0.00016287340258613295, + "loss": 0.0179, "step": 181200 }, { - "epoch": 1.96, - "learning_rate": 6.152299409742491e-06, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016286583489311893, + "loss": 0.0151, "step": 181210 }, { - "epoch": 1.96, - "learning_rate": 6.136083544139586e-06, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016285826720010494, + "loss": 0.0134, "step": 181220 }, { - "epoch": 1.96, - "learning_rate": 6.11986767853668e-06, - "loss": 0.0073, + "epoch": 0.91, + "learning_rate": 0.00016285069950709092, + "loss": 0.0125, "step": 181230 }, { - "epoch": 1.96, - "learning_rate": 6.103651812933774e-06, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.0001628431318140769, + "loss": 0.0148, "step": 181240 }, { - "epoch": 1.96, - "learning_rate": 6.0874359473308684e-06, - "loss": 0.0071, + "epoch": 0.91, + "learning_rate": 0.0001628355641210629, + "loss": 0.0166, "step": 181250 }, { - "epoch": 1.96, - "learning_rate": 6.071220081727962e-06, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001628279964280489, + "loss": 0.0099, "step": 181260 }, { - "epoch": 1.96, - "learning_rate": 6.0550042161250565e-06, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016282042873503488, + "loss": 0.0088, "step": 181270 }, { - "epoch": 1.96, - "learning_rate": 6.03878835052215e-06, - "loss": 0.0079, + "epoch": 0.91, + "learning_rate": 0.00016281286104202086, + "loss": 0.0117, "step": 181280 }, { - "epoch": 1.96, - "learning_rate": 6.0225724849192445e-06, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016280529334900687, + "loss": 0.0105, "step": 181290 }, { - "epoch": 1.96, - "learning_rate": 6.006356619316338e-06, - "loss": 0.0077, + "epoch": 0.91, + "learning_rate": 0.00016279772565599285, + "loss": 0.0113, "step": 181300 }, { - "epoch": 1.96, - "learning_rate": 5.990140753713433e-06, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.00016279015796297883, + "loss": 0.0119, "step": 181310 }, { - "epoch": 1.96, - "learning_rate": 5.973924888110527e-06, - "loss": 0.0069, + "epoch": 0.91, + "learning_rate": 0.00016278259026996484, + "loss": 0.0134, "step": 181320 }, { - "epoch": 1.96, - "learning_rate": 5.957709022507621e-06, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016277502257695082, + "loss": 0.0111, "step": 181330 }, { - "epoch": 1.96, - "learning_rate": 5.941493156904715e-06, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.0001627674548839368, + "loss": 0.0132, "step": 181340 }, { - "epoch": 1.96, - "learning_rate": 5.925277291301809e-06, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.0001627598871909228, + "loss": 0.0114, "step": 181350 }, { - "epoch": 1.96, - "learning_rate": 5.909061425698903e-06, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.0001627523194979088, + "loss": 0.0106, "step": 181360 }, { - "epoch": 1.96, - "learning_rate": 5.8928455600959975e-06, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016274475180489477, + "loss": 0.0103, "step": 181370 }, { - "epoch": 1.96, - "learning_rate": 5.876629694493091e-06, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016273718411188078, + "loss": 0.011, "step": 181380 }, { - "epoch": 1.96, - "learning_rate": 5.8604138288901855e-06, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016272961641886676, + "loss": 0.0136, "step": 181390 }, { - "epoch": 1.96, - "learning_rate": 5.84419796328728e-06, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016272204872585274, + "loss": 0.0108, "step": 181400 }, { - "epoch": 1.96, - "learning_rate": 5.827982097684374e-06, - "loss": 0.0042, + "epoch": 0.92, + "learning_rate": 0.00016271448103283875, + "loss": 0.0122, "step": 181410 }, { - "epoch": 1.96, - "learning_rate": 5.811766232081468e-06, - "loss": 0.0077, + "epoch": 0.92, + "learning_rate": 0.00016270691333982473, + "loss": 0.0108, "step": 181420 }, { - "epoch": 1.96, - "learning_rate": 5.795550366478562e-06, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016269934564681072, + "loss": 0.0103, "step": 181430 }, { - "epoch": 1.96, - "learning_rate": 5.779334500875656e-06, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.0001626917779537967, + "loss": 0.0096, "step": 181440 }, { - "epoch": 1.96, - "learning_rate": 5.76311863527275e-06, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.0001626842102607827, + "loss": 0.0135, "step": 181450 }, { - "epoch": 1.96, - "learning_rate": 5.746902769669844e-06, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.0001626766425677687, + "loss": 0.011, "step": 181460 }, { - "epoch": 1.96, - "learning_rate": 5.7306869040669384e-06, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016266907487475467, + "loss": 0.0131, "step": 181470 }, { - "epoch": 1.96, - "learning_rate": 5.714471038464032e-06, - "loss": 0.0076, + "epoch": 0.92, + "learning_rate": 0.00016266150718174068, + "loss": 0.0087, "step": 181480 }, { - "epoch": 1.96, - "learning_rate": 5.698255172861127e-06, - "loss": 0.0037, + "epoch": 0.92, + "learning_rate": 0.00016265393948872666, + "loss": 0.0126, "step": 181490 }, { - "epoch": 1.96, - "learning_rate": 5.682039307258222e-06, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016264637179571264, + "loss": 0.0088, "step": 181500 }, { - "epoch": 1.96, - "learning_rate": 5.665823441655315e-06, - "loss": 0.008, + "epoch": 0.92, + "learning_rate": 0.00016263880410269865, + "loss": 0.0153, "step": 181510 }, { - "epoch": 1.96, - "learning_rate": 5.649607576052409e-06, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.00016263123640968463, + "loss": 0.0109, "step": 181520 }, { - "epoch": 1.96, - "learning_rate": 5.633391710449503e-06, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.0001626236687166706, + "loss": 0.0104, "step": 181530 }, { - "epoch": 1.96, - "learning_rate": 5.617175844846597e-06, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016261610102365662, + "loss": 0.011, "step": 181540 }, { - "epoch": 1.96, - "learning_rate": 5.600959979243691e-06, - "loss": 0.0046, + "epoch": 0.92, + "learning_rate": 0.0001626085333306426, + "loss": 0.0116, "step": 181550 }, { - "epoch": 1.96, - "learning_rate": 5.584744113640785e-06, - "loss": 0.0068, + "epoch": 0.92, + "learning_rate": 0.00016260096563762858, + "loss": 0.0135, "step": 181560 }, { - "epoch": 1.96, - "learning_rate": 5.5685282480378794e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.0001625933979446146, + "loss": 0.0114, "step": 181570 }, { - "epoch": 1.96, - "learning_rate": 5.552312382434975e-06, - "loss": 0.0085, + "epoch": 0.92, + "learning_rate": 0.00016258583025160057, + "loss": 0.0148, "step": 181580 }, { - "epoch": 1.96, - "learning_rate": 5.536096516832068e-06, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016257826255858655, + "loss": 0.0096, "step": 181590 }, { - "epoch": 1.96, - "learning_rate": 5.519880651229163e-06, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016257069486557254, + "loss": 0.0137, "step": 181600 }, { - "epoch": 1.96, - "learning_rate": 5.503664785626256e-06, - "loss": 0.0067, + "epoch": 0.92, + "learning_rate": 0.00016256312717255854, + "loss": 0.0126, "step": 181610 }, { - "epoch": 1.96, - "learning_rate": 5.487448920023351e-06, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016255555947954453, + "loss": 0.0123, "step": 181620 }, { - "epoch": 1.96, - "learning_rate": 5.471233054420444e-06, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016254799178653048, + "loss": 0.0162, "step": 181630 }, { - "epoch": 1.96, - "learning_rate": 5.455017188817539e-06, - "loss": 0.0074, + "epoch": 0.92, + "learning_rate": 0.00016254042409351646, + "loss": 0.0096, "step": 181640 }, { - "epoch": 1.96, - "learning_rate": 5.438801323214632e-06, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016253285640050247, + "loss": 0.0105, "step": 181650 }, { - "epoch": 1.96, - "learning_rate": 5.422585457611727e-06, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.00016252528870748845, + "loss": 0.0104, "step": 181660 }, { - "epoch": 1.96, - "learning_rate": 5.406369592008821e-06, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016251772101447443, + "loss": 0.0139, "step": 181670 }, { - "epoch": 1.96, - "learning_rate": 5.390153726405916e-06, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016251015332146044, + "loss": 0.0111, "step": 181680 }, { - "epoch": 1.96, - "learning_rate": 5.373937860803009e-06, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.00016250258562844642, + "loss": 0.013, "step": 181690 }, { - "epoch": 1.96, - "learning_rate": 5.357721995200104e-06, - "loss": 0.0046, + "epoch": 0.92, + "learning_rate": 0.0001624950179354324, + "loss": 0.0112, "step": 181700 }, { - "epoch": 1.96, - "learning_rate": 5.341506129597197e-06, - "loss": 0.0067, + "epoch": 0.92, + "learning_rate": 0.0001624874502424184, + "loss": 0.0107, "step": 181710 }, { - "epoch": 1.96, - "learning_rate": 5.325290263994292e-06, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.0001624798825494044, + "loss": 0.0107, "step": 181720 }, { - "epoch": 1.96, - "learning_rate": 5.309074398391385e-06, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016247231485639038, + "loss": 0.0094, "step": 181730 }, { - "epoch": 1.96, - "learning_rate": 5.29285853278848e-06, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016246474716337638, + "loss": 0.0124, "step": 181740 }, { - "epoch": 1.96, - "learning_rate": 5.276642667185573e-06, - "loss": 0.0093, + "epoch": 0.92, + "learning_rate": 0.00016245717947036237, + "loss": 0.0122, "step": 181750 }, { - "epoch": 1.96, - "learning_rate": 5.260426801582669e-06, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016244961177734835, + "loss": 0.012, "step": 181760 }, { - "epoch": 1.97, - "learning_rate": 5.244210935979762e-06, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016244204408433436, + "loss": 0.0091, "step": 181770 }, { - "epoch": 1.97, - "learning_rate": 5.227995070376857e-06, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016243447639132034, + "loss": 0.0115, "step": 181780 }, { - "epoch": 1.97, - "learning_rate": 5.21177920477395e-06, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016242690869830632, + "loss": 0.0116, "step": 181790 }, { - "epoch": 1.97, - "learning_rate": 5.195563339171045e-06, - "loss": 0.0084, + "epoch": 0.92, + "learning_rate": 0.00016241934100529233, + "loss": 0.0138, "step": 181800 }, { - "epoch": 1.97, - "learning_rate": 5.179347473568138e-06, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.0001624117733122783, + "loss": 0.013, "step": 181810 }, { - "epoch": 1.97, - "learning_rate": 5.163131607965233e-06, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.0001624042056192643, + "loss": 0.0126, "step": 181820 }, { - "epoch": 1.97, - "learning_rate": 5.146915742362326e-06, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016239663792625027, + "loss": 0.0116, "step": 181830 }, { - "epoch": 1.97, - "learning_rate": 5.130699876759421e-06, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016238907023323628, + "loss": 0.0132, "step": 181840 }, { - "epoch": 1.97, - "learning_rate": 5.114484011156515e-06, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016238150254022226, + "loss": 0.0107, "step": 181850 }, { - "epoch": 1.97, - "learning_rate": 5.09826814555361e-06, - "loss": 0.0081, + "epoch": 0.92, + "learning_rate": 0.00016237393484720824, + "loss": 0.0105, "step": 181860 }, { - "epoch": 1.97, - "learning_rate": 5.082052279950703e-06, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016236636715419425, + "loss": 0.0109, "step": 181870 }, { - "epoch": 1.97, - "learning_rate": 5.065836414347798e-06, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016235879946118023, + "loss": 0.0103, "step": 181880 }, { - "epoch": 1.97, - "learning_rate": 5.049620548744891e-06, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.00016235123176816621, + "loss": 0.0159, "step": 181890 }, { - "epoch": 1.97, - "learning_rate": 5.033404683141986e-06, - "loss": 0.0045, + "epoch": 0.92, + "learning_rate": 0.00016234366407515222, + "loss": 0.0104, "step": 181900 }, { - "epoch": 1.97, - "learning_rate": 5.017188817539079e-06, - "loss": 0.0087, + "epoch": 0.92, + "learning_rate": 0.0001623360963821382, + "loss": 0.0095, "step": 181910 }, { - "epoch": 1.97, - "learning_rate": 5.000972951936174e-06, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016232852868912419, + "loss": 0.0142, "step": 181920 }, { - "epoch": 1.97, - "learning_rate": 4.984757086333267e-06, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.0001623209609961102, + "loss": 0.0138, "step": 181930 }, { - "epoch": 1.97, - "learning_rate": 4.968541220730363e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016231339330309618, + "loss": 0.0173, "step": 181940 }, { - "epoch": 1.97, - "learning_rate": 4.952325355127457e-06, - "loss": 0.004, + "epoch": 0.92, + "learning_rate": 0.00016230582561008216, + "loss": 0.0096, "step": 181950 }, { - "epoch": 1.97, - "learning_rate": 4.936109489524551e-06, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016229825791706817, + "loss": 0.0109, "step": 181960 }, { - "epoch": 1.97, - "learning_rate": 4.919893623921645e-06, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016229069022405415, + "loss": 0.0121, "step": 181970 }, { - "epoch": 1.97, - "learning_rate": 4.903677758318739e-06, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016228312253104013, + "loss": 0.0156, "step": 181980 }, { - "epoch": 1.97, - "learning_rate": 4.887461892715832e-06, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.0001622755548380261, + "loss": 0.0107, "step": 181990 }, { - "epoch": 1.97, - "learning_rate": 4.871246027112927e-06, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016226798714501212, + "loss": 0.0104, "step": 182000 }, { - "epoch": 1.97, - "eval_cer": 0.9215017450233394, - "eval_loss": 0.0052335127256810665, - "eval_runtime": 121.2359, - "eval_samples_per_second": 16.497, - "eval_steps_per_second": 4.124, + "epoch": 0.92, + "eval_cer": 0.9144857822411687, + "eval_loss": 0.008326300419867039, + "eval_runtime": 116.6222, + "eval_samples_per_second": 17.149, + "eval_steps_per_second": 4.287, "step": 182000 }, { - "epoch": 1.97, - "learning_rate": 4.85503016151002e-06, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.0001622604194519981, + "loss": 0.0137, "step": 182010 }, { - "epoch": 1.97, - "learning_rate": 4.838814295907115e-06, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016225285175898408, + "loss": 0.0108, "step": 182020 }, { - "epoch": 1.97, - "learning_rate": 4.82259843030421e-06, - "loss": 0.0076, + "epoch": 0.92, + "learning_rate": 0.0001622452840659701, + "loss": 0.013, "step": 182030 }, { - "epoch": 1.97, - "learning_rate": 4.806382564701304e-06, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016223771637295607, + "loss": 0.0097, "step": 182040 }, { - "epoch": 1.97, - "learning_rate": 4.790166699098398e-06, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016223014867994205, + "loss": 0.0102, "step": 182050 }, { - "epoch": 1.97, - "learning_rate": 4.773950833495492e-06, - "loss": 0.004, + "epoch": 0.92, + "learning_rate": 0.00016222258098692806, + "loss": 0.0127, "step": 182060 }, { - "epoch": 1.97, - "learning_rate": 4.757734967892586e-06, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016221501329391404, + "loss": 0.0123, "step": 182070 }, { - "epoch": 1.97, - "learning_rate": 4.74151910228968e-06, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016220744560090002, + "loss": 0.01, "step": 182080 }, { - "epoch": 1.97, - "learning_rate": 4.725303236686774e-06, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016219987790788603, + "loss": 0.0126, "step": 182090 }, { - "epoch": 1.97, - "learning_rate": 4.709087371083868e-06, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016219231021487201, + "loss": 0.0107, "step": 182100 }, { - "epoch": 1.97, - "learning_rate": 4.692871505480962e-06, - "loss": 0.0081, + "epoch": 0.92, + "learning_rate": 0.000162184742521858, + "loss": 0.014, "step": 182110 }, { - "epoch": 1.97, - "learning_rate": 4.6766556398780565e-06, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.000162177174828844, + "loss": 0.0118, "step": 182120 }, { - "epoch": 1.97, - "learning_rate": 4.66043977427515e-06, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016216960713582999, + "loss": 0.012, "step": 182130 }, { - "epoch": 1.97, - "learning_rate": 4.6442239086722446e-06, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.00016216203944281597, + "loss": 0.0107, "step": 182140 }, { - "epoch": 1.97, - "learning_rate": 4.628008043069339e-06, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016215447174980195, + "loss": 0.0109, "step": 182150 }, { - "epoch": 1.97, - "learning_rate": 4.611792177466433e-06, - "loss": 0.0067, + "epoch": 0.92, + "learning_rate": 0.00016214690405678796, + "loss": 0.0099, "step": 182160 }, { - "epoch": 1.97, - "learning_rate": 4.595576311863527e-06, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016213933636377394, + "loss": 0.0134, "step": 182170 }, { - "epoch": 1.97, - "learning_rate": 4.579360446260621e-06, - "loss": 0.0083, + "epoch": 0.92, + "learning_rate": 0.00016213176867075992, + "loss": 0.0115, "step": 182180 }, { - "epoch": 1.97, - "learning_rate": 4.563144580657715e-06, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016212420097774593, + "loss": 0.0097, "step": 182190 }, { - "epoch": 1.97, - "learning_rate": 4.5469287150548095e-06, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.0001621166332847319, + "loss": 0.0098, "step": 182200 }, { - "epoch": 1.97, - "learning_rate": 4.530712849451903e-06, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.0001621090655917179, + "loss": 0.0168, "step": 182210 }, { - "epoch": 1.97, - "learning_rate": 4.5144969838489975e-06, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.0001621014978987039, + "loss": 0.0137, "step": 182220 }, { - "epoch": 1.97, - "learning_rate": 4.498281118246091e-06, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.00016209393020568988, + "loss": 0.012, "step": 182230 }, { - "epoch": 1.97, - "learning_rate": 4.4820652526431856e-06, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016208636251267586, + "loss": 0.0123, "step": 182240 }, { - "epoch": 1.97, - "learning_rate": 4.46584938704028e-06, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016207879481966187, + "loss": 0.0098, "step": 182250 }, { - "epoch": 1.97, - "learning_rate": 4.449633521437374e-06, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.00016207122712664785, + "loss": 0.0173, "step": 182260 }, { - "epoch": 1.97, - "learning_rate": 4.433417655834468e-06, - "loss": 0.009, + "epoch": 0.92, + "learning_rate": 0.00016206365943363383, + "loss": 0.0123, "step": 182270 }, { - "epoch": 1.97, - "learning_rate": 4.4172017902315625e-06, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.00016205609174061984, + "loss": 0.0121, "step": 182280 }, { - "epoch": 1.97, - "learning_rate": 4.400985924628656e-06, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016204852404760582, + "loss": 0.0148, "step": 182290 }, { - "epoch": 1.97, - "learning_rate": 4.3847700590257505e-06, - "loss": 0.0047, + "epoch": 0.92, + "learning_rate": 0.0001620409563545918, + "loss": 0.0107, "step": 182300 }, { - "epoch": 1.97, - "learning_rate": 4.368554193422844e-06, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016203338866157781, + "loss": 0.009, "step": 182310 }, { - "epoch": 1.97, - "learning_rate": 4.3523383278199385e-06, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.0001620258209685638, + "loss": 0.0131, "step": 182320 }, { - "epoch": 1.97, - "learning_rate": 4.336122462217033e-06, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016201825327554978, + "loss": 0.0131, "step": 182330 }, { - "epoch": 1.97, - "learning_rate": 4.3199065966141265e-06, - "loss": 0.0118, + "epoch": 0.92, + "learning_rate": 0.00016201068558253576, + "loss": 0.0108, "step": 182340 }, { - "epoch": 1.97, - "learning_rate": 4.303690731011221e-06, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016200311788952177, + "loss": 0.0116, "step": 182350 }, { - "epoch": 1.97, - "learning_rate": 4.287474865408315e-06, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016199555019650775, + "loss": 0.0144, "step": 182360 }, { - "epoch": 1.97, - "learning_rate": 4.27125899980541e-06, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016198798250349373, + "loss": 0.0092, "step": 182370 }, { - "epoch": 1.97, - "learning_rate": 4.2550431342025035e-06, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.00016198041481047974, + "loss": 0.0136, "step": 182380 }, { - "epoch": 1.97, - "learning_rate": 4.238827268599597e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016197284711746572, + "loss": 0.0104, "step": 182390 }, { - "epoch": 1.97, - "learning_rate": 4.2226114029966915e-06, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.0001619652794244517, + "loss": 0.013, "step": 182400 }, { - "epoch": 1.97, - "learning_rate": 4.206395537393785e-06, - "loss": 0.0077, + "epoch": 0.92, + "learning_rate": 0.0001619577117314377, + "loss": 0.012, "step": 182410 }, { - "epoch": 1.97, - "learning_rate": 4.19017967179088e-06, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.0001619501440384237, + "loss": 0.0091, "step": 182420 }, { - "epoch": 1.97, - "learning_rate": 4.173963806187974e-06, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016194257634540967, + "loss": 0.0109, "step": 182430 }, { - "epoch": 1.97, - "learning_rate": 4.157747940585068e-06, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016193500865239568, + "loss": 0.0111, "step": 182440 }, { - "epoch": 1.97, - "learning_rate": 4.141532074982162e-06, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016192744095938166, + "loss": 0.0112, "step": 182450 }, { - "epoch": 1.97, - "learning_rate": 4.125316209379256e-06, - "loss": 0.0088, + "epoch": 0.92, + "learning_rate": 0.00016191987326636764, + "loss": 0.0128, "step": 182460 }, { - "epoch": 1.97, - "learning_rate": 4.109100343776351e-06, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016191230557335365, + "loss": 0.0102, "step": 182470 }, { - "epoch": 1.97, - "learning_rate": 4.0928844781734444e-06, - "loss": 0.0085, + "epoch": 0.92, + "learning_rate": 0.00016190473788033963, + "loss": 0.0112, "step": 182480 }, { - "epoch": 1.97, - "learning_rate": 4.076668612570539e-06, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.00016189717018732562, + "loss": 0.0114, "step": 182490 }, { - "epoch": 1.97, - "learning_rate": 4.060452746967633e-06, - "loss": 0.0092, + "epoch": 0.92, + "learning_rate": 0.0001618896024943116, + "loss": 0.0104, "step": 182500 }, { - "epoch": 1.97, - "learning_rate": 4.044236881364727e-06, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.0001618820348012976, + "loss": 0.0094, "step": 182510 }, { - "epoch": 1.97, - "learning_rate": 4.028021015761821e-06, - "loss": 0.0085, + "epoch": 0.92, + "learning_rate": 0.0001618744671082836, + "loss": 0.0097, "step": 182520 }, { - "epoch": 1.97, - "learning_rate": 4.011805150158915e-06, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016186689941526957, + "loss": 0.011, "step": 182530 }, { - "epoch": 1.97, - "learning_rate": 3.995589284556009e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016185933172225558, + "loss": 0.0113, "step": 182540 }, { - "epoch": 1.97, - "learning_rate": 3.979373418953104e-06, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016185176402924156, + "loss": 0.0093, "step": 182550 }, { - "epoch": 1.97, - "learning_rate": 3.963157553350197e-06, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016184419633622754, + "loss": 0.0122, "step": 182560 }, { - "epoch": 1.97, - "learning_rate": 3.946941687747292e-06, - "loss": 0.0039, + "epoch": 0.92, + "learning_rate": 0.00016183662864321355, + "loss": 0.0116, "step": 182570 }, { - "epoch": 1.97, - "learning_rate": 3.9307258221443854e-06, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.00016182906095019953, + "loss": 0.0103, "step": 182580 }, { - "epoch": 1.97, - "learning_rate": 3.91450995654148e-06, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.0001618214932571855, + "loss": 0.009, "step": 182590 }, { - "epoch": 1.97, - "learning_rate": 3.898294090938574e-06, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016181392556417152, + "loss": 0.0122, "step": 182600 }, { - "epoch": 1.97, - "learning_rate": 3.882078225335668e-06, - "loss": 0.0083, + "epoch": 0.92, + "learning_rate": 0.0001618063578711575, + "loss": 0.0111, "step": 182610 }, { - "epoch": 1.97, - "learning_rate": 3.865862359732762e-06, - "loss": 0.0099, + "epoch": 0.92, + "learning_rate": 0.00016179879017814348, + "loss": 0.0125, "step": 182620 }, { - "epoch": 1.97, - "learning_rate": 3.849646494129856e-06, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.0001617912224851295, + "loss": 0.0121, "step": 182630 }, { - "epoch": 1.97, - "learning_rate": 3.83343062852695e-06, - "loss": 0.0075, + "epoch": 0.92, + "learning_rate": 0.00016178365479211547, + "loss": 0.0105, "step": 182640 }, { - "epoch": 1.97, - "learning_rate": 3.817214762924045e-06, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016177608709910145, + "loss": 0.012, "step": 182650 }, { - "epoch": 1.97, - "learning_rate": 3.800998897321139e-06, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016176851940608744, + "loss": 0.0107, "step": 182660 }, { - "epoch": 1.97, - "learning_rate": 3.784783031718233e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016176095171307344, + "loss": 0.0109, "step": 182670 }, { - "epoch": 1.97, - "learning_rate": 3.7685671661153273e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016175338402005943, + "loss": 0.0112, "step": 182680 }, { - "epoch": 1.97, - "learning_rate": 3.7523513005124213e-06, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.0001617458163270454, + "loss": 0.0118, "step": 182690 }, { - "epoch": 1.98, - "learning_rate": 3.7361354349095153e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016173824863403142, + "loss": 0.0108, "step": 182700 }, { - "epoch": 1.98, - "learning_rate": 3.7199195693066093e-06, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.0001617306809410174, + "loss": 0.0108, "step": 182710 }, { - "epoch": 1.98, - "learning_rate": 3.7037037037037033e-06, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016172311324800338, + "loss": 0.0114, "step": 182720 }, { - "epoch": 1.98, - "learning_rate": 3.6874878381007978e-06, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.0001617155455549894, + "loss": 0.014, "step": 182730 }, { - "epoch": 1.98, - "learning_rate": 3.6712719724978918e-06, - "loss": 0.0118, + "epoch": 0.92, + "learning_rate": 0.00016170797786197537, + "loss": 0.01, "step": 182740 }, { - "epoch": 1.98, - "learning_rate": 3.6550561068949858e-06, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016170041016896135, + "loss": 0.0113, "step": 182750 }, { - "epoch": 1.98, - "learning_rate": 3.63884024129208e-06, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.00016169284247594736, + "loss": 0.0113, "step": 182760 }, { - "epoch": 1.98, - "learning_rate": 3.6226243756891742e-06, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016168527478293334, + "loss": 0.0131, "step": 182770 }, { - "epoch": 1.98, - "learning_rate": 3.6064085100862682e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016167770708991932, + "loss": 0.0108, "step": 182780 }, { - "epoch": 1.98, - "learning_rate": 3.5901926444833623e-06, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016167013939690533, + "loss": 0.0106, "step": 182790 }, { - "epoch": 1.98, - "learning_rate": 3.5739767788804563e-06, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.0001616625717038913, + "loss": 0.0112, "step": 182800 }, { - "epoch": 1.98, - "learning_rate": 3.5577609132775503e-06, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.0001616550040108773, + "loss": 0.0129, "step": 182810 }, { - "epoch": 1.98, - "learning_rate": 3.5415450476746447e-06, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.0001616474363178633, + "loss": 0.0116, "step": 182820 }, { - "epoch": 1.98, - "learning_rate": 3.5253291820717387e-06, - "loss": 0.0083, + "epoch": 0.92, + "learning_rate": 0.00016163986862484928, + "loss": 0.0122, "step": 182830 }, { - "epoch": 1.98, - "learning_rate": 3.5091133164688328e-06, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.00016163230093183526, + "loss": 0.01, "step": 182840 }, { - "epoch": 1.98, - "learning_rate": 3.4928974508659268e-06, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016162473323882125, + "loss": 0.0095, "step": 182850 }, { - "epoch": 1.98, - "learning_rate": 3.476681585263021e-06, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016161716554580725, + "loss": 0.0092, "step": 182860 }, { - "epoch": 1.98, - "learning_rate": 3.4604657196601152e-06, - "loss": 0.0076, + "epoch": 0.92, + "learning_rate": 0.00016160959785279324, + "loss": 0.0118, "step": 182870 }, { - "epoch": 1.98, - "learning_rate": 3.4442498540572092e-06, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.0001616020301597792, + "loss": 0.0093, "step": 182880 }, { - "epoch": 1.98, - "learning_rate": 3.4280339884543032e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016159446246676517, + "loss": 0.0098, "step": 182890 }, { - "epoch": 1.98, - "learning_rate": 3.4118181228513973e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016158689477375118, + "loss": 0.0131, "step": 182900 }, { - "epoch": 1.98, - "learning_rate": 3.3956022572484917e-06, - "loss": 0.0076, + "epoch": 0.92, + "learning_rate": 0.00016157932708073716, + "loss": 0.0083, "step": 182910 }, { - "epoch": 1.98, - "learning_rate": 3.3793863916455857e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016157175938772314, + "loss": 0.0105, "step": 182920 }, { - "epoch": 1.98, - "learning_rate": 3.3631705260426797e-06, - "loss": 0.0046, + "epoch": 0.92, + "learning_rate": 0.00016156419169470915, + "loss": 0.0119, "step": 182930 }, { - "epoch": 1.98, - "learning_rate": 3.3469546604397737e-06, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016155662400169513, + "loss": 0.0091, "step": 182940 }, { - "epoch": 1.98, - "learning_rate": 3.330738794836868e-06, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.00016154905630868111, + "loss": 0.0129, "step": 182950 }, { - "epoch": 1.98, - "learning_rate": 3.314522929233962e-06, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016154148861566712, + "loss": 0.012, "step": 182960 }, { - "epoch": 1.98, - "learning_rate": 3.298307063631056e-06, - "loss": 0.0068, + "epoch": 0.92, + "learning_rate": 0.0001615339209226531, + "loss": 0.0135, "step": 182970 }, { - "epoch": 1.98, - "learning_rate": 3.2820911980281502e-06, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016152635322963909, + "loss": 0.0092, "step": 182980 }, { - "epoch": 1.98, - "learning_rate": 3.2658753324252442e-06, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.0001615187855366251, + "loss": 0.0105, "step": 182990 }, { - "epoch": 1.98, - "learning_rate": 3.249659466822339e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016151121784361108, + "loss": 0.0101, "step": 183000 }, { - "epoch": 1.98, - "eval_cer": 0.9215000078174266, - "eval_loss": 0.005184313748031855, - "eval_runtime": 121.1588, - "eval_samples_per_second": 16.507, - "eval_steps_per_second": 4.127, + "epoch": 0.92, + "eval_cer": 0.9144828710527925, + "eval_loss": 0.00819355621933937, + "eval_runtime": 116.6466, + "eval_samples_per_second": 17.146, + "eval_steps_per_second": 4.286, "step": 183000 }, { - "epoch": 1.98, - "learning_rate": 3.2334436012194327e-06, - "loss": 0.0077, + "epoch": 0.92, + "learning_rate": 0.00016150365015059706, + "loss": 0.0082, "step": 183010 }, { - "epoch": 1.98, - "learning_rate": 3.2172277356165267e-06, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016149608245758307, + "loss": 0.0146, "step": 183020 }, { - "epoch": 1.98, - "learning_rate": 3.2010118700136207e-06, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016148851476456905, + "loss": 0.0106, "step": 183030 }, { - "epoch": 1.98, - "learning_rate": 3.1847960044107156e-06, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.00016148094707155503, + "loss": 0.0108, "step": 183040 }, { - "epoch": 1.98, - "learning_rate": 3.1685801388078096e-06, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.000161473379378541, + "loss": 0.0117, "step": 183050 }, { - "epoch": 1.98, - "learning_rate": 3.1523642732049036e-06, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016146581168552702, + "loss": 0.0125, "step": 183060 }, { - "epoch": 1.98, - "learning_rate": 3.1361484076019976e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.000161458243992513, + "loss": 0.0097, "step": 183070 }, { - "epoch": 1.98, - "learning_rate": 3.1199325419990916e-06, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016145067629949898, + "loss": 0.0123, "step": 183080 }, { - "epoch": 1.98, - "learning_rate": 3.103716676396186e-06, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.000161443108606485, + "loss": 0.0116, "step": 183090 }, { - "epoch": 1.98, - "learning_rate": 3.08750081079328e-06, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016143554091347097, + "loss": 0.0129, "step": 183100 }, { - "epoch": 1.98, - "learning_rate": 3.071284945190374e-06, - "loss": 0.0067, + "epoch": 0.92, + "learning_rate": 0.00016142797322045695, + "loss": 0.0113, "step": 183110 }, { - "epoch": 1.98, - "learning_rate": 3.055069079587468e-06, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016142040552744296, + "loss": 0.0136, "step": 183120 }, { - "epoch": 1.98, - "learning_rate": 3.0388532139845625e-06, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016141283783442894, + "loss": 0.0117, "step": 183130 }, { - "epoch": 1.98, - "learning_rate": 3.0226373483816566e-06, - "loss": 0.0069, + "epoch": 0.92, + "learning_rate": 0.00016140527014141492, + "loss": 0.0092, "step": 183140 }, { - "epoch": 1.98, - "learning_rate": 3.0064214827787506e-06, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016139770244840093, + "loss": 0.0105, "step": 183150 }, { - "epoch": 1.98, - "learning_rate": 2.9902056171758446e-06, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016139013475538691, + "loss": 0.0102, "step": 183160 }, { - "epoch": 1.98, - "learning_rate": 2.9739897515729386e-06, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.0001613825670623729, + "loss": 0.0096, "step": 183170 }, { - "epoch": 1.98, - "learning_rate": 2.957773885970033e-06, - "loss": 0.0069, + "epoch": 0.92, + "learning_rate": 0.0001613749993693589, + "loss": 0.011, "step": 183180 }, { - "epoch": 1.98, - "learning_rate": 2.941558020367127e-06, - "loss": 0.0042, + "epoch": 0.92, + "learning_rate": 0.00016136743167634489, + "loss": 0.011, "step": 183190 }, { - "epoch": 1.98, - "learning_rate": 2.925342154764221e-06, - "loss": 0.0075, + "epoch": 0.92, + "learning_rate": 0.00016135986398333087, + "loss": 0.0123, "step": 183200 }, { - "epoch": 1.98, - "learning_rate": 2.909126289161315e-06, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.00016135229629031688, + "loss": 0.0118, "step": 183210 }, { - "epoch": 1.98, - "learning_rate": 2.8929104235584095e-06, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016134472859730286, + "loss": 0.0118, "step": 183220 }, { - "epoch": 1.98, - "learning_rate": 2.8766945579555035e-06, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016133716090428884, + "loss": 0.0127, "step": 183230 }, { - "epoch": 1.98, - "learning_rate": 2.8604786923525976e-06, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016132959321127482, + "loss": 0.0103, "step": 183240 }, { - "epoch": 1.98, - "learning_rate": 2.8442628267496916e-06, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.00016132202551826083, + "loss": 0.0096, "step": 183250 }, { - "epoch": 1.98, - "learning_rate": 2.8280469611467856e-06, - "loss": 0.0078, + "epoch": 0.92, + "learning_rate": 0.0001613144578252468, + "loss": 0.0119, "step": 183260 }, { - "epoch": 1.98, - "learning_rate": 2.81183109554388e-06, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.0001613068901322328, + "loss": 0.0098, "step": 183270 }, { - "epoch": 1.98, - "learning_rate": 2.795615229940974e-06, - "loss": 0.0118, + "epoch": 0.92, + "learning_rate": 0.0001612993224392188, + "loss": 0.0092, "step": 183280 }, { - "epoch": 1.98, - "learning_rate": 2.779399364338068e-06, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.00016129175474620478, + "loss": 0.0099, "step": 183290 }, { - "epoch": 1.98, - "learning_rate": 2.763183498735162e-06, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016128418705319076, + "loss": 0.0108, "step": 183300 }, { - "epoch": 1.98, - "learning_rate": 2.7469676331322565e-06, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016127661936017677, + "loss": 0.0104, "step": 183310 }, { - "epoch": 1.98, - "learning_rate": 2.7307517675293505e-06, - "loss": 0.0075, + "epoch": 0.92, + "learning_rate": 0.00016126905166716275, + "loss": 0.0088, "step": 183320 }, { - "epoch": 1.98, - "learning_rate": 2.7145359019264445e-06, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016126148397414873, + "loss": 0.0098, "step": 183330 }, { - "epoch": 1.98, - "learning_rate": 2.6983200363235385e-06, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.00016125391628113474, + "loss": 0.015, "step": 183340 }, { - "epoch": 1.98, - "learning_rate": 2.6821041707206326e-06, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016124634858812072, + "loss": 0.0126, "step": 183350 }, { - "epoch": 1.98, - "learning_rate": 2.665888305117727e-06, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.0001612387808951067, + "loss": 0.01, "step": 183360 }, { - "epoch": 1.98, - "learning_rate": 2.649672439514821e-06, - "loss": 0.0069, + "epoch": 0.93, + "learning_rate": 0.00016123121320209271, + "loss": 0.0171, "step": 183370 }, { - "epoch": 1.98, - "learning_rate": 2.633456573911915e-06, - "loss": 0.0083, + "epoch": 0.93, + "learning_rate": 0.0001612236455090787, + "loss": 0.0222, "step": 183380 }, { - "epoch": 1.98, - "learning_rate": 2.617240708309009e-06, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00016121607781606468, + "loss": 0.0118, "step": 183390 }, { - "epoch": 1.98, - "learning_rate": 2.6010248427061035e-06, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016120851012305066, + "loss": 0.0094, "step": 183400 }, { - "epoch": 1.98, - "learning_rate": 2.5848089771031975e-06, - "loss": 0.0079, + "epoch": 0.93, + "learning_rate": 0.00016120094243003667, + "loss": 0.0139, "step": 183410 }, { - "epoch": 1.98, - "learning_rate": 2.5685931115002915e-06, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.00016119337473702265, + "loss": 0.0157, "step": 183420 }, { - "epoch": 1.98, - "learning_rate": 2.5523772458973855e-06, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016118580704400863, + "loss": 0.0113, "step": 183430 }, { - "epoch": 1.98, - "learning_rate": 2.5361613802944795e-06, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.00016117823935099464, + "loss": 0.0094, "step": 183440 }, { - "epoch": 1.98, - "learning_rate": 2.5199455146915744e-06, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016117067165798062, + "loss": 0.0139, "step": 183450 }, { - "epoch": 1.98, - "learning_rate": 2.5037296490886684e-06, - "loss": 0.0045, + "epoch": 0.93, + "learning_rate": 0.0001611631039649666, + "loss": 0.011, "step": 183460 }, { - "epoch": 1.98, - "learning_rate": 2.4875137834857624e-06, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.0001611555362719526, + "loss": 0.0089, "step": 183470 }, { - "epoch": 1.98, - "learning_rate": 2.471297917882856e-06, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.0001611479685789386, + "loss": 0.0136, "step": 183480 }, { - "epoch": 1.98, - "learning_rate": 2.455082052279951e-06, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.00016114040088592457, + "loss": 0.0109, "step": 183490 }, { - "epoch": 1.98, - "learning_rate": 2.438866186677045e-06, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.00016113283319291058, + "loss": 0.0132, "step": 183500 }, { - "epoch": 1.98, - "learning_rate": 2.422650321074139e-06, - "loss": 0.0045, + "epoch": 0.93, + "learning_rate": 0.00016112526549989656, + "loss": 0.0117, "step": 183510 }, { - "epoch": 1.98, - "learning_rate": 2.406434455471233e-06, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00016111769780688254, + "loss": 0.011, "step": 183520 }, { - "epoch": 1.98, - "learning_rate": 2.390218589868327e-06, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016111013011386855, + "loss": 0.0126, "step": 183530 }, { - "epoch": 1.98, - "learning_rate": 2.3740027242654214e-06, - "loss": 0.0086, + "epoch": 0.93, + "learning_rate": 0.00016110256242085453, + "loss": 0.0114, "step": 183540 }, { - "epoch": 1.98, - "learning_rate": 2.3577868586625154e-06, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016109499472784052, + "loss": 0.0094, "step": 183550 }, { - "epoch": 1.98, - "learning_rate": 2.3415709930596094e-06, - "loss": 0.0064, + "epoch": 0.93, + "learning_rate": 0.0001610874270348265, + "loss": 0.0107, "step": 183560 }, { - "epoch": 1.98, - "learning_rate": 2.3253551274567034e-06, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.0001610798593418125, + "loss": 0.0107, "step": 183570 }, { - "epoch": 1.98, - "learning_rate": 2.3091392618537974e-06, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.0001610722916487985, + "loss": 0.0081, "step": 183580 }, { - "epoch": 1.98, - "learning_rate": 2.2929233962508914e-06, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00016106472395578447, + "loss": 0.0158, "step": 183590 }, { - "epoch": 1.98, - "learning_rate": 2.276707530647986e-06, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.00016105715626277048, + "loss": 0.0106, "step": 183600 }, { - "epoch": 1.98, - "learning_rate": 2.26049166504508e-06, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.00016104958856975646, + "loss": 0.0113, "step": 183610 }, { - "epoch": 1.99, - "learning_rate": 2.244275799442174e-06, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016104202087674244, + "loss": 0.0147, "step": 183620 }, { - "epoch": 1.99, - "learning_rate": 2.228059933839268e-06, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.00016103445318372845, + "loss": 0.0113, "step": 183630 }, { - "epoch": 1.99, - "learning_rate": 2.2118440682363623e-06, - "loss": 0.0089, + "epoch": 0.93, + "learning_rate": 0.00016102688549071443, + "loss": 0.0127, "step": 183640 }, { - "epoch": 1.99, - "learning_rate": 2.1956282026334564e-06, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.0001610193177977004, + "loss": 0.0099, "step": 183650 }, { - "epoch": 1.99, - "learning_rate": 2.179412337030551e-06, - "loss": 0.0084, + "epoch": 0.93, + "learning_rate": 0.00016101175010468642, + "loss": 0.013, "step": 183660 }, { - "epoch": 1.99, - "learning_rate": 2.163196471427645e-06, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.0001610041824116724, + "loss": 0.0105, "step": 183670 }, { - "epoch": 1.99, - "learning_rate": 2.1469806058247384e-06, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00016099661471865838, + "loss": 0.0097, "step": 183680 }, { - "epoch": 1.99, - "learning_rate": 2.130764740221833e-06, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.0001609890470256444, + "loss": 0.0115, "step": 183690 }, { - "epoch": 1.99, - "learning_rate": 2.114548874618927e-06, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016098147933263037, + "loss": 0.0127, "step": 183700 }, { - "epoch": 1.99, - "learning_rate": 2.0983330090160213e-06, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00016097391163961635, + "loss": 0.0105, "step": 183710 }, { - "epoch": 1.99, - "learning_rate": 2.0821171434131153e-06, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.00016096634394660236, + "loss": 0.0127, "step": 183720 }, { - "epoch": 1.99, - "learning_rate": 2.0659012778102093e-06, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00016095877625358834, + "loss": 0.0094, "step": 183730 }, { - "epoch": 1.99, - "learning_rate": 2.0496854122073033e-06, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.00016095120856057433, + "loss": 0.0105, "step": 183740 }, { - "epoch": 1.99, - "learning_rate": 2.0334695466043978e-06, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.0001609436408675603, + "loss": 0.014, "step": 183750 }, { - "epoch": 1.99, - "learning_rate": 2.0172536810014918e-06, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.00016093607317454632, + "loss": 0.0123, "step": 183760 }, { - "epoch": 1.99, - "learning_rate": 2.001037815398586e-06, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.0001609285054815323, + "loss": 0.0107, "step": 183770 }, { - "epoch": 1.99, - "learning_rate": 1.98482194979568e-06, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00016092093778851828, + "loss": 0.0095, "step": 183780 }, { - "epoch": 1.99, - "learning_rate": 1.968606084192774e-06, - "loss": 0.0076, + "epoch": 0.93, + "learning_rate": 0.0001609133700955043, + "loss": 0.0098, "step": 183790 }, { - "epoch": 1.99, - "learning_rate": 1.9523902185898683e-06, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.00016090580240249027, + "loss": 0.01, "step": 183800 }, { - "epoch": 1.99, - "learning_rate": 1.9361743529869623e-06, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016089823470947625, + "loss": 0.0118, "step": 183810 }, { - "epoch": 1.99, - "learning_rate": 1.9199584873840563e-06, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016089066701646226, + "loss": 0.0103, "step": 183820 }, { - "epoch": 1.99, - "learning_rate": 1.9037426217811505e-06, - "loss": 0.0072, + "epoch": 0.93, + "learning_rate": 0.00016088309932344824, + "loss": 0.01, "step": 183830 }, { - "epoch": 1.99, - "learning_rate": 1.8875267561782447e-06, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00016087553163043422, + "loss": 0.0098, "step": 183840 }, { - "epoch": 1.99, - "learning_rate": 1.8713108905753388e-06, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00016086796393742023, + "loss": 0.0106, "step": 183850 }, { - "epoch": 1.99, - "learning_rate": 1.855095024972433e-06, - "loss": 0.0072, + "epoch": 0.93, + "learning_rate": 0.0001608603962444062, + "loss": 0.0108, "step": 183860 }, { - "epoch": 1.99, - "learning_rate": 1.838879159369527e-06, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.0001608528285513922, + "loss": 0.0115, "step": 183870 }, { - "epoch": 1.99, - "learning_rate": 1.822663293766621e-06, - "loss": 0.007, + "epoch": 0.93, + "learning_rate": 0.0001608452608583782, + "loss": 0.0119, "step": 183880 }, { - "epoch": 1.99, - "learning_rate": 1.8064474281637152e-06, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.00016083769316536418, + "loss": 0.0106, "step": 183890 }, { - "epoch": 1.99, - "learning_rate": 1.7902315625608093e-06, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016083012547235016, + "loss": 0.009, "step": 183900 }, { - "epoch": 1.99, - "learning_rate": 1.7740156969579035e-06, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016082255777933615, + "loss": 0.0097, "step": 183910 }, { - "epoch": 1.99, - "learning_rate": 1.7577998313549975e-06, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00016081499008632215, + "loss": 0.0123, "step": 183920 }, { - "epoch": 1.99, - "learning_rate": 1.7415839657520917e-06, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016080742239330814, + "loss": 0.0105, "step": 183930 }, { - "epoch": 1.99, - "learning_rate": 1.7253681001491857e-06, - "loss": 0.0081, + "epoch": 0.93, + "learning_rate": 0.00016079985470029412, + "loss": 0.0112, "step": 183940 }, { - "epoch": 1.99, - "learning_rate": 1.70915223454628e-06, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00016079228700728013, + "loss": 0.0093, "step": 183950 }, { - "epoch": 1.99, - "learning_rate": 1.692936368943374e-06, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.0001607847193142661, + "loss": 0.013, "step": 183960 }, { - "epoch": 1.99, - "learning_rate": 1.676720503340468e-06, - "loss": 0.0071, + "epoch": 0.93, + "learning_rate": 0.0001607771516212521, + "loss": 0.0111, "step": 183970 }, { - "epoch": 1.99, - "learning_rate": 1.6605046377375624e-06, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.0001607695839282381, + "loss": 0.0076, "step": 183980 }, { - "epoch": 1.99, - "learning_rate": 1.6442887721346562e-06, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.00016076201623522408, + "loss": 0.0103, "step": 183990 }, { - "epoch": 1.99, - "learning_rate": 1.6280729065317507e-06, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016075444854221006, + "loss": 0.0133, "step": 184000 }, { - "epoch": 1.99, - "eval_cer": 0.9215069566410776, - "eval_loss": 0.0051878588274121284, - "eval_runtime": 121.2445, - "eval_samples_per_second": 16.496, - "eval_steps_per_second": 4.124, + "epoch": 0.93, + "eval_cer": 0.9144731670915385, + "eval_loss": 0.00799303688108921, + "eval_runtime": 116.5635, + "eval_samples_per_second": 17.158, + "eval_steps_per_second": 4.29, "step": 184000 }, { - "epoch": 1.99, - "learning_rate": 1.6118570409288447e-06, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016074688084919607, + "loss": 0.0113, "step": 184010 }, { - "epoch": 1.99, - "learning_rate": 1.595641175325939e-06, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00016073931315618205, + "loss": 0.0116, "step": 184020 }, { - "epoch": 1.99, - "learning_rate": 1.579425309723033e-06, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.00016073174546316803, + "loss": 0.0128, "step": 184030 }, { - "epoch": 1.99, - "learning_rate": 1.5632094441201271e-06, - "loss": 0.0083, + "epoch": 0.93, + "learning_rate": 0.00016072417777015404, + "loss": 0.0098, "step": 184040 }, { - "epoch": 1.99, - "learning_rate": 1.5469935785172212e-06, - "loss": 0.0075, + "epoch": 0.93, + "learning_rate": 0.00016071661007714002, + "loss": 0.0088, "step": 184050 }, { - "epoch": 1.99, - "learning_rate": 1.5307777129143152e-06, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.000160709042384126, + "loss": 0.0113, "step": 184060 }, { - "epoch": 1.99, - "learning_rate": 1.5145618473114094e-06, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016070147469111198, + "loss": 0.0136, "step": 184070 }, { - "epoch": 1.99, - "learning_rate": 1.4983459817085034e-06, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.000160693906998098, + "loss": 0.0109, "step": 184080 }, { - "epoch": 1.99, - "learning_rate": 1.4821301161055976e-06, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016068633930508397, + "loss": 0.0123, "step": 184090 }, { - "epoch": 1.99, - "learning_rate": 1.4659142505026916e-06, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016067877161206996, + "loss": 0.0156, "step": 184100 }, { - "epoch": 1.99, - "learning_rate": 1.4496983848997859e-06, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.00016067120391905596, + "loss": 0.0137, "step": 184110 }, { - "epoch": 1.99, - "learning_rate": 1.4334825192968799e-06, - "loss": 0.008, + "epoch": 0.93, + "learning_rate": 0.00016066363622604195, + "loss": 0.0103, "step": 184120 }, { - "epoch": 1.99, - "learning_rate": 1.4172666536939741e-06, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016065606853302793, + "loss": 0.0108, "step": 184130 }, { - "epoch": 1.99, - "learning_rate": 1.4010507880910681e-06, - "loss": 0.0043, + "epoch": 0.93, + "learning_rate": 0.00016064850084001388, + "loss": 0.0084, "step": 184140 }, { - "epoch": 1.99, - "learning_rate": 1.3848349224881621e-06, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.0001606409331469999, + "loss": 0.0106, "step": 184150 }, { - "epoch": 1.99, - "learning_rate": 1.3686190568852564e-06, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016063336545398587, + "loss": 0.0109, "step": 184160 }, { - "epoch": 1.99, - "learning_rate": 1.3524031912823504e-06, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.00016062579776097185, + "loss": 0.0114, "step": 184170 }, { - "epoch": 1.99, - "learning_rate": 1.3361873256794448e-06, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016061823006795786, + "loss": 0.0116, "step": 184180 }, { - "epoch": 1.99, - "learning_rate": 1.3199714600765386e-06, - "loss": 0.0069, + "epoch": 0.93, + "learning_rate": 0.00016061066237494384, + "loss": 0.0105, "step": 184190 }, { - "epoch": 1.99, - "learning_rate": 1.303755594473633e-06, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.00016060309468192982, + "loss": 0.0093, "step": 184200 }, { - "epoch": 1.99, - "learning_rate": 1.287539728870727e-06, - "loss": 0.007, + "epoch": 0.93, + "learning_rate": 0.00016059552698891583, + "loss": 0.0096, "step": 184210 }, { - "epoch": 1.99, - "learning_rate": 1.2713238632678213e-06, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00016058795929590181, + "loss": 0.011, "step": 184220 }, { - "epoch": 1.99, - "learning_rate": 1.2551079976649153e-06, - "loss": 0.0072, + "epoch": 0.93, + "learning_rate": 0.0001605803916028878, + "loss": 0.0117, "step": 184230 }, { - "epoch": 1.99, - "learning_rate": 1.2388921320620093e-06, - "loss": 0.0076, + "epoch": 0.93, + "learning_rate": 0.0001605728239098738, + "loss": 0.0124, "step": 184240 }, { - "epoch": 1.99, - "learning_rate": 1.2226762664591036e-06, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00016056525621685979, + "loss": 0.0107, "step": 184250 }, { - "epoch": 1.99, - "learning_rate": 1.2064604008561976e-06, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016055768852384577, + "loss": 0.0086, "step": 184260 }, { - "epoch": 1.99, - "learning_rate": 1.1902445352532918e-06, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016055012083083178, + "loss": 0.0119, "step": 184270 }, { - "epoch": 1.99, - "learning_rate": 1.1740286696503858e-06, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016054255313781776, + "loss": 0.0097, "step": 184280 }, { - "epoch": 1.99, - "learning_rate": 1.1578128040474798e-06, - "loss": 0.008, + "epoch": 0.93, + "learning_rate": 0.00016053498544480374, + "loss": 0.0094, "step": 184290 }, { - "epoch": 1.99, - "learning_rate": 1.141596938444574e-06, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00016052741775178972, + "loss": 0.0095, "step": 184300 }, { - "epoch": 1.99, - "learning_rate": 1.1253810728416683e-06, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.00016051985005877573, + "loss": 0.012, "step": 184310 }, { - "epoch": 1.99, - "learning_rate": 1.1091652072387623e-06, - "loss": 0.0079, + "epoch": 0.93, + "learning_rate": 0.0001605122823657617, + "loss": 0.0118, "step": 184320 }, { - "epoch": 1.99, - "learning_rate": 1.0929493416358565e-06, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.0001605047146727477, + "loss": 0.0119, "step": 184330 }, { - "epoch": 1.99, - "learning_rate": 1.0767334760329505e-06, - "loss": 0.008, + "epoch": 0.93, + "learning_rate": 0.0001604971469797337, + "loss": 0.012, "step": 184340 }, { - "epoch": 1.99, - "learning_rate": 1.0605176104300448e-06, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016048957928671968, + "loss": 0.0113, "step": 184350 }, { - "epoch": 1.99, - "learning_rate": 1.0443017448271388e-06, - "loss": 0.0034, + "epoch": 0.93, + "learning_rate": 0.00016048201159370566, + "loss": 0.0116, "step": 184360 }, { - "epoch": 1.99, - "learning_rate": 1.0280858792242328e-06, - "loss": 0.004, + "epoch": 0.93, + "learning_rate": 0.00016047444390069167, + "loss": 0.0111, "step": 184370 }, { - "epoch": 1.99, - "learning_rate": 1.011870013621327e-06, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016046687620767765, + "loss": 0.0139, "step": 184380 }, { - "epoch": 1.99, - "learning_rate": 9.95654148018421e-07, - "loss": 0.0073, + "epoch": 0.93, + "learning_rate": 0.00016045930851466363, + "loss": 0.0134, "step": 184390 }, { - "epoch": 1.99, - "learning_rate": 9.794382824155152e-07, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016045174082164964, + "loss": 0.0121, "step": 184400 }, { - "epoch": 1.99, - "learning_rate": 9.632224168126095e-07, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016044417312863562, + "loss": 0.0099, "step": 184410 }, { - "epoch": 1.99, - "learning_rate": 9.470065512097035e-07, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.0001604366054356216, + "loss": 0.0129, "step": 184420 }, { - "epoch": 1.99, - "learning_rate": 9.307906856067976e-07, - "loss": 0.007, + "epoch": 0.93, + "learning_rate": 0.00016042903774260761, + "loss": 0.0103, "step": 184430 }, { - "epoch": 1.99, - "learning_rate": 9.145748200038918e-07, - "loss": 0.0073, + "epoch": 0.93, + "learning_rate": 0.0001604214700495936, + "loss": 0.0097, "step": 184440 }, { - "epoch": 1.99, - "learning_rate": 8.98358954400986e-07, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00016041390235657958, + "loss": 0.0121, "step": 184450 }, { - "epoch": 1.99, - "learning_rate": 8.8214308879808e-07, - "loss": 0.0045, + "epoch": 0.93, + "learning_rate": 0.00016040633466356556, + "loss": 0.0102, "step": 184460 }, { - "epoch": 1.99, - "learning_rate": 8.659272231951741e-07, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016039876697055157, + "loss": 0.0102, "step": 184470 }, { - "epoch": 1.99, - "learning_rate": 8.497113575922682e-07, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016039119927753755, + "loss": 0.0109, "step": 184480 }, { - "epoch": 1.99, - "learning_rate": 8.334954919893623e-07, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016038363158452353, + "loss": 0.0106, "step": 184490 }, { - "epoch": 1.99, - "learning_rate": 8.172796263864564e-07, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016037606389150954, + "loss": 0.0125, "step": 184500 }, { - "epoch": 1.99, - "learning_rate": 8.010637607835506e-07, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016036849619849552, + "loss": 0.0113, "step": 184510 }, { - "epoch": 1.99, - "learning_rate": 7.848478951806447e-07, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.0001603609285054815, + "loss": 0.0113, "step": 184520 }, { - "epoch": 1.99, - "learning_rate": 7.686320295777388e-07, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.0001603533608124675, + "loss": 0.0108, "step": 184530 }, { - "epoch": 1.99, - "learning_rate": 7.524161639748329e-07, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.0001603457931194535, + "loss": 0.0141, "step": 184540 }, { - "epoch": 2.0, - "learning_rate": 7.362002983719269e-07, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016033822542643947, + "loss": 0.0106, "step": 184550 }, { - "epoch": 2.0, - "learning_rate": 7.199844327690211e-07, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016033065773342548, + "loss": 0.0121, "step": 184560 }, { - "epoch": 2.0, - "learning_rate": 7.037685671661153e-07, - "loss": 0.0073, + "epoch": 0.93, + "learning_rate": 0.00016032309004041146, + "loss": 0.0114, "step": 184570 }, { - "epoch": 2.0, - "learning_rate": 6.875527015632094e-07, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016031552234739744, + "loss": 0.0122, "step": 184580 }, { - "epoch": 2.0, - "learning_rate": 6.713368359603035e-07, - "loss": 0.0072, + "epoch": 0.93, + "learning_rate": 0.00016030795465438345, + "loss": 0.0107, "step": 184590 }, { - "epoch": 2.0, - "learning_rate": 6.551209703573976e-07, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016030038696136943, + "loss": 0.0139, "step": 184600 }, { - "epoch": 2.0, - "learning_rate": 6.389051047544918e-07, - "loss": 0.0105, + "epoch": 0.93, + "learning_rate": 0.00016029281926835542, + "loss": 0.0121, "step": 184610 }, { - "epoch": 2.0, - "learning_rate": 6.226892391515859e-07, - "loss": 0.007, + "epoch": 0.93, + "learning_rate": 0.00016028525157534142, + "loss": 0.01, "step": 184620 }, { - "epoch": 2.0, - "learning_rate": 6.0647337354868e-07, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.0001602776838823274, + "loss": 0.0155, "step": 184630 }, { - "epoch": 2.0, - "learning_rate": 5.90257507945774e-07, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.0001602701161893134, + "loss": 0.0135, "step": 184640 }, { - "epoch": 2.0, - "learning_rate": 5.740416423428682e-07, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00016026254849629937, + "loss": 0.01, "step": 184650 }, { - "epoch": 2.0, - "learning_rate": 5.578257767399623e-07, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00016025498080328538, + "loss": 0.012, "step": 184660 }, { - "epoch": 2.0, - "learning_rate": 5.416099111370565e-07, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.00016024741311027136, + "loss": 0.0103, "step": 184670 }, { - "epoch": 2.0, - "learning_rate": 5.253940455341506e-07, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016023984541725734, + "loss": 0.012, "step": 184680 }, { - "epoch": 2.0, - "learning_rate": 5.091781799312447e-07, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016023227772424335, + "loss": 0.0099, "step": 184690 }, { - "epoch": 2.0, - "learning_rate": 4.929623143283388e-07, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00016022471003122933, + "loss": 0.0115, "step": 184700 }, { - "epoch": 2.0, - "learning_rate": 4.767464487254329e-07, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.0001602171423382153, + "loss": 0.0085, "step": 184710 }, { - "epoch": 2.0, - "learning_rate": 4.6053058312252703e-07, - "loss": 0.0037, + "epoch": 0.93, + "learning_rate": 0.00016020957464520132, + "loss": 0.0135, "step": 184720 }, { - "epoch": 2.0, - "learning_rate": 4.4431471751962115e-07, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.0001602020069521873, + "loss": 0.0145, "step": 184730 }, { - "epoch": 2.0, - "learning_rate": 4.280988519167153e-07, - "loss": 0.0069, + "epoch": 0.93, + "learning_rate": 0.00016019443925917328, + "loss": 0.0088, "step": 184740 }, { - "epoch": 2.0, - "learning_rate": 4.118829863138094e-07, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.0001601868715661593, + "loss": 0.0118, "step": 184750 }, { - "epoch": 2.0, - "learning_rate": 3.956671207109035e-07, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.00016017930387314527, + "loss": 0.0097, "step": 184760 }, { - "epoch": 2.0, - "learning_rate": 3.7945125510799763e-07, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016017173618013125, + "loss": 0.0103, "step": 184770 }, { - "epoch": 2.0, - "learning_rate": 3.6323538950509175e-07, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016016416848711726, + "loss": 0.0126, "step": 184780 }, { - "epoch": 2.0, - "learning_rate": 3.470195239021859e-07, - "loss": 0.0064, + "epoch": 0.93, + "learning_rate": 0.00016015660079410324, + "loss": 0.0096, "step": 184790 }, { - "epoch": 2.0, - "learning_rate": 3.3080365829928e-07, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016014903310108923, + "loss": 0.0148, "step": 184800 }, { - "epoch": 2.0, - "learning_rate": 3.145877926963741e-07, - "loss": 0.0082, + "epoch": 0.93, + "learning_rate": 0.0001601414654080752, + "loss": 0.01, "step": 184810 }, { - "epoch": 2.0, - "learning_rate": 2.983719270934682e-07, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016013389771506122, + "loss": 0.0127, "step": 184820 }, { - "epoch": 2.0, - "learning_rate": 2.8215606149056235e-07, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.0001601263300220472, + "loss": 0.0108, "step": 184830 }, { - "epoch": 2.0, - "learning_rate": 2.6594019588765647e-07, - "loss": 0.008, + "epoch": 0.93, + "learning_rate": 0.00016011876232903318, + "loss": 0.012, "step": 184840 }, { - "epoch": 2.0, - "learning_rate": 2.497243302847506e-07, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.0001601111946360192, + "loss": 0.0105, "step": 184850 }, { - "epoch": 2.0, - "learning_rate": 2.335084646818447e-07, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.00016010362694300517, + "loss": 0.0103, "step": 184860 }, { - "epoch": 2.0, - "learning_rate": 2.1729259907893883e-07, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016009605924999115, + "loss": 0.011, "step": 184870 }, { - "epoch": 2.0, - "learning_rate": 2.0107673347603292e-07, - "loss": 0.0079, + "epoch": 0.93, + "learning_rate": 0.00016008849155697716, + "loss": 0.0081, "step": 184880 }, { - "epoch": 2.0, - "learning_rate": 1.8486086787312707e-07, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016008092386396314, + "loss": 0.0086, "step": 184890 }, { - "epoch": 2.0, - "learning_rate": 1.6864500227022116e-07, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016007335617094912, + "loss": 0.0127, "step": 184900 }, { - "epoch": 2.0, - "learning_rate": 1.524291366673153e-07, - "loss": 0.0083, + "epoch": 0.93, + "learning_rate": 0.00016006578847793513, + "loss": 0.0155, "step": 184910 }, { - "epoch": 2.0, - "learning_rate": 1.3621327106440942e-07, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.0001600582207849211, + "loss": 0.0109, "step": 184920 }, { - "epoch": 2.0, - "learning_rate": 1.1999740546150352e-07, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.0001600506530919071, + "loss": 0.0155, "step": 184930 }, { - "epoch": 2.0, - "learning_rate": 1.0378153985859765e-07, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.0001600430853988931, + "loss": 0.0117, "step": 184940 }, { - "epoch": 2.0, - "learning_rate": 8.756567425569176e-08, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.00016003551770587908, + "loss": 0.0119, "step": 184950 }, { - "epoch": 2.0, - "learning_rate": 7.134980865278588e-08, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00016002795001286506, + "loss": 0.011, "step": 184960 }, { - "epoch": 2.0, - "learning_rate": 5.513394304988e-08, - "loss": 0.0064, + "epoch": 0.93, + "learning_rate": 0.00016002038231985105, + "loss": 0.0149, "step": 184970 }, { - "epoch": 2.0, - "learning_rate": 3.891807744697412e-08, + "epoch": 0.93, + "learning_rate": 0.00016001281462683705, + "loss": 0.0125, + "step": 184980 + }, + { + "epoch": 0.93, + "learning_rate": 0.00016000524693382304, + "loss": 0.0125, + "step": 184990 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015999767924080902, + "loss": 0.011, + "step": 185000 + }, + { + "epoch": 0.93, + "eval_cer": 0.914462492734159, + "eval_loss": 0.007860948331654072, + "eval_runtime": 116.6063, + "eval_samples_per_second": 17.152, + "eval_steps_per_second": 4.288, + "step": 185000 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015999011154779503, + "loss": 0.0116, + "step": 185010 + }, + { + "epoch": 0.93, + "learning_rate": 0.000159982543854781, + "loss": 0.012, + "step": 185020 + }, + { + "epoch": 0.93, + "learning_rate": 0.000159974976161767, + "loss": 0.0116, + "step": 185030 + }, + { + "epoch": 0.93, + "learning_rate": 0.000159967408468753, + "loss": 0.0079, + "step": 185040 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015995984077573898, + "loss": 0.0121, + "step": 185050 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015995227308272496, + "loss": 0.0135, + "step": 185060 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015994470538971097, + "loss": 0.0115, + "step": 185070 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015993713769669695, + "loss": 0.014, + "step": 185080 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015992957000368293, + "loss": 0.0133, + "step": 185090 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015992200231066894, + "loss": 0.0094, + "step": 185100 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015991443461765492, + "loss": 0.0103, + "step": 185110 + }, + { + "epoch": 0.93, + "learning_rate": 0.0001599068669246409, + "loss": 0.0099, + "step": 185120 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015989929923162688, + "loss": 0.0108, + "step": 185130 + }, + { + "epoch": 0.93, + "learning_rate": 0.0001598917315386129, + "loss": 0.0136, + "step": 185140 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015988416384559887, + "loss": 0.0139, + "step": 185150 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015987659615258486, + "loss": 0.0114, + "step": 185160 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015986902845957086, + "loss": 0.0136, + "step": 185170 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015986146076655685, + "loss": 0.0112, + "step": 185180 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015985389307354283, + "loss": 0.0153, + "step": 185190 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015984632538052884, + "loss": 0.0131, + "step": 185200 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015983875768751482, + "loss": 0.0103, + "step": 185210 + }, + { + "epoch": 0.93, + "learning_rate": 0.0001598311899945008, + "loss": 0.0106, + "step": 185220 + }, + { + "epoch": 0.93, + "learning_rate": 0.0001598236223014868, + "loss": 0.0123, + "step": 185230 + }, + { + "epoch": 0.93, + "learning_rate": 0.0001598160546084728, + "loss": 0.008, + "step": 185240 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015980848691545877, + "loss": 0.012, + "step": 185250 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015980091922244478, + "loss": 0.0121, + "step": 185260 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015979335152943076, + "loss": 0.0111, + "step": 185270 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015978578383641674, + "loss": 0.0146, + "step": 185280 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015977821614340275, + "loss": 0.0119, + "step": 185290 + }, + { + "epoch": 0.93, + "learning_rate": 0.00015977064845038873, + "loss": 0.0132, + "step": 185300 + }, + { + "epoch": 0.93, + "learning_rate": 0.0001597630807573747, + "loss": 0.0096, + "step": 185310 + }, + { + "epoch": 0.93, + "learning_rate": 0.0001597555130643607, + "loss": 0.0105, + "step": 185320 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001597479453713467, + "loss": 0.0112, + "step": 185330 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015974037767833268, + "loss": 0.0115, + "step": 185340 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015973280998531867, + "loss": 0.012, + "step": 185350 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015972524229230467, + "loss": 0.011, + "step": 185360 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015971767459929066, + "loss": 0.0108, + "step": 185370 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015971010690627664, + "loss": 0.0099, + "step": 185380 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015970253921326265, + "loss": 0.0129, + "step": 185390 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001596949715202486, + "loss": 0.0131, + "step": 185400 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015968740382723458, + "loss": 0.0116, + "step": 185410 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015967983613422056, + "loss": 0.01, + "step": 185420 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015967226844120657, + "loss": 0.0126, + "step": 185430 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015966470074819255, + "loss": 0.012, + "step": 185440 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015965713305517854, + "loss": 0.0098, + "step": 185450 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015964956536216454, + "loss": 0.0106, + "step": 185460 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015964199766915053, + "loss": 0.0097, + "step": 185470 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001596344299761365, + "loss": 0.0099, + "step": 185480 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015962686228312252, + "loss": 0.0096, + "step": 185490 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001596192945901085, + "loss": 0.0108, + "step": 185500 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015961172689709448, + "loss": 0.0105, + "step": 185510 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015960415920408046, + "loss": 0.0134, + "step": 185520 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015959659151106647, + "loss": 0.0107, + "step": 185530 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015958902381805245, + "loss": 0.0136, + "step": 185540 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015958145612503843, + "loss": 0.0106, + "step": 185550 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015957388843202444, + "loss": 0.0099, + "step": 185560 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015956632073901042, + "loss": 0.0086, + "step": 185570 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001595587530459964, + "loss": 0.0096, + "step": 185580 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001595511853529824, + "loss": 0.0106, + "step": 185590 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001595436176599684, + "loss": 0.0107, + "step": 185600 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015953604996695437, + "loss": 0.0132, + "step": 185610 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015952848227394038, + "loss": 0.0111, + "step": 185620 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015952091458092636, + "loss": 0.0099, + "step": 185630 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015951334688791235, + "loss": 0.0086, + "step": 185640 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015950577919489835, + "loss": 0.0127, + "step": 185650 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015949821150188434, + "loss": 0.0112, + "step": 185660 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015949064380887032, + "loss": 0.0113, + "step": 185670 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015948307611585633, + "loss": 0.0143, + "step": 185680 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001594755084228423, + "loss": 0.0089, + "step": 185690 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001594679407298283, + "loss": 0.0097, + "step": 185700 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015946037303681427, + "loss": 0.0129, + "step": 185710 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015945280534380028, + "loss": 0.0104, + "step": 185720 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015944523765078626, + "loss": 0.013, + "step": 185730 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015943766995777224, + "loss": 0.0126, + "step": 185740 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015943010226475825, + "loss": 0.0141, + "step": 185750 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015942253457174423, + "loss": 0.0103, + "step": 185760 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001594149668787302, + "loss": 0.0125, + "step": 185770 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015940739918571622, + "loss": 0.0082, + "step": 185780 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001593998314927022, + "loss": 0.0079, + "step": 185790 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015939226379968818, + "loss": 0.01, + "step": 185800 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001593846961066742, + "loss": 0.0102, + "step": 185810 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015937712841366017, + "loss": 0.0099, + "step": 185820 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015936956072064616, + "loss": 0.0109, + "step": 185830 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015936199302763216, + "loss": 0.0145, + "step": 185840 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015935442533461815, + "loss": 0.01, + "step": 185850 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015934685764160413, + "loss": 0.0086, + "step": 185860 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001593392899485901, + "loss": 0.0128, + "step": 185870 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015933172225557612, + "loss": 0.0136, + "step": 185880 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001593241545625621, + "loss": 0.0108, + "step": 185890 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015931658686954808, + "loss": 0.0102, + "step": 185900 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001593090191765341, + "loss": 0.0113, + "step": 185910 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015930145148352007, + "loss": 0.0132, + "step": 185920 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015929388379050605, + "loss": 0.0095, + "step": 185930 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015928631609749206, + "loss": 0.0114, + "step": 185940 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015927874840447804, + "loss": 0.0119, + "step": 185950 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015927118071146402, + "loss": 0.0126, + "step": 185960 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015926361301845003, + "loss": 0.011, + "step": 185970 + }, + { + "epoch": 0.94, + "learning_rate": 0.000159256045325436, + "loss": 0.0141, + "step": 185980 + }, + { + "epoch": 0.94, + "learning_rate": 0.000159248477632422, + "loss": 0.015, + "step": 185990 + }, + { + "epoch": 0.94, + "learning_rate": 0.000159240909939408, + "loss": 0.009, + "step": 186000 + }, + { + "epoch": 0.94, + "eval_cer": 0.9144770486760401, + "eval_loss": 0.007943259552121162, + "eval_runtime": 116.7604, + "eval_samples_per_second": 17.129, + "eval_steps_per_second": 4.282, + "step": 186000 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015923334224639398, + "loss": 0.0097, + "step": 186010 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015922577455337997, + "loss": 0.0079, + "step": 186020 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015921820686036595, + "loss": 0.0128, + "step": 186030 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015921063916735196, + "loss": 0.0144, + "step": 186040 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015920307147433794, + "loss": 0.0111, + "step": 186050 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015919550378132392, + "loss": 0.0096, + "step": 186060 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015918793608830993, + "loss": 0.013, + "step": 186070 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001591803683952959, + "loss": 0.0161, + "step": 186080 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001591728007022819, + "loss": 0.0114, + "step": 186090 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001591652330092679, + "loss": 0.0094, + "step": 186100 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015915766531625388, + "loss": 0.0103, + "step": 186110 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015915009762323986, + "loss": 0.0126, + "step": 186120 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015914252993022587, + "loss": 0.0112, + "step": 186130 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015913496223721185, + "loss": 0.0088, + "step": 186140 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015912739454419783, + "loss": 0.0111, + "step": 186150 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015911982685118384, + "loss": 0.0117, + "step": 186160 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015911225915816982, + "loss": 0.0117, + "step": 186170 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001591046914651558, + "loss": 0.012, + "step": 186180 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001590971237721418, + "loss": 0.0109, + "step": 186190 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001590895560791278, + "loss": 0.0093, + "step": 186200 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015908198838611378, + "loss": 0.0102, + "step": 186210 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015907442069309976, + "loss": 0.0135, + "step": 186220 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015906685300008577, + "loss": 0.0086, + "step": 186230 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015905928530707175, + "loss": 0.0155, + "step": 186240 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015905171761405773, + "loss": 0.0118, + "step": 186250 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015904414992104374, + "loss": 0.0116, + "step": 186260 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015903658222802972, + "loss": 0.0095, + "step": 186270 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001590290145350157, + "loss": 0.0111, + "step": 186280 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001590214468420017, + "loss": 0.0091, + "step": 186290 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001590138791489877, + "loss": 0.0104, + "step": 186300 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015900631145597367, + "loss": 0.0116, + "step": 186310 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015899874376295968, + "loss": 0.0112, + "step": 186320 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015899117606994566, + "loss": 0.0107, + "step": 186330 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015898360837693164, + "loss": 0.0101, + "step": 186340 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015897604068391765, + "loss": 0.0103, + "step": 186350 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015896847299090363, + "loss": 0.0118, + "step": 186360 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015896090529788961, + "loss": 0.0097, + "step": 186370 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001589533376048756, + "loss": 0.0106, + "step": 186380 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001589457699118616, + "loss": 0.0124, + "step": 186390 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015893820221884759, + "loss": 0.0153, + "step": 186400 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015893063452583357, + "loss": 0.0115, + "step": 186410 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015892306683281958, + "loss": 0.012, + "step": 186420 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015891549913980556, + "loss": 0.009, + "step": 186430 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015890793144679154, + "loss": 0.0108, + "step": 186440 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015890036375377755, + "loss": 0.0126, + "step": 186450 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015889279606076353, + "loss": 0.0138, + "step": 186460 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001588852283677495, + "loss": 0.0125, + "step": 186470 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015887766067473552, + "loss": 0.0121, + "step": 186480 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001588700929817215, + "loss": 0.0104, + "step": 186490 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015886252528870748, + "loss": 0.0107, + "step": 186500 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001588549575956935, + "loss": 0.0085, + "step": 186510 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015884738990267947, + "loss": 0.0113, + "step": 186520 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015883982220966545, + "loss": 0.0113, + "step": 186530 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015883225451665143, + "loss": 0.0158, + "step": 186540 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015882468682363744, + "loss": 0.0127, + "step": 186550 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015881711913062342, + "loss": 0.0126, + "step": 186560 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001588095514376094, + "loss": 0.0101, + "step": 186570 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015880198374459541, + "loss": 0.0081, + "step": 186580 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001587944160515814, + "loss": 0.0106, + "step": 186590 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015878684835856738, + "loss": 0.011, + "step": 186600 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015877928066555339, + "loss": 0.011, + "step": 186610 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015877171297253937, + "loss": 0.0128, + "step": 186620 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015876414527952535, + "loss": 0.0105, + "step": 186630 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015875657758651136, + "loss": 0.0107, + "step": 186640 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001587490098934973, + "loss": 0.0127, + "step": 186650 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001587414422004833, + "loss": 0.0122, + "step": 186660 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015873387450746927, + "loss": 0.0093, + "step": 186670 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015872630681445528, + "loss": 0.0083, + "step": 186680 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015871873912144126, + "loss": 0.0115, + "step": 186690 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015871117142842725, + "loss": 0.0109, + "step": 186700 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015870360373541325, + "loss": 0.0138, + "step": 186710 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015869603604239924, + "loss": 0.0147, + "step": 186720 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015868846834938522, + "loss": 0.0085, + "step": 186730 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015868090065637123, + "loss": 0.0137, + "step": 186740 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001586733329633572, + "loss": 0.009, + "step": 186750 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001586657652703432, + "loss": 0.0097, + "step": 186760 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015865819757732917, + "loss": 0.0115, + "step": 186770 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015865062988431518, + "loss": 0.0125, + "step": 186780 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015864306219130116, + "loss": 0.0111, + "step": 186790 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015863549449828714, + "loss": 0.0114, + "step": 186800 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015862792680527315, + "loss": 0.0077, + "step": 186810 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015862035911225913, + "loss": 0.0107, + "step": 186820 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001586127914192451, + "loss": 0.0151, + "step": 186830 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015860522372623112, + "loss": 0.0114, + "step": 186840 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001585976560332171, + "loss": 0.0116, + "step": 186850 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015859008834020308, + "loss": 0.0129, + "step": 186860 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001585825206471891, + "loss": 0.0098, + "step": 186870 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015857495295417507, + "loss": 0.0087, + "step": 186880 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015856738526116106, + "loss": 0.01, + "step": 186890 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015855981756814706, + "loss": 0.0097, + "step": 186900 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015855224987513305, + "loss": 0.0105, + "step": 186910 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015854468218211903, + "loss": 0.0258, + "step": 186920 + }, + { + "epoch": 0.94, + "learning_rate": 0.000158537114489105, + "loss": 0.0128, + "step": 186930 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015852954679609102, + "loss": 0.0108, + "step": 186940 + }, + { + "epoch": 0.94, + "learning_rate": 0.000158521979103077, + "loss": 0.0101, + "step": 186950 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015851441141006298, + "loss": 0.0141, + "step": 186960 + }, + { + "epoch": 0.94, + "learning_rate": 0.000158506843717049, + "loss": 0.0093, + "step": 186970 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015849927602403497, + "loss": 0.013, + "step": 186980 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015849170833102095, + "loss": 0.0117, + "step": 186990 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015848414063800696, + "loss": 0.0092, + "step": 187000 + }, + { + "epoch": 0.94, + "eval_cer": 0.9144683151109114, + "eval_loss": 0.008203052915632725, + "eval_runtime": 116.5799, + "eval_samples_per_second": 17.156, + "eval_steps_per_second": 4.289, + "step": 187000 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015847657294499294, + "loss": 0.0105, + "step": 187010 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015846900525197892, + "loss": 0.0123, + "step": 187020 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015846143755896493, + "loss": 0.0105, + "step": 187030 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001584538698659509, + "loss": 0.0101, + "step": 187040 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001584463021729369, + "loss": 0.011, + "step": 187050 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001584387344799229, + "loss": 0.0118, + "step": 187060 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015843116678690888, + "loss": 0.0107, + "step": 187070 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015842359909389487, + "loss": 0.0115, + "step": 187080 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015841603140088087, + "loss": 0.0144, + "step": 187090 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015840846370786686, + "loss": 0.0095, + "step": 187100 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015840089601485284, + "loss": 0.0094, + "step": 187110 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015839332832183882, + "loss": 0.0117, + "step": 187120 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015838576062882483, + "loss": 0.0097, + "step": 187130 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001583781929358108, + "loss": 0.0117, + "step": 187140 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001583706252427968, + "loss": 0.0119, + "step": 187150 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001583630575497828, + "loss": 0.0154, + "step": 187160 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015835548985676878, + "loss": 0.0117, + "step": 187170 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015834792216375476, + "loss": 0.0104, + "step": 187180 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015834035447074077, + "loss": 0.0125, + "step": 187190 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015833278677772675, + "loss": 0.0103, + "step": 187200 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015832521908471273, + "loss": 0.0092, + "step": 187210 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015831765139169874, + "loss": 0.0115, + "step": 187220 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015831008369868472, + "loss": 0.0091, + "step": 187230 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001583025160056707, + "loss": 0.012, + "step": 187240 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001582949483126567, + "loss": 0.0107, + "step": 187250 + }, + { + "epoch": 0.94, + "learning_rate": 0.0001582873806196427, + "loss": 0.013, + "step": 187260 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015827981292662868, + "loss": 0.0093, + "step": 187270 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015827224523361466, + "loss": 0.01, + "step": 187280 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015826467754060067, + "loss": 0.0129, + "step": 187290 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015825710984758665, + "loss": 0.0106, + "step": 187300 + }, + { + "epoch": 0.94, + "learning_rate": 0.00015824954215457263, + "loss": 0.0137, + "step": 187310 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015824197446155864, + "loss": 0.0125, + "step": 187320 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015823440676854462, + "loss": 0.0132, + "step": 187330 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001582268390755306, + "loss": 0.009, + "step": 187340 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001582192713825166, + "loss": 0.01, + "step": 187350 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001582117036895026, + "loss": 0.0105, + "step": 187360 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015820413599648857, + "loss": 0.0109, + "step": 187370 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015819656830347458, + "loss": 0.0111, + "step": 187380 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015818900061046056, + "loss": 0.0111, + "step": 187390 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015818143291744654, + "loss": 0.0107, + "step": 187400 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015817386522443255, + "loss": 0.0106, + "step": 187410 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015816629753141853, + "loss": 0.0117, + "step": 187420 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015815872983840451, + "loss": 0.0103, + "step": 187430 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001581511621453905, + "loss": 0.0115, + "step": 187440 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001581435944523765, + "loss": 0.009, + "step": 187450 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015813602675936249, + "loss": 0.0094, + "step": 187460 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015812845906634847, + "loss": 0.0108, + "step": 187470 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015812089137333448, + "loss": 0.011, + "step": 187480 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015811332368032046, + "loss": 0.014, + "step": 187490 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015810575598730644, + "loss": 0.0104, + "step": 187500 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015809818829429245, + "loss": 0.0112, + "step": 187510 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015809062060127843, + "loss": 0.0125, + "step": 187520 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001580830529082644, + "loss": 0.0116, + "step": 187530 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015807548521525042, + "loss": 0.0097, + "step": 187540 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001580679175222364, + "loss": 0.0106, + "step": 187550 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015806034982922238, + "loss": 0.0099, + "step": 187560 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001580527821362084, + "loss": 0.0089, + "step": 187570 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015804521444319437, + "loss": 0.0098, + "step": 187580 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015803764675018035, + "loss": 0.0096, + "step": 187590 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015803007905716636, + "loss": 0.0102, + "step": 187600 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015802251136415234, + "loss": 0.0095, + "step": 187610 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015801494367113832, + "loss": 0.0086, + "step": 187620 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001580073759781243, + "loss": 0.0103, + "step": 187630 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015799980828511031, + "loss": 0.0101, + "step": 187640 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001579922405920963, + "loss": 0.0092, + "step": 187650 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015798467289908228, + "loss": 0.012, + "step": 187660 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015797710520606829, + "loss": 0.0101, + "step": 187670 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015796953751305427, + "loss": 0.0102, + "step": 187680 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015796196982004025, + "loss": 0.0162, + "step": 187690 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015795440212702626, + "loss": 0.0118, + "step": 187700 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015794683443401224, + "loss": 0.0115, + "step": 187710 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015793926674099822, + "loss": 0.0102, + "step": 187720 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015793169904798423, + "loss": 0.0111, + "step": 187730 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001579241313549702, + "loss": 0.0103, + "step": 187740 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001579165636619562, + "loss": 0.01, + "step": 187750 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001579089959689422, + "loss": 0.0111, + "step": 187760 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015790142827592818, + "loss": 0.013, + "step": 187770 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015789386058291416, + "loss": 0.0097, + "step": 187780 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015788629288990014, + "loss": 0.0103, + "step": 187790 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015787872519688615, + "loss": 0.0123, + "step": 187800 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015787115750387213, + "loss": 0.0122, + "step": 187810 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015786358981085812, + "loss": 0.0125, + "step": 187820 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015785602211784412, + "loss": 0.0115, + "step": 187830 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001578484544248301, + "loss": 0.0089, + "step": 187840 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001578408867318161, + "loss": 0.0115, + "step": 187850 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001578333190388021, + "loss": 0.0122, + "step": 187860 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015782575134578808, + "loss": 0.0133, + "step": 187870 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015781818365277406, + "loss": 0.0117, + "step": 187880 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015781061595976007, + "loss": 0.012, + "step": 187890 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015780304826674605, + "loss": 0.0097, + "step": 187900 + }, + { + "epoch": 0.95, + "learning_rate": 0.000157795480573732, + "loss": 0.01, + "step": 187910 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015778791288071798, + "loss": 0.0114, + "step": 187920 + }, + { + "epoch": 0.95, + "learning_rate": 0.000157780345187704, + "loss": 0.0124, + "step": 187930 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015777277749468997, + "loss": 0.0115, + "step": 187940 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015776520980167596, + "loss": 0.0108, + "step": 187950 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015775764210866196, + "loss": 0.0098, + "step": 187960 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015775007441564795, + "loss": 0.0136, + "step": 187970 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015774250672263393, + "loss": 0.0113, + "step": 187980 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015773493902961994, + "loss": 0.0107, + "step": 187990 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015772737133660592, + "loss": 0.0113, + "step": 188000 + }, + { + "epoch": 0.95, + "eval_cer": 0.9144634631302844, + "eval_loss": 0.007855391129851341, + "eval_runtime": 116.599, + "eval_samples_per_second": 17.153, + "eval_steps_per_second": 4.288, + "step": 188000 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001577198036435919, + "loss": 0.0129, + "step": 188010 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015771223595057788, + "loss": 0.0086, + "step": 188020 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001577046682575639, + "loss": 0.0094, + "step": 188030 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015769710056454987, + "loss": 0.0116, + "step": 188040 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015768953287153585, + "loss": 0.0123, + "step": 188050 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015768196517852186, + "loss": 0.0144, + "step": 188060 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015767439748550784, + "loss": 0.0107, + "step": 188070 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015766682979249382, + "loss": 0.0162, + "step": 188080 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015765926209947983, + "loss": 0.0106, + "step": 188090 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001576516944064658, + "loss": 0.0096, + "step": 188100 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001576441267134518, + "loss": 0.0101, + "step": 188110 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001576365590204378, + "loss": 0.0105, + "step": 188120 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015762899132742378, + "loss": 0.0114, + "step": 188130 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015762142363440977, + "loss": 0.0119, + "step": 188140 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015761385594139577, + "loss": 0.0193, + "step": 188150 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015760628824838176, + "loss": 0.0105, + "step": 188160 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015759872055536774, + "loss": 0.0125, + "step": 188170 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015759115286235372, + "loss": 0.0126, + "step": 188180 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015758358516933973, + "loss": 0.0122, + "step": 188190 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001575760174763257, + "loss": 0.0094, + "step": 188200 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001575684497833117, + "loss": 0.0111, + "step": 188210 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001575608820902977, + "loss": 0.0177, + "step": 188220 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015755331439728368, + "loss": 0.0131, + "step": 188230 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015754574670426966, + "loss": 0.0095, + "step": 188240 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015753817901125567, + "loss": 0.0118, + "step": 188250 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015753061131824165, + "loss": 0.0136, + "step": 188260 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015752304362522763, + "loss": 0.0103, + "step": 188270 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015751547593221364, + "loss": 0.0129, + "step": 188280 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015750790823919962, + "loss": 0.008, + "step": 188290 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001575003405461856, + "loss": 0.0145, + "step": 188300 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001574927728531716, + "loss": 0.0092, + "step": 188310 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001574852051601576, + "loss": 0.0074, + "step": 188320 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015747763746714358, + "loss": 0.0131, + "step": 188330 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015747006977412956, + "loss": 0.0084, + "step": 188340 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015746250208111557, + "loss": 0.009, + "step": 188350 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015745493438810155, + "loss": 0.0124, + "step": 188360 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015744736669508753, + "loss": 0.0099, + "step": 188370 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015743979900207354, + "loss": 0.0109, + "step": 188380 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015743223130905952, + "loss": 0.0141, + "step": 188390 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001574246636160455, + "loss": 0.0107, + "step": 188400 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001574170959230315, + "loss": 0.01, + "step": 188410 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001574095282300175, + "loss": 0.0109, + "step": 188420 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015740196053700347, + "loss": 0.011, + "step": 188430 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015739439284398948, + "loss": 0.0098, + "step": 188440 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015738682515097546, + "loss": 0.0111, + "step": 188450 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015737925745796144, + "loss": 0.012, + "step": 188460 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015737168976494745, + "loss": 0.0101, + "step": 188470 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015736412207193343, + "loss": 0.0145, + "step": 188480 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015735655437891941, + "loss": 0.0085, + "step": 188490 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015734898668590542, + "loss": 0.0097, + "step": 188500 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001573414189928914, + "loss": 0.0104, + "step": 188510 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015733385129987739, + "loss": 0.0106, + "step": 188520 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015732628360686337, + "loss": 0.011, + "step": 188530 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015731871591384938, + "loss": 0.0121, + "step": 188540 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015731114822083536, + "loss": 0.01, + "step": 188550 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015730358052782134, + "loss": 0.0083, + "step": 188560 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015729601283480735, + "loss": 0.0116, + "step": 188570 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015728844514179333, + "loss": 0.0102, + "step": 188580 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001572808774487793, + "loss": 0.0147, + "step": 188590 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015727330975576532, + "loss": 0.0122, + "step": 188600 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001572657420627513, + "loss": 0.0106, + "step": 188610 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015725817436973728, + "loss": 0.0098, + "step": 188620 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001572506066767233, + "loss": 0.0113, + "step": 188630 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015724303898370927, + "loss": 0.0146, + "step": 188640 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015723547129069525, + "loss": 0.0117, + "step": 188650 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015722790359768126, + "loss": 0.0104, + "step": 188660 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015722033590466724, + "loss": 0.0114, + "step": 188670 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015721276821165322, + "loss": 0.01, + "step": 188680 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001572052005186392, + "loss": 0.0117, + "step": 188690 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015719763282562521, + "loss": 0.0088, + "step": 188700 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001571900651326112, + "loss": 0.0097, + "step": 188710 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015718249743959718, + "loss": 0.0093, + "step": 188720 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015717492974658319, + "loss": 0.0149, + "step": 188730 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015716736205356917, + "loss": 0.0106, + "step": 188740 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015715979436055515, + "loss": 0.0145, + "step": 188750 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015715222666754116, + "loss": 0.0096, + "step": 188760 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015714465897452714, + "loss": 0.0119, + "step": 188770 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015713709128151312, + "loss": 0.013, + "step": 188780 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015712952358849913, + "loss": 0.0107, + "step": 188790 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001571219558954851, + "loss": 0.012, + "step": 188800 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001571143882024711, + "loss": 0.0102, + "step": 188810 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001571068205094571, + "loss": 0.0105, + "step": 188820 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015709925281644308, + "loss": 0.0123, + "step": 188830 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015709168512342906, + "loss": 0.0121, + "step": 188840 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015708411743041504, + "loss": 0.0089, + "step": 188850 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015707654973740105, + "loss": 0.0112, + "step": 188860 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015706898204438703, + "loss": 0.0091, + "step": 188870 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015706141435137302, + "loss": 0.0136, + "step": 188880 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015705384665835902, + "loss": 0.0114, + "step": 188890 + }, + { + "epoch": 0.95, + "learning_rate": 0.000157046278965345, + "loss": 0.0123, + "step": 188900 + }, + { + "epoch": 0.95, + "learning_rate": 0.000157038711272331, + "loss": 0.012, + "step": 188910 + }, + { + "epoch": 0.95, + "learning_rate": 0.000157031143579317, + "loss": 0.0139, + "step": 188920 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015702357588630298, + "loss": 0.0113, + "step": 188930 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015701600819328896, + "loss": 0.011, + "step": 188940 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015700844050027497, + "loss": 0.011, + "step": 188950 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015700087280726095, + "loss": 0.014, + "step": 188960 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015699330511424693, + "loss": 0.0108, + "step": 188970 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015698573742123294, + "loss": 0.0092, + "step": 188980 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015697816972821892, + "loss": 0.0115, + "step": 188990 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001569706020352049, + "loss": 0.011, + "step": 189000 + }, + { + "epoch": 0.95, + "eval_cer": 0.914452788772905, + "eval_loss": 0.00806601531803608, + "eval_runtime": 116.7489, + "eval_samples_per_second": 17.131, + "eval_steps_per_second": 4.283, + "step": 189000 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015696303434219088, + "loss": 0.0111, + "step": 189010 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001569554666491769, + "loss": 0.0127, + "step": 189020 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015694789895616287, + "loss": 0.0139, + "step": 189030 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015694033126314885, + "loss": 0.0113, + "step": 189040 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015693276357013486, + "loss": 0.0078, + "step": 189050 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015692519587712084, + "loss": 0.0086, + "step": 189060 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015691762818410683, + "loss": 0.0113, + "step": 189070 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015691006049109283, + "loss": 0.01, + "step": 189080 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015690249279807882, + "loss": 0.0086, + "step": 189090 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001568949251050648, + "loss": 0.0109, + "step": 189100 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001568873574120508, + "loss": 0.0137, + "step": 189110 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001568797897190368, + "loss": 0.0101, + "step": 189120 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015687222202602277, + "loss": 0.0116, + "step": 189130 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015686465433300878, + "loss": 0.0092, + "step": 189140 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015685708663999476, + "loss": 0.0101, + "step": 189150 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015684951894698074, + "loss": 0.0123, + "step": 189160 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001568419512539667, + "loss": 0.0086, + "step": 189170 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001568343835609527, + "loss": 0.0103, + "step": 189180 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015682681586793868, + "loss": 0.0126, + "step": 189190 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015681924817492467, + "loss": 0.01, + "step": 189200 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015681168048191067, + "loss": 0.0118, + "step": 189210 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015680411278889666, + "loss": 0.0127, + "step": 189220 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015679654509588264, + "loss": 0.0202, + "step": 189230 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015678897740286862, + "loss": 0.0107, + "step": 189240 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015678140970985463, + "loss": 0.0112, + "step": 189250 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001567738420168406, + "loss": 0.0098, + "step": 189260 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001567662743238266, + "loss": 0.0149, + "step": 189270 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001567587066308126, + "loss": 0.0101, + "step": 189280 + }, + { + "epoch": 0.95, + "learning_rate": 0.00015675113893779858, + "loss": 0.0107, + "step": 189290 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015674357124478456, + "loss": 0.0113, + "step": 189300 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015673600355177057, + "loss": 0.0112, + "step": 189310 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015672843585875655, + "loss": 0.0077, + "step": 189320 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015672086816574253, + "loss": 0.0113, + "step": 189330 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015671330047272854, + "loss": 0.0103, + "step": 189340 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015670573277971452, + "loss": 0.0102, + "step": 189350 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001566981650867005, + "loss": 0.0132, + "step": 189360 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001566905973936865, + "loss": 0.0088, + "step": 189370 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001566830297006725, + "loss": 0.0096, + "step": 189380 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015667546200765848, + "loss": 0.0092, + "step": 189390 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015666789431464446, + "loss": 0.0115, + "step": 189400 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015666032662163047, + "loss": 0.0137, + "step": 189410 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015665275892861645, + "loss": 0.011, + "step": 189420 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015664519123560243, + "loss": 0.0121, + "step": 189430 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015663762354258844, + "loss": 0.012, + "step": 189440 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015663005584957442, + "loss": 0.011, + "step": 189450 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001566224881565604, + "loss": 0.0103, + "step": 189460 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001566149204635464, + "loss": 0.0119, + "step": 189470 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001566073527705324, + "loss": 0.0121, + "step": 189480 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015659978507751837, + "loss": 0.0132, + "step": 189490 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015659221738450438, + "loss": 0.013, + "step": 189500 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015658464969149036, + "loss": 0.0111, + "step": 189510 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015657708199847634, + "loss": 0.0101, + "step": 189520 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015656951430546235, + "loss": 0.0119, + "step": 189530 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015656194661244833, + "loss": 0.0144, + "step": 189540 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015655437891943431, + "loss": 0.0126, + "step": 189550 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015654681122642032, + "loss": 0.0141, + "step": 189560 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001565392435334063, + "loss": 0.0121, + "step": 189570 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015653167584039229, + "loss": 0.0121, + "step": 189580 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015652410814737827, + "loss": 0.0111, + "step": 189590 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015651654045436428, + "loss": 0.0164, + "step": 189600 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015650897276135026, + "loss": 0.0104, + "step": 189610 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015650140506833624, + "loss": 0.01, + "step": 189620 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015649383737532225, + "loss": 0.0107, + "step": 189630 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015648626968230823, + "loss": 0.009, + "step": 189640 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001564787019892942, + "loss": 0.01, + "step": 189650 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015647113429628022, + "loss": 0.0113, + "step": 189660 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001564635666032662, + "loss": 0.01, + "step": 189670 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015645599891025218, + "loss": 0.0103, + "step": 189680 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001564484312172382, + "loss": 0.0125, + "step": 189690 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015644086352422417, + "loss": 0.0104, + "step": 189700 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015643329583121015, + "loss": 0.0115, + "step": 189710 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015642572813819616, + "loss": 0.0115, + "step": 189720 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015641816044518214, + "loss": 0.0129, + "step": 189730 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015641059275216812, + "loss": 0.0112, + "step": 189740 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001564030250591541, + "loss": 0.0146, + "step": 189750 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015639545736614011, + "loss": 0.0113, + "step": 189760 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001563878896731261, + "loss": 0.0109, + "step": 189770 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015638032198011208, + "loss": 0.0087, + "step": 189780 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015637275428709809, + "loss": 0.013, + "step": 189790 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015636518659408407, + "loss": 0.0112, + "step": 189800 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015635761890107005, + "loss": 0.0089, + "step": 189810 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015635005120805606, + "loss": 0.0102, + "step": 189820 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015634248351504204, + "loss": 0.0118, + "step": 189830 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015633491582202802, + "loss": 0.0108, + "step": 189840 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015632734812901403, + "loss": 0.0128, + "step": 189850 + }, + { + "epoch": 0.96, + "learning_rate": 0.000156319780436, + "loss": 0.0129, + "step": 189860 + }, + { + "epoch": 0.96, + "learning_rate": 0.000156312212742986, + "loss": 0.0146, + "step": 189870 + }, + { + "epoch": 0.96, + "learning_rate": 0.000156304645049972, + "loss": 0.0115, + "step": 189880 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015629707735695798, + "loss": 0.0125, + "step": 189890 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015628950966394396, + "loss": 0.0111, + "step": 189900 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015628194197092994, + "loss": 0.0099, + "step": 189910 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015627437427791595, + "loss": 0.0115, + "step": 189920 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015626680658490193, + "loss": 0.0115, + "step": 189930 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015625923889188792, + "loss": 0.0134, + "step": 189940 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015625167119887392, + "loss": 0.0137, + "step": 189950 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001562441035058599, + "loss": 0.0102, + "step": 189960 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001562365358128459, + "loss": 0.0099, + "step": 189970 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001562289681198319, + "loss": 0.0129, + "step": 189980 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015622140042681788, + "loss": 0.0099, + "step": 189990 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015621383273380386, + "loss": 0.0097, + "step": 190000 + }, + { + "epoch": 0.96, + "eval_cer": 0.9144372624348985, + "eval_loss": 0.007905209437012672, + "eval_runtime": 116.6163, + "eval_samples_per_second": 17.15, + "eval_steps_per_second": 4.288, + "step": 190000 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015620626504078987, + "loss": 0.0084, + "step": 190010 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015619869734777585, + "loss": 0.0122, + "step": 190020 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015619112965476183, + "loss": 0.0101, + "step": 190030 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015618356196174784, + "loss": 0.0118, + "step": 190040 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015617599426873382, + "loss": 0.0215, + "step": 190050 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001561684265757198, + "loss": 0.0112, + "step": 190060 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001561608588827058, + "loss": 0.0125, + "step": 190070 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001561532911896918, + "loss": 0.0126, + "step": 190080 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015614572349667777, + "loss": 0.0125, + "step": 190090 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015613815580366375, + "loss": 0.0092, + "step": 190100 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015613058811064976, + "loss": 0.0112, + "step": 190110 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015612302041763574, + "loss": 0.0096, + "step": 190120 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015611545272462173, + "loss": 0.0126, + "step": 190130 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015610788503160773, + "loss": 0.0112, + "step": 190140 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015610031733859372, + "loss": 0.0103, + "step": 190150 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001560927496455797, + "loss": 0.0125, + "step": 190160 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001560851819525657, + "loss": 0.0109, + "step": 190170 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001560776142595517, + "loss": 0.0121, + "step": 190180 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015607004656653767, + "loss": 0.0132, + "step": 190190 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015606247887352368, + "loss": 0.0111, + "step": 190200 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015605491118050966, + "loss": 0.0108, + "step": 190210 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015604734348749564, + "loss": 0.0111, + "step": 190220 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015603977579448165, + "loss": 0.0101, + "step": 190230 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015603220810146763, + "loss": 0.0088, + "step": 190240 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001560246404084536, + "loss": 0.0106, + "step": 190250 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001560170727154396, + "loss": 0.0122, + "step": 190260 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001560095050224256, + "loss": 0.009, + "step": 190270 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015600193732941158, + "loss": 0.0112, + "step": 190280 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015599436963639756, + "loss": 0.0135, + "step": 190290 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015598680194338357, + "loss": 0.01, + "step": 190300 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015597923425036955, + "loss": 0.0093, + "step": 190310 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015597166655735554, + "loss": 0.0127, + "step": 190320 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015596409886434154, + "loss": 0.0094, + "step": 190330 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015595653117132753, + "loss": 0.011, + "step": 190340 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001559489634783135, + "loss": 0.0144, + "step": 190350 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015594139578529952, + "loss": 0.0136, + "step": 190360 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001559338280922855, + "loss": 0.0114, + "step": 190370 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015592626039927148, + "loss": 0.0125, + "step": 190380 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001559186927062575, + "loss": 0.0101, + "step": 190390 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015591112501324347, + "loss": 0.0085, + "step": 190400 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015590355732022945, + "loss": 0.0114, + "step": 190410 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001558959896272154, + "loss": 0.0112, + "step": 190420 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001558884219342014, + "loss": 0.0115, + "step": 190430 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001558808542411874, + "loss": 0.0117, + "step": 190440 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015587328654817338, + "loss": 0.0104, + "step": 190450 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015586571885515938, + "loss": 0.0103, + "step": 190460 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015585815116214537, + "loss": 0.0116, + "step": 190470 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015585058346913135, + "loss": 0.0113, + "step": 190480 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015584301577611733, + "loss": 0.0103, + "step": 190490 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015583544808310334, + "loss": 0.0102, + "step": 190500 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015582788039008932, + "loss": 0.0087, + "step": 190510 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001558203126970753, + "loss": 0.0127, + "step": 190520 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001558127450040613, + "loss": 0.013, + "step": 190530 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001558051773110473, + "loss": 0.0117, + "step": 190540 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015579760961803327, + "loss": 0.0135, + "step": 190550 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015579004192501928, + "loss": 0.0127, + "step": 190560 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015578247423200526, + "loss": 0.0109, + "step": 190570 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015577490653899124, + "loss": 0.0144, + "step": 190580 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015576733884597725, + "loss": 0.0103, + "step": 190590 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015575977115296323, + "loss": 0.0139, + "step": 190600 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015575220345994921, + "loss": 0.0113, + "step": 190610 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015574463576693522, + "loss": 0.0121, + "step": 190620 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001557370680739212, + "loss": 0.0111, + "step": 190630 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015572950038090719, + "loss": 0.0127, + "step": 190640 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015572193268789317, + "loss": 0.0088, + "step": 190650 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015571436499487918, + "loss": 0.0107, + "step": 190660 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015570679730186516, + "loss": 0.0117, + "step": 190670 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015569922960885114, + "loss": 0.0096, + "step": 190680 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015569166191583715, + "loss": 0.0086, + "step": 190690 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015568409422282313, + "loss": 0.0094, + "step": 190700 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001556765265298091, + "loss": 0.0124, + "step": 190710 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015566895883679512, + "loss": 0.0153, + "step": 190720 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001556613911437811, + "loss": 0.0129, + "step": 190730 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015565382345076708, + "loss": 0.0149, + "step": 190740 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001556462557577531, + "loss": 0.0097, + "step": 190750 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015563868806473907, + "loss": 0.0132, + "step": 190760 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015563112037172505, + "loss": 0.0123, + "step": 190770 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015562355267871106, + "loss": 0.0087, + "step": 190780 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015561598498569704, + "loss": 0.0105, + "step": 190790 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015560841729268302, + "loss": 0.011, + "step": 190800 + }, + { + "epoch": 0.96, + "learning_rate": 0.000155600849599669, + "loss": 0.0134, + "step": 190810 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015559328190665501, + "loss": 0.0107, + "step": 190820 + }, + { + "epoch": 0.96, + "learning_rate": 0.000155585714213641, + "loss": 0.0108, + "step": 190830 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015557814652062698, + "loss": 0.0093, + "step": 190840 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015557057882761299, + "loss": 0.0116, + "step": 190850 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015556301113459897, + "loss": 0.0125, + "step": 190860 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015555544344158495, + "loss": 0.0064, + "step": 190870 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015554787574857096, + "loss": 0.0104, + "step": 190880 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015554030805555694, + "loss": 0.0098, + "step": 190890 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015553274036254292, + "loss": 0.0099, + "step": 190900 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015552517266952893, + "loss": 0.0113, + "step": 190910 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001555176049765149, + "loss": 0.0112, + "step": 190920 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001555100372835009, + "loss": 0.0103, + "step": 190930 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001555024695904869, + "loss": 0.0096, + "step": 190940 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015549490189747288, + "loss": 0.0077, + "step": 190950 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015548733420445886, + "loss": 0.0111, + "step": 190960 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015547976651144487, + "loss": 0.0095, + "step": 190970 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015547219881843085, + "loss": 0.0123, + "step": 190980 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015546463112541683, + "loss": 0.0103, + "step": 190990 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015545706343240282, + "loss": 0.0124, + "step": 191000 + }, + { + "epoch": 0.96, + "eval_cer": 0.9144634631302844, + "eval_loss": 0.007862123660743237, + "eval_runtime": 115.5241, + "eval_samples_per_second": 17.312, + "eval_steps_per_second": 4.328, + "step": 191000 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015544949573938882, + "loss": 0.0109, + "step": 191010 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001554419280463748, + "loss": 0.0134, + "step": 191020 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001554343603533608, + "loss": 0.0088, + "step": 191030 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001554267926603468, + "loss": 0.0132, + "step": 191040 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015541922496733278, + "loss": 0.0101, + "step": 191050 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015541165727431876, + "loss": 0.0096, + "step": 191060 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015540408958130477, + "loss": 0.012, + "step": 191070 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015539652188829075, + "loss": 0.0157, + "step": 191080 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015538895419527673, + "loss": 0.0133, + "step": 191090 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015538138650226274, + "loss": 0.0113, + "step": 191100 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015537381880924872, + "loss": 0.0111, + "step": 191110 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001553662511162347, + "loss": 0.0125, + "step": 191120 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001553586834232207, + "loss": 0.0174, + "step": 191130 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001553511157302067, + "loss": 0.0111, + "step": 191140 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015534354803719267, + "loss": 0.0113, + "step": 191150 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015533598034417865, + "loss": 0.0129, + "step": 191160 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015532841265116466, + "loss": 0.0097, + "step": 191170 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015532084495815064, + "loss": 0.0103, + "step": 191180 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015531327726513663, + "loss": 0.0137, + "step": 191190 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015530570957212263, + "loss": 0.0101, + "step": 191200 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015529814187910862, + "loss": 0.0096, + "step": 191210 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001552905741860946, + "loss": 0.0109, + "step": 191220 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001552830064930806, + "loss": 0.0105, + "step": 191230 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001552754388000666, + "loss": 0.0102, + "step": 191240 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015526787110705257, + "loss": 0.0149, + "step": 191250 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015526030341403858, + "loss": 0.014, + "step": 191260 + }, + { + "epoch": 0.96, + "learning_rate": 0.00015525273572102456, + "loss": 0.0121, + "step": 191270 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015524516802801054, + "loss": 0.0118, + "step": 191280 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015523760033499655, + "loss": 0.0139, + "step": 191290 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015523003264198253, + "loss": 0.0105, + "step": 191300 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001552224649489685, + "loss": 0.0109, + "step": 191310 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001552148972559545, + "loss": 0.0119, + "step": 191320 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001552073295629405, + "loss": 0.0111, + "step": 191330 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015519976186992648, + "loss": 0.0105, + "step": 191340 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015519219417691247, + "loss": 0.0094, + "step": 191350 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015518462648389847, + "loss": 0.0137, + "step": 191360 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015517705879088446, + "loss": 0.0113, + "step": 191370 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015516949109787044, + "loss": 0.0098, + "step": 191380 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015516192340485645, + "loss": 0.0133, + "step": 191390 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015515435571184243, + "loss": 0.0125, + "step": 191400 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001551467880188284, + "loss": 0.0124, + "step": 191410 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015513922032581442, + "loss": 0.0136, + "step": 191420 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001551316526328004, + "loss": 0.015, + "step": 191430 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015512408493978638, + "loss": 0.0105, + "step": 191440 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001551165172467724, + "loss": 0.0105, + "step": 191450 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015510894955375837, + "loss": 0.0118, + "step": 191460 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015510138186074435, + "loss": 0.0096, + "step": 191470 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015509381416773036, + "loss": 0.0122, + "step": 191480 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015508624647471634, + "loss": 0.0097, + "step": 191490 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015507867878170232, + "loss": 0.0143, + "step": 191500 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001550711110886883, + "loss": 0.0116, + "step": 191510 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001550635433956743, + "loss": 0.0118, + "step": 191520 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001550559757026603, + "loss": 0.0116, + "step": 191530 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015504840800964628, + "loss": 0.0128, + "step": 191540 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015504084031663228, + "loss": 0.0136, + "step": 191550 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015503327262361827, + "loss": 0.01, + "step": 191560 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015502570493060425, + "loss": 0.0093, + "step": 191570 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015501813723759026, + "loss": 0.0115, + "step": 191580 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015501056954457624, + "loss": 0.0097, + "step": 191590 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015500300185156222, + "loss": 0.0102, + "step": 191600 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015499543415854823, + "loss": 0.0102, + "step": 191610 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001549878664655342, + "loss": 0.0096, + "step": 191620 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001549802987725202, + "loss": 0.0115, + "step": 191630 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001549727310795062, + "loss": 0.0141, + "step": 191640 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015496516338649218, + "loss": 0.0089, + "step": 191650 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015495759569347816, + "loss": 0.0128, + "step": 191660 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015495002800046414, + "loss": 0.0102, + "step": 191670 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015494246030745012, + "loss": 0.0107, + "step": 191680 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001549348926144361, + "loss": 0.0121, + "step": 191690 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001549273249214221, + "loss": 0.0103, + "step": 191700 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015491975722840807, + "loss": 0.011, + "step": 191710 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015491218953539408, + "loss": 0.0096, + "step": 191720 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015490462184238006, + "loss": 0.0097, + "step": 191730 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015489705414936604, + "loss": 0.0122, + "step": 191740 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015488948645635205, + "loss": 0.0105, + "step": 191750 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015488191876333803, + "loss": 0.0092, + "step": 191760 + }, + { + "epoch": 0.97, + "learning_rate": 0.000154874351070324, + "loss": 0.012, + "step": 191770 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015486678337731002, + "loss": 0.0089, + "step": 191780 + }, + { + "epoch": 0.97, + "learning_rate": 0.000154859215684296, + "loss": 0.0121, + "step": 191790 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015485164799128198, + "loss": 0.0087, + "step": 191800 + }, + { + "epoch": 0.97, + "learning_rate": 0.000154844080298268, + "loss": 0.0121, + "step": 191810 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015483651260525397, + "loss": 0.0108, + "step": 191820 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015482894491223995, + "loss": 0.0094, + "step": 191830 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015482137721922596, + "loss": 0.0091, + "step": 191840 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015481380952621194, + "loss": 0.0105, + "step": 191850 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015480624183319793, + "loss": 0.0096, + "step": 191860 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015479867414018393, + "loss": 0.0118, + "step": 191870 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015479110644716992, + "loss": 0.0118, + "step": 191880 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001547835387541559, + "loss": 0.0119, + "step": 191890 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015477597106114188, + "loss": 0.0101, + "step": 191900 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001547684033681279, + "loss": 0.0118, + "step": 191910 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015476083567511387, + "loss": 0.0104, + "step": 191920 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015475326798209985, + "loss": 0.0099, + "step": 191930 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015474570028908586, + "loss": 0.0072, + "step": 191940 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015473813259607184, + "loss": 0.0123, + "step": 191950 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015473056490305782, + "loss": 0.0141, + "step": 191960 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015472299721004383, + "loss": 0.012, + "step": 191970 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001547154295170298, + "loss": 0.0118, + "step": 191980 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001547078618240158, + "loss": 0.0105, + "step": 191990 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001547002941310018, + "loss": 0.0106, + "step": 192000 + }, + { + "epoch": 0.97, + "eval_cer": 0.9144411440194001, + "eval_loss": 0.008027549833059311, + "eval_runtime": 116.6747, + "eval_samples_per_second": 17.142, + "eval_steps_per_second": 4.285, + "step": 192000 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015469272643798778, + "loss": 0.0119, + "step": 192010 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015468515874497376, + "loss": 0.0099, + "step": 192020 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015467759105195977, + "loss": 0.0094, + "step": 192030 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015467002335894575, + "loss": 0.008, + "step": 192040 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015466245566593174, + "loss": 0.0118, + "step": 192050 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015465488797291772, + "loss": 0.0108, + "step": 192060 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015464732027990373, + "loss": 0.0099, + "step": 192070 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001546397525868897, + "loss": 0.0101, + "step": 192080 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001546321848938757, + "loss": 0.0125, + "step": 192090 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001546246172008617, + "loss": 0.0163, + "step": 192100 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015461704950784768, + "loss": 0.0126, + "step": 192110 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015460948181483366, + "loss": 0.0115, + "step": 192120 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015460191412181967, + "loss": 0.0102, + "step": 192130 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015459434642880565, + "loss": 0.0107, + "step": 192140 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015458677873579163, + "loss": 0.0112, + "step": 192150 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015457921104277764, + "loss": 0.0111, + "step": 192160 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015457164334976362, + "loss": 0.0125, + "step": 192170 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001545640756567496, + "loss": 0.0113, + "step": 192180 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001545565079637356, + "loss": 0.0102, + "step": 192190 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001545489402707216, + "loss": 0.0126, + "step": 192200 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015454137257770757, + "loss": 0.0102, + "step": 192210 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015453380488469356, + "loss": 0.0116, + "step": 192220 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015452623719167956, + "loss": 0.0105, + "step": 192230 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015451866949866555, + "loss": 0.0082, + "step": 192240 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015451110180565153, + "loss": 0.0119, + "step": 192250 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015450353411263754, + "loss": 0.0085, + "step": 192260 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015449596641962352, + "loss": 0.0105, + "step": 192270 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001544883987266095, + "loss": 0.0113, + "step": 192280 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001544808310335955, + "loss": 0.0121, + "step": 192290 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001544732633405815, + "loss": 0.0097, + "step": 192300 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015446569564756747, + "loss": 0.0103, + "step": 192310 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015445812795455348, + "loss": 0.0088, + "step": 192320 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015445056026153946, + "loss": 0.0123, + "step": 192330 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015444299256852544, + "loss": 0.0099, + "step": 192340 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015443542487551145, + "loss": 0.009, + "step": 192350 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015442785718249743, + "loss": 0.0097, + "step": 192360 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001544202894894834, + "loss": 0.0091, + "step": 192370 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015441272179646942, + "loss": 0.0096, + "step": 192380 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001544051541034554, + "loss": 0.0127, + "step": 192390 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015439758641044138, + "loss": 0.0105, + "step": 192400 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015439001871742737, + "loss": 0.0099, + "step": 192410 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015438245102441337, + "loss": 0.0112, + "step": 192420 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015437488333139936, + "loss": 0.012, + "step": 192430 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015436731563838534, + "loss": 0.0103, + "step": 192440 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015435974794537135, + "loss": 0.0123, + "step": 192450 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015435218025235733, + "loss": 0.0104, + "step": 192460 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001543446125593433, + "loss": 0.0112, + "step": 192470 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015433704486632932, + "loss": 0.0115, + "step": 192480 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001543294771733153, + "loss": 0.0091, + "step": 192490 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015432190948030128, + "loss": 0.0106, + "step": 192500 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001543143417872873, + "loss": 0.0088, + "step": 192510 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015430677409427327, + "loss": 0.0106, + "step": 192520 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015429920640125925, + "loss": 0.0108, + "step": 192530 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015429163870824526, + "loss": 0.0144, + "step": 192540 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015428407101523124, + "loss": 0.0077, + "step": 192550 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015427650332221722, + "loss": 0.0112, + "step": 192560 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001542689356292032, + "loss": 0.0129, + "step": 192570 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001542613679361892, + "loss": 0.007, + "step": 192580 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001542538002431752, + "loss": 0.0119, + "step": 192590 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015424623255016118, + "loss": 0.0097, + "step": 192600 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015423866485714718, + "loss": 0.0095, + "step": 192610 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015423109716413317, + "loss": 0.0093, + "step": 192620 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015422352947111915, + "loss": 0.0111, + "step": 192630 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015421596177810516, + "loss": 0.0098, + "step": 192640 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015420839408509114, + "loss": 0.0118, + "step": 192650 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015420082639207712, + "loss": 0.0117, + "step": 192660 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015419325869906313, + "loss": 0.0115, + "step": 192670 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001541856910060491, + "loss": 0.01, + "step": 192680 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001541781233130351, + "loss": 0.0101, + "step": 192690 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001541705556200211, + "loss": 0.012, + "step": 192700 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015416298792700708, + "loss": 0.0107, + "step": 192710 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015415542023399306, + "loss": 0.012, + "step": 192720 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015414785254097904, + "loss": 0.0115, + "step": 192730 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015414028484796505, + "loss": 0.0107, + "step": 192740 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015413271715495103, + "loss": 0.0091, + "step": 192750 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015412514946193701, + "loss": 0.009, + "step": 192760 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015411758176892302, + "loss": 0.0102, + "step": 192770 + }, + { + "epoch": 0.97, + "learning_rate": 0.000154110014075909, + "loss": 0.0153, + "step": 192780 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015410244638289499, + "loss": 0.0095, + "step": 192790 + }, + { + "epoch": 0.97, + "learning_rate": 0.000154094878689881, + "loss": 0.01, + "step": 192800 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015408731099686698, + "loss": 0.0119, + "step": 192810 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015407974330385296, + "loss": 0.0095, + "step": 192820 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015407217561083897, + "loss": 0.0129, + "step": 192830 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015406460791782495, + "loss": 0.0119, + "step": 192840 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015405704022481093, + "loss": 0.0105, + "step": 192850 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015404947253179694, + "loss": 0.012, + "step": 192860 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015404190483878292, + "loss": 0.0119, + "step": 192870 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001540343371457689, + "loss": 0.0109, + "step": 192880 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015402676945275488, + "loss": 0.0098, + "step": 192890 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001540192017597409, + "loss": 0.0125, + "step": 192900 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015401163406672687, + "loss": 0.0094, + "step": 192910 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015400406637371285, + "loss": 0.0079, + "step": 192920 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015399649868069886, + "loss": 0.0101, + "step": 192930 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015398893098768482, + "loss": 0.01, + "step": 192940 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001539813632946708, + "loss": 0.0104, + "step": 192950 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015397379560165678, + "loss": 0.0133, + "step": 192960 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001539662279086428, + "loss": 0.008, + "step": 192970 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015395866021562877, + "loss": 0.0126, + "step": 192980 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015395109252261475, + "loss": 0.009, + "step": 192990 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015394352482960076, + "loss": 0.0111, + "step": 193000 + }, + { + "epoch": 0.97, + "eval_cer": 0.9144644335264098, + "eval_loss": 0.008065390400588512, + "eval_runtime": 116.6291, + "eval_samples_per_second": 17.148, + "eval_steps_per_second": 4.287, + "step": 193000 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015393595713658674, + "loss": 0.012, + "step": 193010 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015392838944357272, + "loss": 0.0106, + "step": 193020 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015392082175055873, + "loss": 0.0099, + "step": 193030 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001539132540575447, + "loss": 0.0106, + "step": 193040 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001539056863645307, + "loss": 0.0093, + "step": 193050 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001538981186715167, + "loss": 0.0099, + "step": 193060 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015389055097850268, + "loss": 0.0127, + "step": 193070 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015388298328548866, + "loss": 0.0098, + "step": 193080 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015387541559247467, + "loss": 0.0118, + "step": 193090 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015386784789946065, + "loss": 0.0098, + "step": 193100 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015386028020644664, + "loss": 0.0134, + "step": 193110 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015385271251343262, + "loss": 0.0149, + "step": 193120 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015384514482041863, + "loss": 0.0102, + "step": 193130 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001538375771274046, + "loss": 0.012, + "step": 193140 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001538300094343906, + "loss": 0.0105, + "step": 193150 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001538224417413766, + "loss": 0.0114, + "step": 193160 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015381487404836258, + "loss": 0.0105, + "step": 193170 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015380730635534856, + "loss": 0.0096, + "step": 193180 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015379973866233457, + "loss": 0.0123, + "step": 193190 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015379217096932055, + "loss": 0.0125, + "step": 193200 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015378460327630653, + "loss": 0.0095, + "step": 193210 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015377703558329254, + "loss": 0.0122, + "step": 193220 + }, + { + "epoch": 0.97, + "learning_rate": 0.00015376946789027852, + "loss": 0.0094, + "step": 193230 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001537619001972645, + "loss": 0.0091, + "step": 193240 + }, + { + "epoch": 0.97, + "learning_rate": 0.0001537543325042505, + "loss": 0.0111, + "step": 193250 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001537467648112365, + "loss": 0.0102, + "step": 193260 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015373919711822247, + "loss": 0.0114, + "step": 193270 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015373162942520846, + "loss": 0.0129, + "step": 193280 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015372406173219446, + "loss": 0.0123, + "step": 193290 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015371649403918045, + "loss": 0.0087, + "step": 193300 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015370892634616643, + "loss": 0.0124, + "step": 193310 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015370135865315244, + "loss": 0.0096, + "step": 193320 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015369379096013842, + "loss": 0.012, + "step": 193330 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001536862232671244, + "loss": 0.0097, + "step": 193340 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001536786555741104, + "loss": 0.0152, + "step": 193350 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001536710878810964, + "loss": 0.012, + "step": 193360 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015366352018808237, + "loss": 0.0105, + "step": 193370 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015365595249506838, + "loss": 0.012, + "step": 193380 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015364838480205436, + "loss": 0.0124, + "step": 193390 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015364081710904034, + "loss": 0.0136, + "step": 193400 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015363324941602635, + "loss": 0.0138, + "step": 193410 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015362568172301233, + "loss": 0.0086, + "step": 193420 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001536181140299983, + "loss": 0.013, + "step": 193430 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015361054633698432, + "loss": 0.0126, + "step": 193440 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001536029786439703, + "loss": 0.012, + "step": 193450 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015359541095095628, + "loss": 0.0092, + "step": 193460 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015358784325794227, + "loss": 0.0109, + "step": 193470 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015358027556492827, + "loss": 0.009, + "step": 193480 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015357270787191426, + "loss": 0.008, + "step": 193490 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015356514017890024, + "loss": 0.0128, + "step": 193500 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015355757248588625, + "loss": 0.0126, + "step": 193510 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015355000479287223, + "loss": 0.0099, + "step": 193520 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001535424370998582, + "loss": 0.0096, + "step": 193530 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015353486940684422, + "loss": 0.015, + "step": 193540 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001535273017138302, + "loss": 0.0099, + "step": 193550 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015351973402081618, + "loss": 0.0115, + "step": 193560 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001535121663278022, + "loss": 0.0111, + "step": 193570 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015350459863478817, + "loss": 0.0124, + "step": 193580 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015349703094177415, + "loss": 0.0122, + "step": 193590 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015348946324876016, + "loss": 0.0093, + "step": 193600 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015348189555574614, + "loss": 0.0123, + "step": 193610 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015347432786273212, + "loss": 0.0137, + "step": 193620 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001534667601697181, + "loss": 0.0125, + "step": 193630 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001534591924767041, + "loss": 0.0102, + "step": 193640 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001534516247836901, + "loss": 0.0126, + "step": 193650 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015344405709067608, + "loss": 0.0097, + "step": 193660 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015343648939766208, + "loss": 0.009, + "step": 193670 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015342892170464807, + "loss": 0.0105, + "step": 193680 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015342135401163405, + "loss": 0.0094, + "step": 193690 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015341378631862006, + "loss": 0.0143, + "step": 193700 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015340621862560604, + "loss": 0.0107, + "step": 193710 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015339865093259202, + "loss": 0.01, + "step": 193720 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015339108323957803, + "loss": 0.0105, + "step": 193730 + }, + { + "epoch": 0.98, + "learning_rate": 0.000153383515546564, + "loss": 0.0106, + "step": 193740 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015337594785355, + "loss": 0.0155, + "step": 193750 + }, + { + "epoch": 0.98, + "learning_rate": 0.000153368380160536, + "loss": 0.0095, + "step": 193760 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015336081246752198, + "loss": 0.0122, + "step": 193770 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015335324477450796, + "loss": 0.0157, + "step": 193780 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015334567708149394, + "loss": 0.0108, + "step": 193790 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015333810938847995, + "loss": 0.0107, + "step": 193800 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015333054169546593, + "loss": 0.0117, + "step": 193810 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015332297400245191, + "loss": 0.0104, + "step": 193820 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015331540630943792, + "loss": 0.0082, + "step": 193830 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001533078386164239, + "loss": 0.0086, + "step": 193840 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015330027092340989, + "loss": 0.0109, + "step": 193850 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001532927032303959, + "loss": 0.0091, + "step": 193860 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015328513553738188, + "loss": 0.0115, + "step": 193870 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015327756784436786, + "loss": 0.0104, + "step": 193880 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015327000015135387, + "loss": 0.013, + "step": 193890 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015326243245833985, + "loss": 0.0127, + "step": 193900 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015325486476532583, + "loss": 0.0122, + "step": 193910 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015324729707231184, + "loss": 0.0101, + "step": 193920 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015323972937929782, + "loss": 0.0115, + "step": 193930 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001532321616862838, + "loss": 0.0139, + "step": 193940 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001532245939932698, + "loss": 0.0138, + "step": 193950 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001532170263002558, + "loss": 0.0119, + "step": 193960 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015320945860724177, + "loss": 0.0128, + "step": 193970 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015320189091422775, + "loss": 0.0111, + "step": 193980 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015319432322121376, + "loss": 0.012, + "step": 193990 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015318675552819974, + "loss": 0.0134, + "step": 194000 + }, + { + "epoch": 0.98, + "eval_cer": 0.9144683151109114, + "eval_loss": 0.007887054234743118, + "eval_runtime": 116.7404, + "eval_samples_per_second": 17.132, + "eval_steps_per_second": 4.283, + "step": 194000 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015317918783518572, + "loss": 0.0082, + "step": 194010 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015317162014217173, + "loss": 0.0086, + "step": 194020 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015316405244915771, + "loss": 0.0106, + "step": 194030 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001531564847561437, + "loss": 0.0085, + "step": 194040 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001531489170631297, + "loss": 0.0112, + "step": 194050 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015314134937011569, + "loss": 0.0109, + "step": 194060 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015313378167710167, + "loss": 0.0111, + "step": 194070 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015312621398408768, + "loss": 0.0089, + "step": 194080 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015311864629107366, + "loss": 0.0121, + "step": 194090 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015311107859805964, + "loss": 0.0137, + "step": 194100 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015310351090504565, + "loss": 0.0094, + "step": 194110 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015309594321203163, + "loss": 0.0129, + "step": 194120 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001530883755190176, + "loss": 0.0112, + "step": 194130 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001530808078260036, + "loss": 0.0109, + "step": 194140 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001530732401329896, + "loss": 0.0101, + "step": 194150 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015306567243997558, + "loss": 0.0143, + "step": 194160 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015305810474696156, + "loss": 0.0102, + "step": 194170 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015305053705394757, + "loss": 0.0096, + "step": 194180 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015304296936093353, + "loss": 0.0097, + "step": 194190 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001530354016679195, + "loss": 0.0104, + "step": 194200 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001530278339749055, + "loss": 0.0098, + "step": 194210 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001530202662818915, + "loss": 0.0093, + "step": 194220 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015301269858887748, + "loss": 0.0117, + "step": 194230 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015300513089586346, + "loss": 0.0089, + "step": 194240 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015299756320284947, + "loss": 0.0105, + "step": 194250 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015298999550983545, + "loss": 0.0093, + "step": 194260 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015298242781682143, + "loss": 0.0135, + "step": 194270 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015297486012380744, + "loss": 0.0088, + "step": 194280 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015296729243079342, + "loss": 0.0123, + "step": 194290 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001529597247377794, + "loss": 0.0091, + "step": 194300 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001529521570447654, + "loss": 0.0092, + "step": 194310 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001529445893517514, + "loss": 0.0111, + "step": 194320 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015293702165873737, + "loss": 0.0114, + "step": 194330 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015292945396572338, + "loss": 0.012, + "step": 194340 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015292188627270936, + "loss": 0.0145, + "step": 194350 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015291431857969535, + "loss": 0.01, + "step": 194360 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015290675088668133, + "loss": 0.0097, + "step": 194370 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015289918319366734, + "loss": 0.0097, + "step": 194380 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015289161550065332, + "loss": 0.0125, + "step": 194390 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001528840478076393, + "loss": 0.0107, + "step": 194400 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001528764801146253, + "loss": 0.0139, + "step": 194410 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001528689124216113, + "loss": 0.0107, + "step": 194420 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015286134472859727, + "loss": 0.0116, + "step": 194430 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015285377703558328, + "loss": 0.0113, + "step": 194440 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015284620934256926, + "loss": 0.0108, + "step": 194450 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015283864164955524, + "loss": 0.0131, + "step": 194460 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015283107395654125, + "loss": 0.0117, + "step": 194470 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015282350626352723, + "loss": 0.0105, + "step": 194480 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001528159385705132, + "loss": 0.0112, + "step": 194490 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015280837087749922, + "loss": 0.0104, + "step": 194500 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001528008031844852, + "loss": 0.0089, + "step": 194510 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015279323549147118, + "loss": 0.0178, + "step": 194520 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015278566779845717, + "loss": 0.0098, + "step": 194530 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015277810010544317, + "loss": 0.0131, + "step": 194540 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015277053241242916, + "loss": 0.0108, + "step": 194550 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015276296471941514, + "loss": 0.0086, + "step": 194560 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015275539702640115, + "loss": 0.0103, + "step": 194570 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015274782933338713, + "loss": 0.0094, + "step": 194580 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001527402616403731, + "loss": 0.0123, + "step": 194590 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015273269394735912, + "loss": 0.009, + "step": 194600 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001527251262543451, + "loss": 0.0103, + "step": 194610 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015271755856133108, + "loss": 0.0107, + "step": 194620 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001527099908683171, + "loss": 0.0152, + "step": 194630 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015270242317530307, + "loss": 0.0113, + "step": 194640 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015269485548228905, + "loss": 0.0099, + "step": 194650 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015268728778927506, + "loss": 0.014, + "step": 194660 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015267972009626104, + "loss": 0.0133, + "step": 194670 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015267215240324702, + "loss": 0.0085, + "step": 194680 + }, + { + "epoch": 0.98, + "learning_rate": 0.000152664584710233, + "loss": 0.0111, + "step": 194690 + }, + { + "epoch": 0.98, + "learning_rate": 0.000152657017017219, + "loss": 0.0128, + "step": 194700 + }, + { + "epoch": 0.98, + "learning_rate": 0.000152649449324205, + "loss": 0.0087, + "step": 194710 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015264188163119098, + "loss": 0.0094, + "step": 194720 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015263431393817698, + "loss": 0.0116, + "step": 194730 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015262674624516297, + "loss": 0.0089, + "step": 194740 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015261917855214895, + "loss": 0.011, + "step": 194750 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015261161085913496, + "loss": 0.0102, + "step": 194760 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015260404316612094, + "loss": 0.0115, + "step": 194770 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015259647547310692, + "loss": 0.0125, + "step": 194780 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015258890778009293, + "loss": 0.0104, + "step": 194790 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001525813400870789, + "loss": 0.0103, + "step": 194800 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001525737723940649, + "loss": 0.0087, + "step": 194810 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001525662047010509, + "loss": 0.0113, + "step": 194820 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015255863700803688, + "loss": 0.0118, + "step": 194830 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015255106931502286, + "loss": 0.009, + "step": 194840 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015254350162200887, + "loss": 0.0114, + "step": 194850 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015253593392899485, + "loss": 0.0105, + "step": 194860 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015252836623598083, + "loss": 0.0108, + "step": 194870 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015252079854296681, + "loss": 0.01, + "step": 194880 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015251323084995282, + "loss": 0.0099, + "step": 194890 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001525056631569388, + "loss": 0.014, + "step": 194900 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015249809546392479, + "loss": 0.0111, + "step": 194910 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001524905277709108, + "loss": 0.0115, + "step": 194920 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015248296007789678, + "loss": 0.0086, + "step": 194930 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015247539238488276, + "loss": 0.0092, + "step": 194940 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015246782469186877, + "loss": 0.0107, + "step": 194950 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015246025699885475, + "loss": 0.0105, + "step": 194960 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015245268930584073, + "loss": 0.0094, + "step": 194970 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015244512161282674, + "loss": 0.0114, + "step": 194980 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015243755391981272, + "loss": 0.0114, + "step": 194990 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001524299862267987, + "loss": 0.0132, + "step": 195000 + }, + { + "epoch": 0.98, + "eval_cer": 0.9144712262992877, + "eval_loss": 0.007762947119772434, + "eval_runtime": 116.6633, + "eval_samples_per_second": 17.143, + "eval_steps_per_second": 4.286, + "step": 195000 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001524224185337847, + "loss": 0.0093, + "step": 195010 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001524148508407707, + "loss": 0.0135, + "step": 195020 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015240728314775667, + "loss": 0.0125, + "step": 195030 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015239971545474265, + "loss": 0.011, + "step": 195040 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015239214776172866, + "loss": 0.0137, + "step": 195050 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015238458006871464, + "loss": 0.0117, + "step": 195060 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015237701237570062, + "loss": 0.0097, + "step": 195070 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015236944468268663, + "loss": 0.0099, + "step": 195080 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015236187698967261, + "loss": 0.0106, + "step": 195090 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001523543092966586, + "loss": 0.01, + "step": 195100 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001523467416036446, + "loss": 0.0105, + "step": 195110 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015233917391063059, + "loss": 0.0126, + "step": 195120 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015233160621761657, + "loss": 0.0124, + "step": 195130 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015232403852460258, + "loss": 0.0135, + "step": 195140 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015231647083158856, + "loss": 0.0106, + "step": 195150 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015230890313857454, + "loss": 0.0124, + "step": 195160 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015230133544556055, + "loss": 0.0138, + "step": 195170 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015229376775254653, + "loss": 0.0099, + "step": 195180 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001522862000595325, + "loss": 0.0104, + "step": 195190 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001522786323665185, + "loss": 0.0143, + "step": 195200 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001522710646735045, + "loss": 0.0134, + "step": 195210 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015226349698049048, + "loss": 0.0109, + "step": 195220 + }, + { + "epoch": 0.98, + "learning_rate": 0.00015225592928747646, + "loss": 0.012, + "step": 195230 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015224836159446247, + "loss": 0.0086, + "step": 195240 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015224079390144845, + "loss": 0.0093, + "step": 195250 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015223322620843443, + "loss": 0.0089, + "step": 195260 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015222565851542044, + "loss": 0.0094, + "step": 195270 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015221809082240642, + "loss": 0.0097, + "step": 195280 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001522105231293924, + "loss": 0.0091, + "step": 195290 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015220295543637841, + "loss": 0.0097, + "step": 195300 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001521953877433644, + "loss": 0.0132, + "step": 195310 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015218782005035038, + "loss": 0.0126, + "step": 195320 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015218025235733639, + "loss": 0.009, + "step": 195330 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015217268466432237, + "loss": 0.0102, + "step": 195340 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015216511697130835, + "loss": 0.0111, + "step": 195350 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015215754927829436, + "loss": 0.0133, + "step": 195360 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015214998158528034, + "loss": 0.0106, + "step": 195370 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015214241389226632, + "loss": 0.0111, + "step": 195380 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001521348461992523, + "loss": 0.0114, + "step": 195390 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001521272785062383, + "loss": 0.0075, + "step": 195400 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001521197108132243, + "loss": 0.0108, + "step": 195410 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015211214312021027, + "loss": 0.0077, + "step": 195420 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015210457542719628, + "loss": 0.0118, + "step": 195430 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015209700773418226, + "loss": 0.0112, + "step": 195440 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015208944004116822, + "loss": 0.0097, + "step": 195450 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001520818723481542, + "loss": 0.0108, + "step": 195460 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001520743046551402, + "loss": 0.0113, + "step": 195470 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001520667369621262, + "loss": 0.0109, + "step": 195480 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015205916926911217, + "loss": 0.0128, + "step": 195490 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015205160157609818, + "loss": 0.0097, + "step": 195500 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015204403388308416, + "loss": 0.0096, + "step": 195510 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015203646619007014, + "loss": 0.0098, + "step": 195520 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015202889849705615, + "loss": 0.0086, + "step": 195530 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015202133080404213, + "loss": 0.0157, + "step": 195540 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001520137631110281, + "loss": 0.0133, + "step": 195550 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015200619541801412, + "loss": 0.0097, + "step": 195560 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001519986277250001, + "loss": 0.0097, + "step": 195570 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015199106003198608, + "loss": 0.0118, + "step": 195580 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015198349233897207, + "loss": 0.0098, + "step": 195590 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015197592464595807, + "loss": 0.0127, + "step": 195600 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015196835695294406, + "loss": 0.0136, + "step": 195610 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015196078925993004, + "loss": 0.0123, + "step": 195620 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015195322156691605, + "loss": 0.0114, + "step": 195630 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015194565387390203, + "loss": 0.0092, + "step": 195640 + }, + { + "epoch": 0.99, + "learning_rate": 0.000151938086180888, + "loss": 0.0101, + "step": 195650 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015193051848787402, + "loss": 0.0125, + "step": 195660 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015192295079486, + "loss": 0.0104, + "step": 195670 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015191538310184598, + "loss": 0.0102, + "step": 195680 + }, + { + "epoch": 0.99, + "learning_rate": 0.000151907815408832, + "loss": 0.0131, + "step": 195690 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015190024771581797, + "loss": 0.0127, + "step": 195700 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015189268002280395, + "loss": 0.0101, + "step": 195710 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015188511232978996, + "loss": 0.0131, + "step": 195720 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015187754463677594, + "loss": 0.0087, + "step": 195730 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015186997694376192, + "loss": 0.0106, + "step": 195740 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015186240925074793, + "loss": 0.0141, + "step": 195750 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001518548415577339, + "loss": 0.0104, + "step": 195760 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001518472738647199, + "loss": 0.0098, + "step": 195770 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015183970617170588, + "loss": 0.0118, + "step": 195780 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015183213847869188, + "loss": 0.0087, + "step": 195790 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015182457078567787, + "loss": 0.0139, + "step": 195800 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015181700309266385, + "loss": 0.0104, + "step": 195810 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015180943539964986, + "loss": 0.0083, + "step": 195820 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015180186770663584, + "loss": 0.0112, + "step": 195830 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015179430001362182, + "loss": 0.0091, + "step": 195840 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015178673232060783, + "loss": 0.0149, + "step": 195850 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001517791646275938, + "loss": 0.0119, + "step": 195860 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001517715969345798, + "loss": 0.0122, + "step": 195870 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001517640292415658, + "loss": 0.0137, + "step": 195880 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015175646154855178, + "loss": 0.0138, + "step": 195890 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015174889385553776, + "loss": 0.0124, + "step": 195900 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015174132616252377, + "loss": 0.0103, + "step": 195910 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015173375846950975, + "loss": 0.0112, + "step": 195920 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015172619077649573, + "loss": 0.0118, + "step": 195930 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015171862308348171, + "loss": 0.0128, + "step": 195940 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015171105539046772, + "loss": 0.0135, + "step": 195950 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001517034876974537, + "loss": 0.0157, + "step": 195960 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015169592000443969, + "loss": 0.0106, + "step": 195970 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001516883523114257, + "loss": 0.0113, + "step": 195980 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015168078461841168, + "loss": 0.0105, + "step": 195990 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015167321692539766, + "loss": 0.01, + "step": 196000 + }, + { + "epoch": 0.99, + "eval_cer": 0.9144450256039017, + "eval_loss": 0.007811464369297028, + "eval_runtime": 116.6323, + "eval_samples_per_second": 17.148, + "eval_steps_per_second": 4.287, + "step": 196000 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015166564923238367, + "loss": 0.008, + "step": 196010 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015165808153936965, + "loss": 0.0087, + "step": 196020 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015165051384635563, + "loss": 0.0119, + "step": 196030 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015164294615334164, + "loss": 0.012, + "step": 196040 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015163537846032762, + "loss": 0.0102, + "step": 196050 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001516278107673136, + "loss": 0.0088, + "step": 196060 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001516202430742996, + "loss": 0.0115, + "step": 196070 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001516126753812856, + "loss": 0.0124, + "step": 196080 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015160510768827157, + "loss": 0.0101, + "step": 196090 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015159753999525755, + "loss": 0.0102, + "step": 196100 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015158997230224356, + "loss": 0.0099, + "step": 196110 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015158240460922954, + "loss": 0.0108, + "step": 196120 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015157483691621552, + "loss": 0.0086, + "step": 196130 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015156726922320153, + "loss": 0.0108, + "step": 196140 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015155970153018751, + "loss": 0.01, + "step": 196150 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001515521338371735, + "loss": 0.0099, + "step": 196160 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001515445661441595, + "loss": 0.0139, + "step": 196170 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015153699845114549, + "loss": 0.0098, + "step": 196180 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015152943075813147, + "loss": 0.0104, + "step": 196190 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015152186306511748, + "loss": 0.0084, + "step": 196200 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015151429537210346, + "loss": 0.0101, + "step": 196210 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015150672767908944, + "loss": 0.0088, + "step": 196220 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015149915998607545, + "loss": 0.0108, + "step": 196230 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015149159229306143, + "loss": 0.0084, + "step": 196240 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001514840246000474, + "loss": 0.0101, + "step": 196250 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015147645690703342, + "loss": 0.0127, + "step": 196260 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001514688892140194, + "loss": 0.0091, + "step": 196270 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015146132152100538, + "loss": 0.0094, + "step": 196280 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015145375382799136, + "loss": 0.0096, + "step": 196290 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015144618613497737, + "loss": 0.0099, + "step": 196300 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015143861844196335, + "loss": 0.0109, + "step": 196310 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015143105074894933, + "loss": 0.0106, + "step": 196320 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015142348305593534, + "loss": 0.0102, + "step": 196330 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015141591536292132, + "loss": 0.0124, + "step": 196340 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001514083476699073, + "loss": 0.0113, + "step": 196350 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015140077997689331, + "loss": 0.0102, + "step": 196360 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001513932122838793, + "loss": 0.0113, + "step": 196370 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015138564459086528, + "loss": 0.012, + "step": 196380 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015137807689785129, + "loss": 0.0122, + "step": 196390 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015137050920483727, + "loss": 0.0109, + "step": 196400 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015136294151182325, + "loss": 0.0115, + "step": 196410 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015135537381880926, + "loss": 0.0084, + "step": 196420 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015134780612579524, + "loss": 0.0127, + "step": 196430 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015134023843278122, + "loss": 0.0121, + "step": 196440 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001513326707397672, + "loss": 0.0089, + "step": 196450 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001513251030467532, + "loss": 0.0097, + "step": 196460 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001513175353537392, + "loss": 0.0083, + "step": 196470 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015130996766072517, + "loss": 0.0098, + "step": 196480 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015130239996771118, + "loss": 0.0106, + "step": 196490 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015129483227469716, + "loss": 0.0163, + "step": 196500 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015128726458168314, + "loss": 0.0097, + "step": 196510 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015127969688866915, + "loss": 0.0095, + "step": 196520 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015127212919565513, + "loss": 0.0121, + "step": 196530 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015126456150264112, + "loss": 0.0082, + "step": 196540 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015125699380962712, + "loss": 0.0093, + "step": 196550 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001512494261166131, + "loss": 0.0099, + "step": 196560 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001512418584235991, + "loss": 0.0099, + "step": 196570 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001512342907305851, + "loss": 0.0079, + "step": 196580 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015122672303757108, + "loss": 0.0116, + "step": 196590 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015121915534455706, + "loss": 0.0108, + "step": 196600 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015121158765154304, + "loss": 0.0091, + "step": 196610 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015120401995852905, + "loss": 0.0125, + "step": 196620 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015119645226551503, + "loss": 0.0112, + "step": 196630 + }, + { + "epoch": 0.99, + "learning_rate": 0.000151188884572501, + "loss": 0.0094, + "step": 196640 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015118131687948702, + "loss": 0.0148, + "step": 196650 + }, + { + "epoch": 0.99, + "learning_rate": 0.000151173749186473, + "loss": 0.0133, + "step": 196660 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015116618149345898, + "loss": 0.0141, + "step": 196670 + }, + { + "epoch": 0.99, + "learning_rate": 0.000151158613800445, + "loss": 0.0078, + "step": 196680 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015115104610743097, + "loss": 0.0129, + "step": 196690 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015114347841441695, + "loss": 0.0119, + "step": 196700 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001511359107214029, + "loss": 0.0118, + "step": 196710 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015112834302838892, + "loss": 0.0108, + "step": 196720 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001511207753353749, + "loss": 0.0094, + "step": 196730 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015111320764236088, + "loss": 0.0107, + "step": 196740 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001511056399493469, + "loss": 0.0111, + "step": 196750 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015109807225633287, + "loss": 0.0135, + "step": 196760 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015109050456331885, + "loss": 0.0098, + "step": 196770 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015108293687030486, + "loss": 0.0173, + "step": 196780 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015107536917729084, + "loss": 0.011, + "step": 196790 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015106780148427682, + "loss": 0.011, + "step": 196800 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015106023379126283, + "loss": 0.0121, + "step": 196810 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001510526660982488, + "loss": 0.0112, + "step": 196820 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001510450984052348, + "loss": 0.0111, + "step": 196830 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015103753071222078, + "loss": 0.0096, + "step": 196840 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015102996301920678, + "loss": 0.0128, + "step": 196850 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015102239532619277, + "loss": 0.0096, + "step": 196860 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015101482763317875, + "loss": 0.0112, + "step": 196870 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015100725994016476, + "loss": 0.0132, + "step": 196880 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015099969224715074, + "loss": 0.0111, + "step": 196890 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015099212455413672, + "loss": 0.0099, + "step": 196900 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015098455686112273, + "loss": 0.0134, + "step": 196910 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001509769891681087, + "loss": 0.0098, + "step": 196920 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001509694214750947, + "loss": 0.0121, + "step": 196930 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001509618537820807, + "loss": 0.0112, + "step": 196940 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015095428608906668, + "loss": 0.0115, + "step": 196950 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015094671839605266, + "loss": 0.0111, + "step": 196960 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015093915070303867, + "loss": 0.0105, + "step": 196970 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015093158301002465, + "loss": 0.0087, + "step": 196980 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015092401531701063, + "loss": 0.0118, + "step": 196990 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015091644762399662, + "loss": 0.0106, + "step": 197000 + }, + { + "epoch": 0.99, + "eval_cer": 0.9144877230334195, + "eval_loss": 0.007818542420864105, + "eval_runtime": 116.7928, + "eval_samples_per_second": 17.124, + "eval_steps_per_second": 4.281, + "step": 197000 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015090887993098262, + "loss": 0.0102, + "step": 197010 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001509013122379686, + "loss": 0.0127, + "step": 197020 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001508937445449546, + "loss": 0.0101, + "step": 197030 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001508861768519406, + "loss": 0.0111, + "step": 197040 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015087860915892658, + "loss": 0.0098, + "step": 197050 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015087104146591256, + "loss": 0.0121, + "step": 197060 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015086347377289857, + "loss": 0.0101, + "step": 197070 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015085590607988455, + "loss": 0.0107, + "step": 197080 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015084833838687053, + "loss": 0.0124, + "step": 197090 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015084077069385654, + "loss": 0.0102, + "step": 197100 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015083320300084252, + "loss": 0.0111, + "step": 197110 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001508256353078285, + "loss": 0.0092, + "step": 197120 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001508180676148145, + "loss": 0.0094, + "step": 197130 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001508104999218005, + "loss": 0.0127, + "step": 197140 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015080293222878647, + "loss": 0.0106, + "step": 197150 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015079536453577245, + "loss": 0.0106, + "step": 197160 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015078779684275846, + "loss": 0.0103, + "step": 197170 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015078022914974444, + "loss": 0.0134, + "step": 197180 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015077266145673043, + "loss": 0.0124, + "step": 197190 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015076509376371643, + "loss": 0.0109, + "step": 197200 + }, + { + "epoch": 0.99, + "learning_rate": 0.00015075752607070242, + "loss": 0.016, + "step": 197210 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001507499583776884, + "loss": 0.0101, + "step": 197220 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001507423906846744, + "loss": 0.0101, + "step": 197230 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001507348229916604, + "loss": 0.0124, + "step": 197240 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015072725529864637, + "loss": 0.011, + "step": 197250 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015071968760563238, + "loss": 0.0118, + "step": 197260 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015071211991261836, + "loss": 0.0135, + "step": 197270 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015070455221960434, + "loss": 0.0103, + "step": 197280 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015069698452659035, + "loss": 0.0112, + "step": 197290 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015068941683357633, + "loss": 0.0096, + "step": 197300 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001506818491405623, + "loss": 0.0117, + "step": 197310 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015067428144754832, + "loss": 0.0114, + "step": 197320 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001506667137545343, + "loss": 0.0112, + "step": 197330 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015065914606152028, + "loss": 0.0129, + "step": 197340 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015065157836850626, + "loss": 0.0166, + "step": 197350 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015064401067549227, + "loss": 0.0115, + "step": 197360 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015063644298247825, + "loss": 0.0096, + "step": 197370 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015062887528946424, + "loss": 0.0094, + "step": 197380 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015062130759645024, + "loss": 0.0089, + "step": 197390 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015061373990343623, + "loss": 0.0114, + "step": 197400 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001506061722104222, + "loss": 0.008, + "step": 197410 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015059860451740822, + "loss": 0.0102, + "step": 197420 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001505910368243942, + "loss": 0.0113, + "step": 197430 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015058346913138018, + "loss": 0.0086, + "step": 197440 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001505759014383662, + "loss": 0.0109, + "step": 197450 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015056833374535217, + "loss": 0.0096, + "step": 197460 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015056076605233815, + "loss": 0.0111, + "step": 197470 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015055319835932416, + "loss": 0.0107, + "step": 197480 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015054563066631014, + "loss": 0.0103, + "step": 197490 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015053806297329612, + "loss": 0.0103, + "step": 197500 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001505304952802821, + "loss": 0.0098, + "step": 197510 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001505229275872681, + "loss": 0.0097, + "step": 197520 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001505153598942541, + "loss": 0.0122, + "step": 197530 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015050779220124007, + "loss": 0.0116, + "step": 197540 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015050022450822608, + "loss": 0.0107, + "step": 197550 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015049265681521206, + "loss": 0.0085, + "step": 197560 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015048508912219805, + "loss": 0.0086, + "step": 197570 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015047752142918405, + "loss": 0.0131, + "step": 197580 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015046995373617004, + "loss": 0.0094, + "step": 197590 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015046238604315602, + "loss": 0.0102, + "step": 197600 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015045481835014203, + "loss": 0.0099, + "step": 197610 + }, + { + "epoch": 1.0, + "learning_rate": 0.000150447250657128, + "loss": 0.0079, + "step": 197620 + }, + { + "epoch": 1.0, + "learning_rate": 0.000150439682964114, + "loss": 0.011, + "step": 197630 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001504321152711, + "loss": 0.0078, + "step": 197640 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015042454757808598, + "loss": 0.0097, + "step": 197650 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015041697988507196, + "loss": 0.0119, + "step": 197660 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015040941219205794, + "loss": 0.011, + "step": 197670 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015040184449904395, + "loss": 0.0128, + "step": 197680 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015039427680602993, + "loss": 0.0114, + "step": 197690 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001503867091130159, + "loss": 0.0098, + "step": 197700 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015037914142000192, + "loss": 0.0092, + "step": 197710 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001503715737269879, + "loss": 0.0114, + "step": 197720 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015036400603397388, + "loss": 0.0096, + "step": 197730 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001503564383409599, + "loss": 0.0112, + "step": 197740 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015034887064794587, + "loss": 0.0099, + "step": 197750 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015034130295493186, + "loss": 0.0086, + "step": 197760 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015033373526191786, + "loss": 0.0073, + "step": 197770 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015032616756890385, + "loss": 0.0081, + "step": 197780 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015031859987588983, + "loss": 0.0086, + "step": 197790 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015031103218287584, + "loss": 0.0102, + "step": 197800 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015030346448986182, + "loss": 0.0136, + "step": 197810 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001502958967968478, + "loss": 0.011, + "step": 197820 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001502883291038338, + "loss": 0.013, + "step": 197830 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001502807614108198, + "loss": 0.0079, + "step": 197840 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015027319371780577, + "loss": 0.0102, + "step": 197850 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015026562602479175, + "loss": 0.0109, + "step": 197860 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015025805833177776, + "loss": 0.0102, + "step": 197870 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015025049063876374, + "loss": 0.0104, + "step": 197880 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015024292294574972, + "loss": 0.0114, + "step": 197890 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015023535525273573, + "loss": 0.0141, + "step": 197900 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001502277875597217, + "loss": 0.0093, + "step": 197910 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001502202198667077, + "loss": 0.0095, + "step": 197920 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001502126521736937, + "loss": 0.0093, + "step": 197930 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015020508448067968, + "loss": 0.0118, + "step": 197940 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015019751678766567, + "loss": 0.009, + "step": 197950 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015018994909465162, + "loss": 0.0109, + "step": 197960 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015018238140163763, + "loss": 0.0111, + "step": 197970 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001501748137086236, + "loss": 0.0077, + "step": 197980 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001501672460156096, + "loss": 0.0113, + "step": 197990 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001501596783225956, + "loss": 0.0091, + "step": 198000 + }, + { + "epoch": 1.0, + "eval_cer": 0.9144508479806542, + "eval_loss": 0.007899566553533077, + "eval_runtime": 116.6273, + "eval_samples_per_second": 17.149, + "eval_steps_per_second": 4.287, + "step": 198000 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015015211062958158, + "loss": 0.0115, + "step": 198010 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015014454293656756, + "loss": 0.0108, + "step": 198020 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015013697524355357, + "loss": 0.0132, + "step": 198030 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015012940755053955, + "loss": 0.0086, + "step": 198040 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015012183985752553, + "loss": 0.0124, + "step": 198050 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015011427216451152, + "loss": 0.0122, + "step": 198060 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015010670447149752, + "loss": 0.013, + "step": 198070 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001500991367784835, + "loss": 0.0101, + "step": 198080 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001500915690854695, + "loss": 0.007, + "step": 198090 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001500840013924555, + "loss": 0.0124, + "step": 198100 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015007643369944148, + "loss": 0.0075, + "step": 198110 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015006886600642746, + "loss": 0.0101, + "step": 198120 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015006129831341347, + "loss": 0.0134, + "step": 198130 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015005373062039945, + "loss": 0.0106, + "step": 198140 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015004616292738543, + "loss": 0.0164, + "step": 198150 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015003859523437144, + "loss": 0.0095, + "step": 198160 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015003102754135742, + "loss": 0.0103, + "step": 198170 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001500234598483434, + "loss": 0.0145, + "step": 198180 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001500158921553294, + "loss": 0.0115, + "step": 198190 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001500083244623154, + "loss": 0.0108, + "step": 198200 + }, + { + "epoch": 1.0, + "learning_rate": 0.00015000075676930137, + "loss": 0.0138, + "step": 198210 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014999318907628738, + "loss": 0.0088, + "step": 198220 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014998562138327336, + "loss": 0.01, + "step": 198230 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014997805369025937, + "loss": 0.0105, + "step": 198240 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014997048599724535, + "loss": 0.0092, + "step": 198250 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014996291830423133, + "loss": 0.0114, + "step": 198260 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014995535061121734, + "loss": 0.0114, + "step": 198270 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001499477829182033, + "loss": 0.0106, + "step": 198280 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001499402152251893, + "loss": 0.0107, + "step": 198290 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001499326475321753, + "loss": 0.0087, + "step": 198300 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014992507983916127, + "loss": 0.0094, + "step": 198310 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014991751214614728, + "loss": 0.0105, + "step": 198320 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014990994445313326, + "loss": 0.0088, + "step": 198330 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014990237676011924, + "loss": 0.0093, + "step": 198340 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014989480906710525, + "loss": 0.0089, + "step": 198350 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014988724137409123, + "loss": 0.0106, + "step": 198360 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001498796736810772, + "loss": 0.0083, + "step": 198370 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014987210598806322, + "loss": 0.0092, + "step": 198380 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001498645382950492, + "loss": 0.0089, + "step": 198390 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014985697060203518, + "loss": 0.0096, + "step": 198400 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014984940290902116, + "loss": 0.0117, + "step": 198410 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014984183521600717, + "loss": 0.01, + "step": 198420 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014983426752299315, + "loss": 0.0067, + "step": 198430 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014982669982997914, + "loss": 0.011, + "step": 198440 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014981913213696514, + "loss": 0.0089, + "step": 198450 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014981156444395113, + "loss": 0.0103, + "step": 198460 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001498039967509371, + "loss": 0.0125, + "step": 198470 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014979642905792312, + "loss": 0.0086, + "step": 198480 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001497888613649091, + "loss": 0.0097, + "step": 198490 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014978129367189508, + "loss": 0.0067, + "step": 198500 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001497737259788811, + "loss": 0.0101, + "step": 198510 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014976615828586707, + "loss": 0.0114, + "step": 198520 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014975859059285305, + "loss": 0.009, + "step": 198530 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014975102289983906, + "loss": 0.0081, + "step": 198540 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014974345520682504, + "loss": 0.0108, + "step": 198550 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014973588751381102, + "loss": 0.0095, + "step": 198560 + }, + { + "epoch": 1.0, + "learning_rate": 0.000149728319820797, + "loss": 0.0093, + "step": 198570 + }, + { + "epoch": 1.0, + "learning_rate": 0.000149720752127783, + "loss": 0.01, + "step": 198580 + }, + { + "epoch": 1.0, + "learning_rate": 0.000149713184434769, + "loss": 0.0128, + "step": 198590 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014970561674175497, + "loss": 0.0158, + "step": 198600 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014969804904874098, + "loss": 0.015, + "step": 198610 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014969048135572696, + "loss": 0.0128, + "step": 198620 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014968291366271295, + "loss": 0.011, + "step": 198630 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014967534596969895, + "loss": 0.0096, + "step": 198640 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014966777827668494, + "loss": 0.0108, + "step": 198650 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014966021058367092, + "loss": 0.0095, + "step": 198660 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014965264289065693, + "loss": 0.0113, + "step": 198670 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001496450751976429, + "loss": 0.0095, + "step": 198680 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001496375075046289, + "loss": 0.0101, + "step": 198690 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001496299398116149, + "loss": 0.0108, + "step": 198700 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014962237211860088, + "loss": 0.0107, + "step": 198710 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014961480442558686, + "loss": 0.0074, + "step": 198720 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014960723673257287, + "loss": 0.0135, + "step": 198730 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014959966903955885, + "loss": 0.0103, + "step": 198740 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014959210134654483, + "loss": 0.0113, + "step": 198750 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001495845336535308, + "loss": 0.0097, + "step": 198760 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014957696596051682, + "loss": 0.0079, + "step": 198770 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001495693982675028, + "loss": 0.009, + "step": 198780 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014956183057448878, + "loss": 0.011, + "step": 198790 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001495542628814748, + "loss": 0.0112, + "step": 198800 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014954669518846077, + "loss": 0.011, + "step": 198810 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014953912749544676, + "loss": 0.0096, + "step": 198820 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014953155980243276, + "loss": 0.0077, + "step": 198830 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014952399210941875, + "loss": 0.012, + "step": 198840 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014951642441640473, + "loss": 0.0103, + "step": 198850 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014950885672339074, + "loss": 0.0099, + "step": 198860 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014950128903037672, + "loss": 0.0119, + "step": 198870 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001494937213373627, + "loss": 0.0111, + "step": 198880 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001494861536443487, + "loss": 0.0093, + "step": 198890 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001494785859513347, + "loss": 0.0116, + "step": 198900 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014947101825832067, + "loss": 0.0091, + "step": 198910 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014946345056530665, + "loss": 0.0067, + "step": 198920 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014945588287229263, + "loss": 0.0138, + "step": 198930 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014944831517927861, + "loss": 0.0096, + "step": 198940 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014944074748626462, + "loss": 0.0139, + "step": 198950 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001494331797932506, + "loss": 0.0083, + "step": 198960 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014942561210023659, + "loss": 0.0093, + "step": 198970 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001494180444072226, + "loss": 0.0119, + "step": 198980 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014941047671420858, + "loss": 0.0098, + "step": 198990 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014940290902119456, + "loss": 0.0085, + "step": 199000 + }, + { + "epoch": 1.0, + "eval_cer": 0.914462492734159, + "eval_loss": 0.00810973159968853, + "eval_runtime": 117.6891, + "eval_samples_per_second": 16.994, + "eval_steps_per_second": 4.248, + "step": 199000 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014939534132818057, + "loss": 0.009, + "step": 199010 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014938777363516655, + "loss": 0.0097, + "step": 199020 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014938020594215253, + "loss": 0.0093, + "step": 199030 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014937263824913854, + "loss": 0.0087, + "step": 199040 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014936507055612452, + "loss": 0.008, + "step": 199050 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001493575028631105, + "loss": 0.0094, + "step": 199060 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001493499351700965, + "loss": 0.0084, + "step": 199070 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001493423674770825, + "loss": 0.0079, + "step": 199080 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014933479978406847, + "loss": 0.0093, + "step": 199090 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014932723209105445, + "loss": 0.0095, + "step": 199100 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014931966439804046, + "loss": 0.0083, + "step": 199110 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014931209670502644, + "loss": 0.0098, + "step": 199120 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014930452901201242, + "loss": 0.0098, + "step": 199130 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014929696131899843, + "loss": 0.0107, + "step": 199140 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014928939362598441, + "loss": 0.0079, + "step": 199150 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001492818259329704, + "loss": 0.0087, + "step": 199160 + }, + { + "epoch": 1.0, + "learning_rate": 0.0001492742582399564, + "loss": 0.0103, + "step": 199170 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014926669054694239, + "loss": 0.0108, + "step": 199180 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014925912285392837, + "loss": 0.0162, + "step": 199190 + }, + { + "epoch": 1.0, + "learning_rate": 0.00014925155516091438, + "loss": 0.0074, + "step": 199200 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014924398746790036, + "loss": 0.011, + "step": 199210 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014923641977488634, + "loss": 0.0111, + "step": 199220 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014922885208187235, + "loss": 0.0081, + "step": 199230 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014922128438885833, + "loss": 0.0115, + "step": 199240 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001492137166958443, + "loss": 0.0077, + "step": 199250 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014920614900283032, + "loss": 0.0101, + "step": 199260 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001491985813098163, + "loss": 0.01, + "step": 199270 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014919101361680228, + "loss": 0.0098, + "step": 199280 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014918344592378826, + "loss": 0.0078, + "step": 199290 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014917587823077427, + "loss": 0.0102, + "step": 199300 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014916831053776025, + "loss": 0.0084, + "step": 199310 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014916074284474623, + "loss": 0.0094, + "step": 199320 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014915317515173224, + "loss": 0.0081, + "step": 199330 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014914560745871822, + "loss": 0.0102, + "step": 199340 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001491380397657042, + "loss": 0.0083, + "step": 199350 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014913047207269021, + "loss": 0.0084, + "step": 199360 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001491229043796762, + "loss": 0.0101, + "step": 199370 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014911533668666218, + "loss": 0.0096, + "step": 199380 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014910776899364819, + "loss": 0.008, + "step": 199390 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014910020130063417, + "loss": 0.0093, + "step": 199400 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014909263360762015, + "loss": 0.0102, + "step": 199410 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014908506591460616, + "loss": 0.0093, + "step": 199420 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014907749822159214, + "loss": 0.0085, + "step": 199430 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014906993052857812, + "loss": 0.0085, + "step": 199440 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001490623628355641, + "loss": 0.0091, + "step": 199450 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001490547951425501, + "loss": 0.012, + "step": 199460 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001490472274495361, + "loss": 0.0105, + "step": 199470 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014903965975652207, + "loss": 0.0089, + "step": 199480 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014903209206350808, + "loss": 0.0097, + "step": 199490 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014902452437049406, + "loss": 0.0127, + "step": 199500 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014901695667748004, + "loss": 0.0092, + "step": 199510 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014900938898446605, + "loss": 0.01, + "step": 199520 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014900182129145203, + "loss": 0.0153, + "step": 199530 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014899425359843802, + "loss": 0.0097, + "step": 199540 + }, + { + "epoch": 1.01, + "learning_rate": 0.000148986685905424, + "loss": 0.0117, + "step": 199550 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014897911821240998, + "loss": 0.0114, + "step": 199560 + }, + { + "epoch": 1.01, + "learning_rate": 0.000148971550519396, + "loss": 0.0081, + "step": 199570 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014896398282638197, + "loss": 0.0093, + "step": 199580 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014895641513336795, + "loss": 0.0107, + "step": 199590 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014894884744035396, + "loss": 0.0106, + "step": 199600 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014894127974733994, + "loss": 0.0105, + "step": 199610 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014893371205432592, + "loss": 0.0102, + "step": 199620 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014892614436131193, + "loss": 0.0113, + "step": 199630 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001489185766682979, + "loss": 0.009, + "step": 199640 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001489110089752839, + "loss": 0.0085, + "step": 199650 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014890344128226987, + "loss": 0.0095, + "step": 199660 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014889587358925588, + "loss": 0.0142, + "step": 199670 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014888830589624186, + "loss": 0.0162, + "step": 199680 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014888073820322785, + "loss": 0.0112, + "step": 199690 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014887317051021385, + "loss": 0.01, + "step": 199700 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014886560281719984, + "loss": 0.0089, + "step": 199710 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014885803512418582, + "loss": 0.0101, + "step": 199720 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014885046743117183, + "loss": 0.0114, + "step": 199730 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001488428997381578, + "loss": 0.0106, + "step": 199740 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001488353320451438, + "loss": 0.0077, + "step": 199750 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001488277643521298, + "loss": 0.0069, + "step": 199760 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014882019665911578, + "loss": 0.0109, + "step": 199770 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014881262896610176, + "loss": 0.0105, + "step": 199780 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014880506127308777, + "loss": 0.0082, + "step": 199790 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014879749358007375, + "loss": 0.0137, + "step": 199800 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014878992588705973, + "loss": 0.0094, + "step": 199810 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001487823581940457, + "loss": 0.0089, + "step": 199820 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014877479050103172, + "loss": 0.0105, + "step": 199830 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001487672228080177, + "loss": 0.0118, + "step": 199840 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014875965511500368, + "loss": 0.0099, + "step": 199850 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001487520874219897, + "loss": 0.0095, + "step": 199860 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014874451972897567, + "loss": 0.009, + "step": 199870 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014873695203596166, + "loss": 0.0112, + "step": 199880 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014872938434294766, + "loss": 0.0104, + "step": 199890 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014872181664993365, + "loss": 0.0079, + "step": 199900 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014871424895691963, + "loss": 0.0098, + "step": 199910 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014870668126390564, + "loss": 0.0096, + "step": 199920 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014869911357089162, + "loss": 0.0091, + "step": 199930 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001486915458778776, + "loss": 0.0114, + "step": 199940 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001486839781848636, + "loss": 0.0097, + "step": 199950 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001486764104918496, + "loss": 0.0089, + "step": 199960 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014866884279883557, + "loss": 0.0083, + "step": 199970 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014866127510582155, + "loss": 0.0083, + "step": 199980 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014865370741280756, + "loss": 0.0102, + "step": 199990 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014864613971979354, + "loss": 0.0085, + "step": 200000 + }, + { + "epoch": 1.01, + "eval_cer": 0.9144615223380336, + "eval_loss": 0.007801192346960306, + "eval_runtime": 117.4252, + "eval_samples_per_second": 17.032, + "eval_steps_per_second": 4.258, + "step": 200000 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014863857202677952, + "loss": 0.0097, + "step": 200010 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014863100433376553, + "loss": 0.0116, + "step": 200020 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001486234366407515, + "loss": 0.01, + "step": 200030 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001486158689477375, + "loss": 0.0106, + "step": 200040 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001486083012547235, + "loss": 0.009, + "step": 200050 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014860073356170948, + "loss": 0.0097, + "step": 200060 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014859316586869547, + "loss": 0.0088, + "step": 200070 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014858559817568147, + "loss": 0.0089, + "step": 200080 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014857803048266746, + "loss": 0.0094, + "step": 200090 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014857046278965344, + "loss": 0.0099, + "step": 200100 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014856289509663945, + "loss": 0.0111, + "step": 200110 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014855532740362543, + "loss": 0.0089, + "step": 200120 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001485477597106114, + "loss": 0.009, + "step": 200130 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014854019201759742, + "loss": 0.0108, + "step": 200140 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001485326243245834, + "loss": 0.0074, + "step": 200150 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014852505663156938, + "loss": 0.0089, + "step": 200160 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014851748893855536, + "loss": 0.0093, + "step": 200170 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014850992124554134, + "loss": 0.0089, + "step": 200180 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014850235355252732, + "loss": 0.0087, + "step": 200190 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014849478585951333, + "loss": 0.0114, + "step": 200200 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014848721816649931, + "loss": 0.0094, + "step": 200210 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001484796504734853, + "loss": 0.0091, + "step": 200220 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001484720827804713, + "loss": 0.0075, + "step": 200230 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014846451508745729, + "loss": 0.0082, + "step": 200240 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014845694739444327, + "loss": 0.0095, + "step": 200250 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014844937970142928, + "loss": 0.0083, + "step": 200260 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014844181200841526, + "loss": 0.0106, + "step": 200270 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014843424431540124, + "loss": 0.0085, + "step": 200280 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014842667662238725, + "loss": 0.0112, + "step": 200290 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014841910892937323, + "loss": 0.0095, + "step": 200300 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001484115412363592, + "loss": 0.0104, + "step": 200310 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014840397354334522, + "loss": 0.0104, + "step": 200320 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001483964058503312, + "loss": 0.0079, + "step": 200330 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014838883815731718, + "loss": 0.0083, + "step": 200340 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014838127046430316, + "loss": 0.0099, + "step": 200350 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014837370277128917, + "loss": 0.0074, + "step": 200360 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014836613507827515, + "loss": 0.0176, + "step": 200370 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014835856738526113, + "loss": 0.0103, + "step": 200380 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014835099969224714, + "loss": 0.0098, + "step": 200390 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014834343199923312, + "loss": 0.0109, + "step": 200400 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001483358643062191, + "loss": 0.0095, + "step": 200410 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014832829661320511, + "loss": 0.0097, + "step": 200420 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001483207289201911, + "loss": 0.0099, + "step": 200430 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014831316122717708, + "loss": 0.015, + "step": 200440 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014830559353416309, + "loss": 0.0131, + "step": 200450 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014829802584114907, + "loss": 0.0498, + "step": 200460 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014829045814813505, + "loss": 0.0123, + "step": 200470 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014828289045512106, + "loss": 0.0098, + "step": 200480 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014827532276210704, + "loss": 0.0117, + "step": 200490 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014826775506909302, + "loss": 0.0111, + "step": 200500 + }, + { + "epoch": 1.01, + "learning_rate": 0.000148260187376079, + "loss": 0.0098, + "step": 200510 + }, + { + "epoch": 1.01, + "learning_rate": 0.000148252619683065, + "loss": 0.0111, + "step": 200520 + }, + { + "epoch": 1.01, + "learning_rate": 0.000148245051990051, + "loss": 0.008, + "step": 200530 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014823748429703697, + "loss": 0.0123, + "step": 200540 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014822991660402298, + "loss": 0.0089, + "step": 200550 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014822234891100896, + "loss": 0.008, + "step": 200560 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014821478121799494, + "loss": 0.0079, + "step": 200570 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014820721352498095, + "loss": 0.0071, + "step": 200580 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014819964583196693, + "loss": 0.0119, + "step": 200590 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014819207813895292, + "loss": 0.0127, + "step": 200600 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014818451044593892, + "loss": 0.0112, + "step": 200610 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001481769427529249, + "loss": 0.0087, + "step": 200620 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001481693750599109, + "loss": 0.01, + "step": 200630 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001481618073668969, + "loss": 0.0106, + "step": 200640 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014815423967388288, + "loss": 0.0104, + "step": 200650 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014814667198086886, + "loss": 0.0076, + "step": 200660 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014813910428785487, + "loss": 0.0091, + "step": 200670 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014813153659484085, + "loss": 0.0104, + "step": 200680 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014812396890182683, + "loss": 0.0108, + "step": 200690 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001481164012088128, + "loss": 0.0101, + "step": 200700 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014810883351579882, + "loss": 0.0098, + "step": 200710 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001481012658227848, + "loss": 0.0102, + "step": 200720 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014809369812977078, + "loss": 0.0089, + "step": 200730 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001480861304367568, + "loss": 0.0109, + "step": 200740 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014807856274374277, + "loss": 0.0091, + "step": 200750 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014807099505072875, + "loss": 0.0095, + "step": 200760 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014806342735771476, + "loss": 0.0106, + "step": 200770 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014805585966470074, + "loss": 0.0088, + "step": 200780 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014804829197168673, + "loss": 0.0124, + "step": 200790 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001480407242786727, + "loss": 0.0088, + "step": 200800 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001480331565856587, + "loss": 0.0109, + "step": 200810 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001480255888926447, + "loss": 0.0111, + "step": 200820 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014801802119963068, + "loss": 0.0091, + "step": 200830 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014801045350661666, + "loss": 0.0111, + "step": 200840 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014800288581360267, + "loss": 0.0117, + "step": 200850 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014799531812058865, + "loss": 0.0105, + "step": 200860 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014798775042757463, + "loss": 0.0085, + "step": 200870 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001479801827345606, + "loss": 0.0118, + "step": 200880 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014797261504154662, + "loss": 0.0112, + "step": 200890 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001479650473485326, + "loss": 0.0112, + "step": 200900 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014795747965551858, + "loss": 0.0099, + "step": 200910 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001479499119625046, + "loss": 0.0114, + "step": 200920 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014794234426949057, + "loss": 0.0092, + "step": 200930 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014793477657647656, + "loss": 0.0111, + "step": 200940 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014792720888346256, + "loss": 0.0083, + "step": 200950 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014791964119044855, + "loss": 0.0099, + "step": 200960 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014791207349743453, + "loss": 0.0085, + "step": 200970 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014790450580442054, + "loss": 0.0159, + "step": 200980 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014789693811140652, + "loss": 0.0129, + "step": 200990 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001478893704183925, + "loss": 0.0094, + "step": 201000 + }, + { + "epoch": 1.01, + "eval_cer": 0.914447936792278, + "eval_loss": 0.007961818017065525, + "eval_runtime": 117.347, + "eval_samples_per_second": 17.043, + "eval_steps_per_second": 4.261, + "step": 201000 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001478818027253785, + "loss": 0.0099, + "step": 201010 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001478742350323645, + "loss": 0.0091, + "step": 201020 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014786666733935047, + "loss": 0.0101, + "step": 201030 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014785909964633645, + "loss": 0.0135, + "step": 201040 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014785153195332246, + "loss": 0.0141, + "step": 201050 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014784396426030844, + "loss": 0.0078, + "step": 201060 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014783639656729442, + "loss": 0.011, + "step": 201070 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014782882887428043, + "loss": 0.0122, + "step": 201080 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001478212611812664, + "loss": 0.01, + "step": 201090 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001478136934882524, + "loss": 0.0103, + "step": 201100 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001478061257952384, + "loss": 0.0109, + "step": 201110 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014779855810222438, + "loss": 0.0091, + "step": 201120 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014779099040921037, + "loss": 0.0093, + "step": 201130 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014778342271619637, + "loss": 0.0084, + "step": 201140 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014777585502318236, + "loss": 0.0116, + "step": 201150 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014776828733016834, + "loss": 0.0088, + "step": 201160 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014776071963715435, + "loss": 0.0102, + "step": 201170 + }, + { + "epoch": 1.01, + "learning_rate": 0.00014775315194414033, + "loss": 0.0106, + "step": 201180 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001477455842511263, + "loss": 0.0099, + "step": 201190 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014773801655811232, + "loss": 0.0082, + "step": 201200 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001477304488650983, + "loss": 0.0084, + "step": 201210 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014772288117208428, + "loss": 0.0108, + "step": 201220 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014771531347907026, + "loss": 0.0087, + "step": 201230 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014770774578605627, + "loss": 0.0091, + "step": 201240 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014770017809304225, + "loss": 0.0095, + "step": 201250 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014769261040002823, + "loss": 0.012, + "step": 201260 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014768504270701424, + "loss": 0.0117, + "step": 201270 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014767747501400022, + "loss": 0.0094, + "step": 201280 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001476699073209862, + "loss": 0.0102, + "step": 201290 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001476623396279722, + "loss": 0.0091, + "step": 201300 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001476547719349582, + "loss": 0.0099, + "step": 201310 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014764720424194418, + "loss": 0.0094, + "step": 201320 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014763963654893018, + "loss": 0.0101, + "step": 201330 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014763206885591617, + "loss": 0.0078, + "step": 201340 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014762450116290215, + "loss": 0.011, + "step": 201350 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014761693346988816, + "loss": 0.0092, + "step": 201360 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014760936577687414, + "loss": 0.0096, + "step": 201370 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014760179808386012, + "loss": 0.0086, + "step": 201380 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001475942303908461, + "loss": 0.0102, + "step": 201390 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001475866626978321, + "loss": 0.0091, + "step": 201400 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001475790950048181, + "loss": 0.0143, + "step": 201410 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014757152731180407, + "loss": 0.0086, + "step": 201420 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014756395961879005, + "loss": 0.0101, + "step": 201430 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014755639192577603, + "loss": 0.0089, + "step": 201440 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014754882423276204, + "loss": 0.0119, + "step": 201450 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014754125653974802, + "loss": 0.0099, + "step": 201460 + }, + { + "epoch": 1.02, + "learning_rate": 0.000147533688846734, + "loss": 0.0092, + "step": 201470 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014752612115372001, + "loss": 0.0099, + "step": 201480 + }, + { + "epoch": 1.02, + "learning_rate": 0.000147518553460706, + "loss": 0.0089, + "step": 201490 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014751098576769198, + "loss": 0.0093, + "step": 201500 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014750341807467799, + "loss": 0.0085, + "step": 201510 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014749585038166397, + "loss": 0.0085, + "step": 201520 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014748828268864995, + "loss": 0.0117, + "step": 201530 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014748071499563596, + "loss": 0.0107, + "step": 201540 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014747314730262194, + "loss": 0.0091, + "step": 201550 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014746557960960792, + "loss": 0.0093, + "step": 201560 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014745801191659393, + "loss": 0.0087, + "step": 201570 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001474504442235799, + "loss": 0.0122, + "step": 201580 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001474428765305659, + "loss": 0.009, + "step": 201590 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014743530883755187, + "loss": 0.0093, + "step": 201600 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014742774114453788, + "loss": 0.0069, + "step": 201610 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014742017345152386, + "loss": 0.008, + "step": 201620 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014741260575850984, + "loss": 0.0137, + "step": 201630 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014740503806549585, + "loss": 0.0089, + "step": 201640 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014739747037248183, + "loss": 0.0082, + "step": 201650 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014738990267946782, + "loss": 0.0107, + "step": 201660 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014738233498645382, + "loss": 0.0089, + "step": 201670 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001473747672934398, + "loss": 0.0077, + "step": 201680 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001473671996004258, + "loss": 0.0103, + "step": 201690 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001473596319074118, + "loss": 0.0092, + "step": 201700 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014735206421439778, + "loss": 0.0083, + "step": 201710 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014734449652138376, + "loss": 0.0103, + "step": 201720 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014733692882836977, + "loss": 0.015, + "step": 201730 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014732936113535575, + "loss": 0.0099, + "step": 201740 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014732179344234173, + "loss": 0.0091, + "step": 201750 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001473142257493277, + "loss": 0.0131, + "step": 201760 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014730665805631372, + "loss": 0.0111, + "step": 201770 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001472990903632997, + "loss": 0.0105, + "step": 201780 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014729152267028568, + "loss": 0.0094, + "step": 201790 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001472839549772717, + "loss": 0.0139, + "step": 201800 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014727638728425767, + "loss": 0.0096, + "step": 201810 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014726881959124365, + "loss": 0.0109, + "step": 201820 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014726125189822966, + "loss": 0.011, + "step": 201830 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014725368420521564, + "loss": 0.0092, + "step": 201840 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014724611651220163, + "loss": 0.0099, + "step": 201850 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014723854881918763, + "loss": 0.0108, + "step": 201860 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014723098112617362, + "loss": 0.0077, + "step": 201870 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001472234134331596, + "loss": 0.012, + "step": 201880 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001472158457401456, + "loss": 0.0085, + "step": 201890 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001472082780471316, + "loss": 0.0081, + "step": 201900 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014720071035411757, + "loss": 0.0077, + "step": 201910 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014719314266110355, + "loss": 0.009, + "step": 201920 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014718557496808956, + "loss": 0.0094, + "step": 201930 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014717800727507554, + "loss": 0.011, + "step": 201940 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014717043958206152, + "loss": 0.0107, + "step": 201950 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014716287188904753, + "loss": 0.0086, + "step": 201960 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001471553041960335, + "loss": 0.0099, + "step": 201970 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001471477365030195, + "loss": 0.0105, + "step": 201980 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001471401688100055, + "loss": 0.008, + "step": 201990 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014713260111699148, + "loss": 0.009, + "step": 202000 + }, + { + "epoch": 1.02, + "eval_cer": 0.9144954862024227, + "eval_loss": 0.007912137545645237, + "eval_runtime": 117.0882, + "eval_samples_per_second": 17.081, + "eval_steps_per_second": 4.27, + "step": 202000 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014712503342397746, + "loss": 0.0113, + "step": 202010 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014711746573096347, + "loss": 0.0106, + "step": 202020 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014710989803794945, + "loss": 0.0126, + "step": 202030 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014710233034493544, + "loss": 0.0107, + "step": 202040 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014709476265192142, + "loss": 0.0111, + "step": 202050 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001470871949589074, + "loss": 0.0086, + "step": 202060 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001470796272658934, + "loss": 0.0098, + "step": 202070 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001470720595728794, + "loss": 0.009, + "step": 202080 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014706449187986537, + "loss": 0.0108, + "step": 202090 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014705692418685138, + "loss": 0.0099, + "step": 202100 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014704935649383736, + "loss": 0.0098, + "step": 202110 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014704178880082334, + "loss": 0.0108, + "step": 202120 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014703422110780932, + "loss": 0.0107, + "step": 202130 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014702665341479533, + "loss": 0.0092, + "step": 202140 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001470190857217813, + "loss": 0.009, + "step": 202150 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001470115180287673, + "loss": 0.0084, + "step": 202160 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001470039503357533, + "loss": 0.0118, + "step": 202170 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014699638264273928, + "loss": 0.0094, + "step": 202180 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014698881494972527, + "loss": 0.0087, + "step": 202190 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014698124725671127, + "loss": 0.0129, + "step": 202200 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014697367956369726, + "loss": 0.0133, + "step": 202210 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014696611187068324, + "loss": 0.0087, + "step": 202220 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014695854417766925, + "loss": 0.0078, + "step": 202230 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014695097648465523, + "loss": 0.0098, + "step": 202240 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001469434087916412, + "loss": 0.0114, + "step": 202250 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014693584109862722, + "loss": 0.0098, + "step": 202260 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001469282734056132, + "loss": 0.0074, + "step": 202270 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014692070571259918, + "loss": 0.0088, + "step": 202280 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014691313801958516, + "loss": 0.0101, + "step": 202290 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014690557032657117, + "loss": 0.0098, + "step": 202300 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014689800263355715, + "loss": 0.0111, + "step": 202310 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014689043494054313, + "loss": 0.0127, + "step": 202320 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014688286724752914, + "loss": 0.0075, + "step": 202330 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014687529955451512, + "loss": 0.0084, + "step": 202340 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001468677318615011, + "loss": 0.0105, + "step": 202350 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001468601641684871, + "loss": 0.0088, + "step": 202360 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001468525964754731, + "loss": 0.0096, + "step": 202370 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014684502878245908, + "loss": 0.0097, + "step": 202380 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014683746108944508, + "loss": 0.0119, + "step": 202390 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014682989339643107, + "loss": 0.0079, + "step": 202400 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014682232570341705, + "loss": 0.0113, + "step": 202410 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014681475801040306, + "loss": 0.0093, + "step": 202420 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014680719031738904, + "loss": 0.0107, + "step": 202430 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014679962262437502, + "loss": 0.0089, + "step": 202440 + }, + { + "epoch": 1.02, + "learning_rate": 0.000146792054931361, + "loss": 0.0079, + "step": 202450 + }, + { + "epoch": 1.02, + "learning_rate": 0.000146784487238347, + "loss": 0.0108, + "step": 202460 + }, + { + "epoch": 1.02, + "learning_rate": 0.000146776919545333, + "loss": 0.011, + "step": 202470 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014676935185231897, + "loss": 0.0095, + "step": 202480 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014676178415930498, + "loss": 0.0083, + "step": 202490 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014675421646629096, + "loss": 0.0087, + "step": 202500 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014674664877327694, + "loss": 0.009, + "step": 202510 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014673908108026295, + "loss": 0.0089, + "step": 202520 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014673151338724893, + "loss": 0.0103, + "step": 202530 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014672394569423491, + "loss": 0.0107, + "step": 202540 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014671637800122092, + "loss": 0.0122, + "step": 202550 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001467088103082069, + "loss": 0.0078, + "step": 202560 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014670124261519289, + "loss": 0.0089, + "step": 202570 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001466936749221789, + "loss": 0.0092, + "step": 202580 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014668610722916488, + "loss": 0.0077, + "step": 202590 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014667853953615086, + "loss": 0.0095, + "step": 202600 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014667097184313687, + "loss": 0.0124, + "step": 202610 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014666340415012285, + "loss": 0.0125, + "step": 202620 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014665583645710883, + "loss": 0.0091, + "step": 202630 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001466482687640948, + "loss": 0.0127, + "step": 202640 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014664070107108082, + "loss": 0.0093, + "step": 202650 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001466331333780668, + "loss": 0.0077, + "step": 202660 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014662556568505278, + "loss": 0.009, + "step": 202670 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014661799799203876, + "loss": 0.009, + "step": 202680 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014661043029902474, + "loss": 0.0097, + "step": 202690 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014660286260601075, + "loss": 0.0108, + "step": 202700 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014659529491299673, + "loss": 0.008, + "step": 202710 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014658772721998272, + "loss": 0.0108, + "step": 202720 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014658015952696872, + "loss": 0.0106, + "step": 202730 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001465725918339547, + "loss": 0.0076, + "step": 202740 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001465650241409407, + "loss": 0.0103, + "step": 202750 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001465574564479267, + "loss": 0.0091, + "step": 202760 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014654988875491268, + "loss": 0.0123, + "step": 202770 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014654232106189866, + "loss": 0.0091, + "step": 202780 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014653475336888467, + "loss": 0.0102, + "step": 202790 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014652718567587065, + "loss": 0.0102, + "step": 202800 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014651961798285663, + "loss": 0.008, + "step": 202810 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001465120502898426, + "loss": 0.009, + "step": 202820 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014650448259682862, + "loss": 0.0087, + "step": 202830 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001464969149038146, + "loss": 0.0105, + "step": 202840 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014648934721080058, + "loss": 0.0101, + "step": 202850 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001464817795177866, + "loss": 0.0102, + "step": 202860 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014647421182477257, + "loss": 0.0074, + "step": 202870 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014646664413175856, + "loss": 0.0104, + "step": 202880 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014645907643874456, + "loss": 0.0068, + "step": 202890 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014645150874573055, + "loss": 0.0109, + "step": 202900 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014644394105271653, + "loss": 0.0077, + "step": 202910 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014643637335970254, + "loss": 0.0091, + "step": 202920 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014642880566668852, + "loss": 0.0073, + "step": 202930 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001464212379736745, + "loss": 0.0098, + "step": 202940 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001464136702806605, + "loss": 0.0105, + "step": 202950 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001464061025876465, + "loss": 0.0083, + "step": 202960 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014639853489463247, + "loss": 0.0143, + "step": 202970 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014639096720161845, + "loss": 0.0102, + "step": 202980 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014638339950860446, + "loss": 0.0104, + "step": 202990 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014637583181559044, + "loss": 0.0112, + "step": 203000 + }, + { + "epoch": 1.02, + "eval_cer": 0.9144663743186606, + "eval_loss": 0.0076591866090893745, + "eval_runtime": 117.2192, + "eval_samples_per_second": 17.062, + "eval_steps_per_second": 4.266, + "step": 203000 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014636826412257642, + "loss": 0.0068, + "step": 203010 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014636069642956243, + "loss": 0.0078, + "step": 203020 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001463531287365484, + "loss": 0.0119, + "step": 203030 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001463455610435344, + "loss": 0.0111, + "step": 203040 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001463379933505204, + "loss": 0.0103, + "step": 203050 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014633042565750638, + "loss": 0.0069, + "step": 203060 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014632285796449237, + "loss": 0.0126, + "step": 203070 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014631529027147837, + "loss": 0.0096, + "step": 203080 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014630772257846436, + "loss": 0.0093, + "step": 203090 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014630015488545034, + "loss": 0.0112, + "step": 203100 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014629258719243635, + "loss": 0.0092, + "step": 203110 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014628501949942233, + "loss": 0.0113, + "step": 203120 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001462774518064083, + "loss": 0.0084, + "step": 203130 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014626988411339432, + "loss": 0.0112, + "step": 203140 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001462623164203803, + "loss": 0.0112, + "step": 203150 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014625474872736628, + "loss": 0.0124, + "step": 203160 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014624718103435226, + "loss": 0.0087, + "step": 203170 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014623961334133827, + "loss": 0.0082, + "step": 203180 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014623204564832425, + "loss": 0.0099, + "step": 203190 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014622447795531023, + "loss": 0.0091, + "step": 203200 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014621691026229624, + "loss": 0.0085, + "step": 203210 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014620934256928222, + "loss": 0.01, + "step": 203220 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001462017748762682, + "loss": 0.0103, + "step": 203230 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461942071832542, + "loss": 0.0097, + "step": 203240 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461866394902402, + "loss": 0.0103, + "step": 203250 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014617907179722618, + "loss": 0.0112, + "step": 203260 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014617150410421218, + "loss": 0.0121, + "step": 203270 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014616393641119817, + "loss": 0.0097, + "step": 203280 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014615636871818415, + "loss": 0.0122, + "step": 203290 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014614880102517016, + "loss": 0.0086, + "step": 203300 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461412333321561, + "loss": 0.011, + "step": 203310 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014613366563914212, + "loss": 0.0109, + "step": 203320 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461260979461281, + "loss": 0.0095, + "step": 203330 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014611853025311408, + "loss": 0.0088, + "step": 203340 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014611096256010006, + "loss": 0.0085, + "step": 203350 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014610339486708607, + "loss": 0.0097, + "step": 203360 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014609582717407205, + "loss": 0.0085, + "step": 203370 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014608825948105803, + "loss": 0.0098, + "step": 203380 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014608069178804404, + "loss": 0.0085, + "step": 203390 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014607312409503002, + "loss": 0.0095, + "step": 203400 + }, + { + "epoch": 1.03, + "learning_rate": 0.000146065556402016, + "loss": 0.0063, + "step": 203410 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014605798870900201, + "loss": 0.0093, + "step": 203420 + }, + { + "epoch": 1.03, + "learning_rate": 0.000146050421015988, + "loss": 0.01, + "step": 203430 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014604285332297398, + "loss": 0.0097, + "step": 203440 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014603528562995999, + "loss": 0.009, + "step": 203450 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014602771793694597, + "loss": 0.0107, + "step": 203460 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014602015024393195, + "loss": 0.008, + "step": 203470 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014601258255091796, + "loss": 0.0097, + "step": 203480 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014600501485790394, + "loss": 0.0107, + "step": 203490 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014599744716488992, + "loss": 0.0069, + "step": 203500 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014598987947187593, + "loss": 0.0118, + "step": 203510 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459823117788619, + "loss": 0.0086, + "step": 203520 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459747440858479, + "loss": 0.0093, + "step": 203530 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014596717639283387, + "loss": 0.0102, + "step": 203540 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014595960869981988, + "loss": 0.009, + "step": 203550 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014595204100680586, + "loss": 0.0115, + "step": 203560 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014594447331379184, + "loss": 0.0093, + "step": 203570 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014593690562077785, + "loss": 0.0092, + "step": 203580 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014592933792776383, + "loss": 0.0089, + "step": 203590 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014592177023474982, + "loss": 0.0102, + "step": 203600 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014591420254173582, + "loss": 0.0102, + "step": 203610 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459066348487218, + "loss": 0.0117, + "step": 203620 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001458990671557078, + "loss": 0.0095, + "step": 203630 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001458914994626938, + "loss": 0.0096, + "step": 203640 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014588393176967978, + "loss": 0.0098, + "step": 203650 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014587636407666576, + "loss": 0.0112, + "step": 203660 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014586879638365177, + "loss": 0.0091, + "step": 203670 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014586122869063775, + "loss": 0.0091, + "step": 203680 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014585366099762373, + "loss": 0.0123, + "step": 203690 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001458460933046097, + "loss": 0.0098, + "step": 203700 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014583852561159572, + "loss": 0.0117, + "step": 203710 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001458309579185817, + "loss": 0.0095, + "step": 203720 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014582339022556768, + "loss": 0.0101, + "step": 203730 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001458158225325537, + "loss": 0.0086, + "step": 203740 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014580825483953967, + "loss": 0.0114, + "step": 203750 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014580068714652565, + "loss": 0.0103, + "step": 203760 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014579311945351166, + "loss": 0.009, + "step": 203770 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014578555176049764, + "loss": 0.0099, + "step": 203780 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014577798406748363, + "loss": 0.0109, + "step": 203790 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014577041637446963, + "loss": 0.0094, + "step": 203800 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014576284868145562, + "loss": 0.0113, + "step": 203810 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001457552809884416, + "loss": 0.0124, + "step": 203820 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001457477132954276, + "loss": 0.0104, + "step": 203830 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001457401456024136, + "loss": 0.0105, + "step": 203840 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014573257790939957, + "loss": 0.0132, + "step": 203850 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014572501021638555, + "loss": 0.0131, + "step": 203860 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014571744252337156, + "loss": 0.0109, + "step": 203870 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014570987483035754, + "loss": 0.0103, + "step": 203880 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014570230713734352, + "loss": 0.0121, + "step": 203890 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014569473944432953, + "loss": 0.0119, + "step": 203900 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001456871717513155, + "loss": 0.0101, + "step": 203910 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001456796040583015, + "loss": 0.0117, + "step": 203920 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014567203636528747, + "loss": 0.0107, + "step": 203930 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014566446867227346, + "loss": 0.0096, + "step": 203940 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014565690097925946, + "loss": 0.0089, + "step": 203950 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014564933328624545, + "loss": 0.0073, + "step": 203960 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014564176559323143, + "loss": 0.0089, + "step": 203970 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014563419790021744, + "loss": 0.0104, + "step": 203980 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014562663020720342, + "loss": 0.0087, + "step": 203990 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001456190625141894, + "loss": 0.0129, + "step": 204000 + }, + { + "epoch": 1.03, + "eval_cer": 0.9144741374876638, + "eval_loss": 0.007685788441449404, + "eval_runtime": 116.7131, + "eval_samples_per_second": 17.136, + "eval_steps_per_second": 4.284, + "step": 204000 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001456114948211754, + "loss": 0.0097, + "step": 204010 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001456039271281614, + "loss": 0.0117, + "step": 204020 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014559635943514737, + "loss": 0.0079, + "step": 204030 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014558879174213338, + "loss": 0.0103, + "step": 204040 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014558122404911936, + "loss": 0.0096, + "step": 204050 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014557365635610534, + "loss": 0.008, + "step": 204060 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014556608866309132, + "loss": 0.0097, + "step": 204070 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014555852097007733, + "loss": 0.0095, + "step": 204080 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001455509532770633, + "loss": 0.0104, + "step": 204090 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001455433855840493, + "loss": 0.0104, + "step": 204100 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001455358178910353, + "loss": 0.0085, + "step": 204110 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014552825019802128, + "loss": 0.0133, + "step": 204120 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014552068250500727, + "loss": 0.0113, + "step": 204130 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014551311481199327, + "loss": 0.0101, + "step": 204140 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014550554711897926, + "loss": 0.008, + "step": 204150 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014549797942596524, + "loss": 0.0104, + "step": 204160 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014549041173295125, + "loss": 0.0104, + "step": 204170 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014548284403993723, + "loss": 0.0098, + "step": 204180 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001454752763469232, + "loss": 0.009, + "step": 204190 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014546770865390922, + "loss": 0.0093, + "step": 204200 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001454601409608952, + "loss": 0.0102, + "step": 204210 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014545257326788118, + "loss": 0.0134, + "step": 204220 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014544500557486716, + "loss": 0.0116, + "step": 204230 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014543743788185317, + "loss": 0.0145, + "step": 204240 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014542987018883915, + "loss": 0.0131, + "step": 204250 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014542230249582513, + "loss": 0.0092, + "step": 204260 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014541473480281114, + "loss": 0.0095, + "step": 204270 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014540716710979712, + "loss": 0.0092, + "step": 204280 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001453995994167831, + "loss": 0.0087, + "step": 204290 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001453920317237691, + "loss": 0.0116, + "step": 204300 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001453844640307551, + "loss": 0.0102, + "step": 204310 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014537689633774108, + "loss": 0.0114, + "step": 204320 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014536932864472708, + "loss": 0.0109, + "step": 204330 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014536176095171307, + "loss": 0.0112, + "step": 204340 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014535419325869905, + "loss": 0.0093, + "step": 204350 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014534662556568506, + "loss": 0.0092, + "step": 204360 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014533905787267104, + "loss": 0.0123, + "step": 204370 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014533149017965702, + "loss": 0.009, + "step": 204380 + }, + { + "epoch": 1.03, + "learning_rate": 0.000145323922486643, + "loss": 0.0106, + "step": 204390 + }, + { + "epoch": 1.03, + "learning_rate": 0.000145316354793629, + "loss": 0.0101, + "step": 204400 + }, + { + "epoch": 1.03, + "learning_rate": 0.000145308787100615, + "loss": 0.0129, + "step": 204410 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014530121940760097, + "loss": 0.0094, + "step": 204420 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014529365171458698, + "loss": 0.0116, + "step": 204430 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014528608402157296, + "loss": 0.0095, + "step": 204440 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014527851632855894, + "loss": 0.0114, + "step": 204450 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014527094863554495, + "loss": 0.0093, + "step": 204460 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014526338094253093, + "loss": 0.0084, + "step": 204470 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014525581324951691, + "loss": 0.0095, + "step": 204480 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014524824555650292, + "loss": 0.0102, + "step": 204490 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001452406778634889, + "loss": 0.0102, + "step": 204500 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014523311017047489, + "loss": 0.0083, + "step": 204510 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001452255424774609, + "loss": 0.0098, + "step": 204520 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014521797478444688, + "loss": 0.0112, + "step": 204530 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014521040709143286, + "loss": 0.0112, + "step": 204540 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014520283939841887, + "loss": 0.0103, + "step": 204550 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014519527170540482, + "loss": 0.0103, + "step": 204560 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014518770401239083, + "loss": 0.0155, + "step": 204570 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451801363193768, + "loss": 0.0085, + "step": 204580 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451725686263628, + "loss": 0.009, + "step": 204590 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014516500093334877, + "loss": 0.0116, + "step": 204600 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014515743324033478, + "loss": 0.0101, + "step": 204610 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014514986554732076, + "loss": 0.0123, + "step": 204620 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014514229785430674, + "loss": 0.0081, + "step": 204630 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014513473016129275, + "loss": 0.01, + "step": 204640 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014512716246827873, + "loss": 0.013, + "step": 204650 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014511959477526472, + "loss": 0.009, + "step": 204660 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014511202708225072, + "loss": 0.0089, + "step": 204670 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451044593892367, + "loss": 0.0136, + "step": 204680 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450968916962227, + "loss": 0.0098, + "step": 204690 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450893240032087, + "loss": 0.0125, + "step": 204700 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014508175631019468, + "loss": 0.0101, + "step": 204710 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014507418861718066, + "loss": 0.0109, + "step": 204720 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014506662092416667, + "loss": 0.0129, + "step": 204730 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014505905323115265, + "loss": 0.0087, + "step": 204740 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014505148553813863, + "loss": 0.0107, + "step": 204750 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450439178451246, + "loss": 0.0156, + "step": 204760 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014503635015211062, + "loss": 0.0087, + "step": 204770 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450287824590966, + "loss": 0.0073, + "step": 204780 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014502121476608258, + "loss": 0.008, + "step": 204790 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450136470730686, + "loss": 0.0084, + "step": 204800 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014500607938005457, + "loss": 0.0102, + "step": 204810 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014499851168704055, + "loss": 0.0112, + "step": 204820 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014499094399402656, + "loss": 0.0088, + "step": 204830 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014498337630101254, + "loss": 0.0097, + "step": 204840 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014497580860799853, + "loss": 0.0086, + "step": 204850 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014496824091498453, + "loss": 0.0077, + "step": 204860 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014496067322197052, + "loss": 0.0092, + "step": 204870 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001449531055289565, + "loss": 0.0108, + "step": 204880 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001449455378359425, + "loss": 0.0111, + "step": 204890 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001449379701429285, + "loss": 0.0098, + "step": 204900 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014493040244991447, + "loss": 0.0112, + "step": 204910 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014492283475690045, + "loss": 0.0082, + "step": 204920 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014491526706388646, + "loss": 0.0109, + "step": 204930 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014490769937087244, + "loss": 0.0086, + "step": 204940 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014490013167785842, + "loss": 0.0087, + "step": 204950 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014489256398484443, + "loss": 0.0114, + "step": 204960 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001448849962918304, + "loss": 0.01, + "step": 204970 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001448774285988164, + "loss": 0.0073, + "step": 204980 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001448698609058024, + "loss": 0.0077, + "step": 204990 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014486229321278838, + "loss": 0.0101, + "step": 205000 + }, + { + "epoch": 1.03, + "eval_cer": 0.9144615223380336, + "eval_loss": 0.007726417388767004, + "eval_runtime": 116.6083, + "eval_samples_per_second": 17.151, + "eval_steps_per_second": 4.288, + "step": 205000 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014485472551977436, + "loss": 0.0074, + "step": 205010 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014484715782676037, + "loss": 0.0116, + "step": 205020 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014483959013374635, + "loss": 0.0089, + "step": 205030 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014483202244073234, + "loss": 0.0081, + "step": 205040 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014482445474771834, + "loss": 0.0119, + "step": 205050 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014481688705470433, + "loss": 0.0079, + "step": 205060 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001448093193616903, + "loss": 0.0084, + "step": 205070 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014480175166867632, + "loss": 0.0103, + "step": 205080 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001447941839756623, + "loss": 0.013, + "step": 205090 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014478661628264828, + "loss": 0.0105, + "step": 205100 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014477904858963426, + "loss": 0.0088, + "step": 205110 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014477148089662027, + "loss": 0.0107, + "step": 205120 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014476391320360625, + "loss": 0.0088, + "step": 205130 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014475634551059223, + "loss": 0.0085, + "step": 205140 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014474877781757824, + "loss": 0.0087, + "step": 205150 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014474121012456422, + "loss": 0.0076, + "step": 205160 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001447336424315502, + "loss": 0.011, + "step": 205170 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001447260747385362, + "loss": 0.012, + "step": 205180 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014471850704552217, + "loss": 0.011, + "step": 205190 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014471093935250817, + "loss": 0.01, + "step": 205200 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014470337165949416, + "loss": 0.0123, + "step": 205210 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014469580396648014, + "loss": 0.0109, + "step": 205220 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014468823627346615, + "loss": 0.0093, + "step": 205230 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014468066858045213, + "loss": 0.0094, + "step": 205240 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001446731008874381, + "loss": 0.0103, + "step": 205250 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014466553319442412, + "loss": 0.0082, + "step": 205260 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001446579655014101, + "loss": 0.009, + "step": 205270 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014465039780839608, + "loss": 0.0119, + "step": 205280 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014464283011538206, + "loss": 0.0084, + "step": 205290 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014463526242236807, + "loss": 0.0083, + "step": 205300 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014462769472935405, + "loss": 0.0115, + "step": 205310 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014462012703634003, + "loss": 0.0095, + "step": 205320 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014461255934332604, + "loss": 0.009, + "step": 205330 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014460499165031202, + "loss": 0.0096, + "step": 205340 + }, + { + "epoch": 1.04, + "learning_rate": 0.000144597423957298, + "loss": 0.0134, + "step": 205350 + }, + { + "epoch": 1.04, + "learning_rate": 0.000144589856264284, + "loss": 0.0081, + "step": 205360 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014458228857127, + "loss": 0.0103, + "step": 205370 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014457472087825598, + "loss": 0.0089, + "step": 205380 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014456715318524198, + "loss": 0.0101, + "step": 205390 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014455958549222797, + "loss": 0.0081, + "step": 205400 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014455201779921395, + "loss": 0.0104, + "step": 205410 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014454445010619996, + "loss": 0.0136, + "step": 205420 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014453688241318594, + "loss": 0.0105, + "step": 205430 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014452931472017192, + "loss": 0.0083, + "step": 205440 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014452174702715793, + "loss": 0.0091, + "step": 205450 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001445141793341439, + "loss": 0.0103, + "step": 205460 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001445066116411299, + "loss": 0.0091, + "step": 205470 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014449904394811587, + "loss": 0.0117, + "step": 205480 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014449147625510188, + "loss": 0.011, + "step": 205490 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014448390856208786, + "loss": 0.0097, + "step": 205500 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014447634086907384, + "loss": 0.0082, + "step": 205510 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014446877317605985, + "loss": 0.0077, + "step": 205520 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014446120548304583, + "loss": 0.0106, + "step": 205530 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014445363779003181, + "loss": 0.0116, + "step": 205540 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014444607009701782, + "loss": 0.0111, + "step": 205550 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001444385024040038, + "loss": 0.0081, + "step": 205560 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014443093471098979, + "loss": 0.0096, + "step": 205570 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001444233670179758, + "loss": 0.0108, + "step": 205580 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014441579932496178, + "loss": 0.0076, + "step": 205590 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014440823163194776, + "loss": 0.0106, + "step": 205600 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014440066393893377, + "loss": 0.0106, + "step": 205610 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014439309624591975, + "loss": 0.0089, + "step": 205620 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014438552855290573, + "loss": 0.0099, + "step": 205630 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001443779608598917, + "loss": 0.0117, + "step": 205640 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014437039316687772, + "loss": 0.0088, + "step": 205650 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001443628254738637, + "loss": 0.0078, + "step": 205660 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014435525778084968, + "loss": 0.0135, + "step": 205670 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001443476900878357, + "loss": 0.0093, + "step": 205680 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014434012239482167, + "loss": 0.0097, + "step": 205690 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014433255470180765, + "loss": 0.0102, + "step": 205700 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014432498700879366, + "loss": 0.0102, + "step": 205710 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014431741931577964, + "loss": 0.011, + "step": 205720 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014430985162276562, + "loss": 0.0096, + "step": 205730 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014430228392975163, + "loss": 0.0122, + "step": 205740 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014429471623673761, + "loss": 0.0117, + "step": 205750 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442871485437236, + "loss": 0.0094, + "step": 205760 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442795808507096, + "loss": 0.01, + "step": 205770 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014427201315769559, + "loss": 0.0115, + "step": 205780 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014426444546468157, + "loss": 0.0081, + "step": 205790 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014425687777166755, + "loss": 0.0088, + "step": 205800 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014424931007865356, + "loss": 0.0095, + "step": 205810 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442417423856395, + "loss": 0.0092, + "step": 205820 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014423417469262552, + "loss": 0.0106, + "step": 205830 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442266069996115, + "loss": 0.0065, + "step": 205840 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014421903930659748, + "loss": 0.0106, + "step": 205850 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442114716135835, + "loss": 0.0092, + "step": 205860 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014420390392056947, + "loss": 0.0094, + "step": 205870 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014419633622755545, + "loss": 0.0103, + "step": 205880 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014418876853454146, + "loss": 0.0116, + "step": 205890 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014418120084152744, + "loss": 0.0106, + "step": 205900 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014417363314851343, + "loss": 0.0106, + "step": 205910 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014416606545549943, + "loss": 0.0135, + "step": 205920 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014415849776248542, + "loss": 0.0098, + "step": 205930 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001441509300694714, + "loss": 0.0085, + "step": 205940 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001441433623764574, + "loss": 0.0087, + "step": 205950 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001441357946834434, + "loss": 0.0073, + "step": 205960 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014412822699042937, + "loss": 0.0101, + "step": 205970 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014412065929741538, + "loss": 0.0088, + "step": 205980 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014411309160440136, + "loss": 0.0084, + "step": 205990 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014410552391138734, + "loss": 0.0122, + "step": 206000 + }, + { + "epoch": 1.04, + "eval_cer": 0.914452788772905, + "eval_loss": 0.007414559833705425, + "eval_runtime": 116.657, + "eval_samples_per_second": 17.144, + "eval_steps_per_second": 4.286, + "step": 206000 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014409795621837332, + "loss": 0.0079, + "step": 206010 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014409038852535933, + "loss": 0.0104, + "step": 206020 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440828208323453, + "loss": 0.0149, + "step": 206030 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440752531393313, + "loss": 0.0109, + "step": 206040 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440676854463173, + "loss": 0.0074, + "step": 206050 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014406011775330328, + "loss": 0.0079, + "step": 206060 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014405255006028926, + "loss": 0.0116, + "step": 206070 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014404498236727527, + "loss": 0.0102, + "step": 206080 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014403741467426125, + "loss": 0.0083, + "step": 206090 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014402984698124724, + "loss": 0.0103, + "step": 206100 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014402227928823324, + "loss": 0.0104, + "step": 206110 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014401471159521923, + "loss": 0.0131, + "step": 206120 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440071439022052, + "loss": 0.0095, + "step": 206130 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014399957620919122, + "loss": 0.0094, + "step": 206140 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001439920085161772, + "loss": 0.0094, + "step": 206150 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014398444082316318, + "loss": 0.0097, + "step": 206160 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014397687313014916, + "loss": 0.0098, + "step": 206170 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014396930543713517, + "loss": 0.0089, + "step": 206180 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014396173774412115, + "loss": 0.0111, + "step": 206190 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014395417005110713, + "loss": 0.0104, + "step": 206200 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014394660235809314, + "loss": 0.0091, + "step": 206210 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014393903466507912, + "loss": 0.0094, + "step": 206220 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001439314669720651, + "loss": 0.0101, + "step": 206230 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001439238992790511, + "loss": 0.0108, + "step": 206240 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001439163315860371, + "loss": 0.0113, + "step": 206250 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014390876389302307, + "loss": 0.0099, + "step": 206260 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014390119620000908, + "loss": 0.0088, + "step": 206270 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014389362850699506, + "loss": 0.0087, + "step": 206280 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014388606081398105, + "loss": 0.0105, + "step": 206290 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014387849312096705, + "loss": 0.0109, + "step": 206300 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014387092542795304, + "loss": 0.0121, + "step": 206310 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014386335773493902, + "loss": 0.012, + "step": 206320 + }, + { + "epoch": 1.04, + "learning_rate": 0.000143855790041925, + "loss": 0.0095, + "step": 206330 + }, + { + "epoch": 1.04, + "learning_rate": 0.000143848222348911, + "loss": 0.0087, + "step": 206340 + }, + { + "epoch": 1.04, + "learning_rate": 0.000143840654655897, + "loss": 0.0126, + "step": 206350 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014383308696288297, + "loss": 0.0082, + "step": 206360 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014382551926986898, + "loss": 0.0112, + "step": 206370 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014381795157685496, + "loss": 0.0122, + "step": 206380 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014381038388384094, + "loss": 0.0088, + "step": 206390 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014380281619082695, + "loss": 0.0093, + "step": 206400 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014379524849781293, + "loss": 0.0104, + "step": 206410 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001437876808047989, + "loss": 0.0111, + "step": 206420 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014378011311178492, + "loss": 0.008, + "step": 206430 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001437725454187709, + "loss": 0.0107, + "step": 206440 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014376497772575688, + "loss": 0.0085, + "step": 206450 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014375741003274287, + "loss": 0.0103, + "step": 206460 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014374984233972885, + "loss": 0.0108, + "step": 206470 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014374227464671486, + "loss": 0.0081, + "step": 206480 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014373470695370084, + "loss": 0.0088, + "step": 206490 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014372713926068682, + "loss": 0.0113, + "step": 206500 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014371957156767283, + "loss": 0.0102, + "step": 206510 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001437120038746588, + "loss": 0.0089, + "step": 206520 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001437044361816448, + "loss": 0.009, + "step": 206530 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014369686848863077, + "loss": 0.0105, + "step": 206540 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014368930079561678, + "loss": 0.0127, + "step": 206550 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014368173310260276, + "loss": 0.0067, + "step": 206560 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014367416540958874, + "loss": 0.0093, + "step": 206570 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014366659771657475, + "loss": 0.0078, + "step": 206580 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014365903002356073, + "loss": 0.0135, + "step": 206590 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014365146233054671, + "loss": 0.0105, + "step": 206600 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014364389463753272, + "loss": 0.0101, + "step": 206610 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001436363269445187, + "loss": 0.0074, + "step": 206620 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014362875925150469, + "loss": 0.0101, + "step": 206630 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001436211915584907, + "loss": 0.0096, + "step": 206640 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014361362386547668, + "loss": 0.0105, + "step": 206650 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014360605617246266, + "loss": 0.0078, + "step": 206660 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014359848847944867, + "loss": 0.0106, + "step": 206670 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014359092078643465, + "loss": 0.0088, + "step": 206680 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014358335309342063, + "loss": 0.0138, + "step": 206690 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435757854004066, + "loss": 0.0087, + "step": 206700 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014356821770739262, + "loss": 0.009, + "step": 206710 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435606500143786, + "loss": 0.0091, + "step": 206720 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014355308232136458, + "loss": 0.0081, + "step": 206730 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435455146283506, + "loss": 0.007, + "step": 206740 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014353794693533657, + "loss": 0.0106, + "step": 206750 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014353037924232255, + "loss": 0.0101, + "step": 206760 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014352281154930856, + "loss": 0.0093, + "step": 206770 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014351524385629454, + "loss": 0.009, + "step": 206780 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014350767616328052, + "loss": 0.0087, + "step": 206790 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014350010847026653, + "loss": 0.0115, + "step": 206800 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014349254077725251, + "loss": 0.0087, + "step": 206810 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434849730842385, + "loss": 0.0115, + "step": 206820 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434774053912245, + "loss": 0.0096, + "step": 206830 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014346983769821049, + "loss": 0.0115, + "step": 206840 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014346227000519647, + "loss": 0.0089, + "step": 206850 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014345470231218245, + "loss": 0.0098, + "step": 206860 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014344713461916846, + "loss": 0.0089, + "step": 206870 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014343956692615444, + "loss": 0.0102, + "step": 206880 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014343199923314042, + "loss": 0.0076, + "step": 206890 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014342443154012643, + "loss": 0.0109, + "step": 206900 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434168638471124, + "loss": 0.0108, + "step": 206910 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434092961540984, + "loss": 0.0112, + "step": 206920 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434017284610844, + "loss": 0.0116, + "step": 206930 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014339416076807038, + "loss": 0.0086, + "step": 206940 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014338659307505636, + "loss": 0.01, + "step": 206950 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014337902538204237, + "loss": 0.011, + "step": 206960 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014337145768902835, + "loss": 0.0092, + "step": 206970 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014336388999601433, + "loss": 0.0086, + "step": 206980 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014335632230300034, + "loss": 0.0102, + "step": 206990 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014334875460998632, + "loss": 0.0136, + "step": 207000 + }, + { + "epoch": 1.04, + "eval_cer": 0.9144566703574066, + "eval_loss": 0.0076129864901304245, + "eval_runtime": 116.5362, + "eval_samples_per_second": 17.162, + "eval_steps_per_second": 4.291, + "step": 207000 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001433411869169723, + "loss": 0.008, + "step": 207010 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014333361922395831, + "loss": 0.0079, + "step": 207020 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001433260515309443, + "loss": 0.0077, + "step": 207030 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014331848383793028, + "loss": 0.0097, + "step": 207040 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014331091614491626, + "loss": 0.0083, + "step": 207050 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014330334845190227, + "loss": 0.01, + "step": 207060 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014329578075888825, + "loss": 0.0084, + "step": 207070 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014328821306587423, + "loss": 0.0112, + "step": 207080 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001432806453728602, + "loss": 0.0095, + "step": 207090 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001432730776798462, + "loss": 0.0095, + "step": 207100 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001432655099868322, + "loss": 0.0097, + "step": 207110 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014325794229381818, + "loss": 0.009, + "step": 207120 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014325037460080416, + "loss": 0.0101, + "step": 207130 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014324280690779017, + "loss": 0.0084, + "step": 207140 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014323523921477615, + "loss": 0.0075, + "step": 207150 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014322767152176214, + "loss": 0.0094, + "step": 207160 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014322010382874814, + "loss": 0.0112, + "step": 207170 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014321253613573413, + "loss": 0.0117, + "step": 207180 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001432049684427201, + "loss": 0.0074, + "step": 207190 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014319740074970612, + "loss": 0.0109, + "step": 207200 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001431898330566921, + "loss": 0.0093, + "step": 207210 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014318226536367808, + "loss": 0.0128, + "step": 207220 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014317469767066406, + "loss": 0.0111, + "step": 207230 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014316712997765007, + "loss": 0.0089, + "step": 207240 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014315956228463605, + "loss": 0.008, + "step": 207250 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014315199459162203, + "loss": 0.0119, + "step": 207260 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014314442689860804, + "loss": 0.0091, + "step": 207270 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014313685920559402, + "loss": 0.0106, + "step": 207280 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014312929151258, + "loss": 0.0084, + "step": 207290 + }, + { + "epoch": 1.05, + "learning_rate": 0.000143121723819566, + "loss": 0.0105, + "step": 207300 + }, + { + "epoch": 1.05, + "learning_rate": 0.000143114156126552, + "loss": 0.008, + "step": 207310 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014310658843353797, + "loss": 0.0087, + "step": 207320 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014309902074052398, + "loss": 0.0114, + "step": 207330 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014309145304750996, + "loss": 0.0097, + "step": 207340 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014308388535449595, + "loss": 0.0109, + "step": 207350 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014307631766148195, + "loss": 0.0163, + "step": 207360 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014306874996846794, + "loss": 0.0126, + "step": 207370 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014306118227545392, + "loss": 0.0112, + "step": 207380 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014305361458243993, + "loss": 0.013, + "step": 207390 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001430460468894259, + "loss": 0.0105, + "step": 207400 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001430384791964119, + "loss": 0.0108, + "step": 207410 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014303091150339787, + "loss": 0.0096, + "step": 207420 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014302334381038388, + "loss": 0.0102, + "step": 207430 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014301577611736986, + "loss": 0.0116, + "step": 207440 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014300820842435584, + "loss": 0.0106, + "step": 207450 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014300064073134185, + "loss": 0.01, + "step": 207460 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014299307303832783, + "loss": 0.0103, + "step": 207470 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001429855053453138, + "loss": 0.0099, + "step": 207480 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014297793765229982, + "loss": 0.0084, + "step": 207490 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001429703699592858, + "loss": 0.009, + "step": 207500 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014296280226627178, + "loss": 0.0084, + "step": 207510 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001429552345732578, + "loss": 0.0081, + "step": 207520 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014294766688024377, + "loss": 0.0101, + "step": 207530 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014294009918722976, + "loss": 0.0114, + "step": 207540 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014293253149421576, + "loss": 0.0085, + "step": 207550 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014292496380120175, + "loss": 0.009, + "step": 207560 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014291739610818773, + "loss": 0.011, + "step": 207570 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001429098284151737, + "loss": 0.0102, + "step": 207580 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014290226072215972, + "loss": 0.0092, + "step": 207590 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001428946930291457, + "loss": 0.0109, + "step": 207600 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014288712533613168, + "loss": 0.0101, + "step": 207610 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001428795576431177, + "loss": 0.0094, + "step": 207620 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014287198995010367, + "loss": 0.0094, + "step": 207630 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014286442225708965, + "loss": 0.0098, + "step": 207640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014285685456407566, + "loss": 0.0101, + "step": 207650 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014284928687106164, + "loss": 0.01, + "step": 207660 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014284171917804762, + "loss": 0.0081, + "step": 207670 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014283415148503363, + "loss": 0.009, + "step": 207680 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001428265837920196, + "loss": 0.0099, + "step": 207690 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001428190160990056, + "loss": 0.009, + "step": 207700 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014281144840599158, + "loss": 0.0096, + "step": 207710 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014280388071297756, + "loss": 0.0084, + "step": 207720 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014279631301996357, + "loss": 0.0094, + "step": 207730 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014278874532694955, + "loss": 0.0126, + "step": 207740 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014278117763393553, + "loss": 0.0098, + "step": 207750 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427736099409215, + "loss": 0.0103, + "step": 207760 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014276604224790752, + "loss": 0.0098, + "step": 207770 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427584745548935, + "loss": 0.01, + "step": 207780 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014275090686187948, + "loss": 0.0107, + "step": 207790 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427433391688655, + "loss": 0.007, + "step": 207800 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014273577147585147, + "loss": 0.0092, + "step": 207810 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014272820378283745, + "loss": 0.0093, + "step": 207820 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014272063608982346, + "loss": 0.0121, + "step": 207830 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014271306839680944, + "loss": 0.0121, + "step": 207840 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014270550070379542, + "loss": 0.0093, + "step": 207850 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014269793301078143, + "loss": 0.0107, + "step": 207860 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014269036531776741, + "loss": 0.0096, + "step": 207870 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426827976247534, + "loss": 0.0085, + "step": 207880 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426752299317394, + "loss": 0.009, + "step": 207890 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014266766223872539, + "loss": 0.0108, + "step": 207900 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014266009454571137, + "loss": 0.0105, + "step": 207910 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014265252685269738, + "loss": 0.0087, + "step": 207920 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014264495915968336, + "loss": 0.01, + "step": 207930 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014263739146666934, + "loss": 0.0094, + "step": 207940 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014262982377365532, + "loss": 0.0067, + "step": 207950 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014262225608064133, + "loss": 0.0103, + "step": 207960 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426146883876273, + "loss": 0.0124, + "step": 207970 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426071206946133, + "loss": 0.0103, + "step": 207980 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425995530015993, + "loss": 0.0123, + "step": 207990 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014259198530858528, + "loss": 0.0099, + "step": 208000 + }, + { + "epoch": 1.05, + "eval_cer": 0.914462492734159, + "eval_loss": 0.007478554733097553, + "eval_runtime": 116.5491, + "eval_samples_per_second": 17.16, + "eval_steps_per_second": 4.29, + "step": 208000 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014258441761557126, + "loss": 0.0089, + "step": 208010 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014257684992255727, + "loss": 0.0091, + "step": 208020 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014256928222954325, + "loss": 0.0102, + "step": 208030 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014256171453652923, + "loss": 0.0124, + "step": 208040 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014255414684351524, + "loss": 0.0094, + "step": 208050 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014254657915050122, + "loss": 0.0114, + "step": 208060 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425390114574872, + "loss": 0.0101, + "step": 208070 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014253144376447321, + "loss": 0.0103, + "step": 208080 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425238760714592, + "loss": 0.0097, + "step": 208090 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014251630837844518, + "loss": 0.0104, + "step": 208100 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014250874068543116, + "loss": 0.0063, + "step": 208110 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014250117299241717, + "loss": 0.0083, + "step": 208120 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014249360529940315, + "loss": 0.0105, + "step": 208130 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014248603760638913, + "loss": 0.0079, + "step": 208140 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014247846991337514, + "loss": 0.0078, + "step": 208150 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014247090222036112, + "loss": 0.0098, + "step": 208160 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001424633345273471, + "loss": 0.0111, + "step": 208170 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001424557668343331, + "loss": 0.0083, + "step": 208180 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001424481991413191, + "loss": 0.012, + "step": 208190 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014244063144830507, + "loss": 0.0108, + "step": 208200 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014243306375529108, + "loss": 0.009, + "step": 208210 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014242549606227706, + "loss": 0.0089, + "step": 208220 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014241792836926304, + "loss": 0.0125, + "step": 208230 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014241036067624905, + "loss": 0.0098, + "step": 208240 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014240279298323503, + "loss": 0.009, + "step": 208250 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014239522529022102, + "loss": 0.0093, + "step": 208260 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142387657597207, + "loss": 0.013, + "step": 208270 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142380089904193, + "loss": 0.0104, + "step": 208280 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142372522211179, + "loss": 0.0098, + "step": 208290 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014236495451816497, + "loss": 0.0077, + "step": 208300 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014235738682515098, + "loss": 0.0093, + "step": 208310 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014234981913213696, + "loss": 0.0101, + "step": 208320 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014234225143912294, + "loss": 0.0102, + "step": 208330 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014233468374610892, + "loss": 0.0098, + "step": 208340 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001423271160530949, + "loss": 0.0086, + "step": 208350 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001423195483600809, + "loss": 0.0099, + "step": 208360 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001423119806670669, + "loss": 0.0088, + "step": 208370 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014230441297405287, + "loss": 0.0103, + "step": 208380 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014229684528103888, + "loss": 0.0084, + "step": 208390 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014228927758802486, + "loss": 0.008, + "step": 208400 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014228170989501085, + "loss": 0.0097, + "step": 208410 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014227414220199685, + "loss": 0.0105, + "step": 208420 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014226657450898284, + "loss": 0.0115, + "step": 208430 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014225900681596882, + "loss": 0.0103, + "step": 208440 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014225143912295483, + "loss": 0.0077, + "step": 208450 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001422438714299408, + "loss": 0.0081, + "step": 208460 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001422363037369268, + "loss": 0.0084, + "step": 208470 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014222873604391277, + "loss": 0.0094, + "step": 208480 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014222116835089878, + "loss": 0.0106, + "step": 208490 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014221360065788476, + "loss": 0.011, + "step": 208500 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014220603296487074, + "loss": 0.0101, + "step": 208510 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014219846527185675, + "loss": 0.0084, + "step": 208520 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014219089757884273, + "loss": 0.0089, + "step": 208530 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014218332988582871, + "loss": 0.0106, + "step": 208540 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014217576219281472, + "loss": 0.0099, + "step": 208550 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421681944998007, + "loss": 0.0105, + "step": 208560 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014216062680678668, + "loss": 0.0086, + "step": 208570 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421530591137727, + "loss": 0.0098, + "step": 208580 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014214549142075867, + "loss": 0.0095, + "step": 208590 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014213792372774466, + "loss": 0.0087, + "step": 208600 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014213035603473066, + "loss": 0.0097, + "step": 208610 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014212278834171665, + "loss": 0.0065, + "step": 208620 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014211522064870263, + "loss": 0.0101, + "step": 208630 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421076529556886, + "loss": 0.009, + "step": 208640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014210008526267462, + "loss": 0.0104, + "step": 208650 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001420925175696606, + "loss": 0.0093, + "step": 208660 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014208494987664658, + "loss": 0.0093, + "step": 208670 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001420773821836326, + "loss": 0.0112, + "step": 208680 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014206981449061857, + "loss": 0.013, + "step": 208690 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014206224679760455, + "loss": 0.0088, + "step": 208700 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014205467910459056, + "loss": 0.0131, + "step": 208710 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014204711141157654, + "loss": 0.0113, + "step": 208720 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014203954371856252, + "loss": 0.0116, + "step": 208730 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014203197602554853, + "loss": 0.0124, + "step": 208740 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014202440833253451, + "loss": 0.0093, + "step": 208750 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001420168406395205, + "loss": 0.0103, + "step": 208760 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001420092729465065, + "loss": 0.0074, + "step": 208770 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014200170525349249, + "loss": 0.0122, + "step": 208780 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014199413756047847, + "loss": 0.0095, + "step": 208790 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014198656986746445, + "loss": 0.0081, + "step": 208800 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014197900217445046, + "loss": 0.0091, + "step": 208810 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014197143448143644, + "loss": 0.0103, + "step": 208820 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014196386678842242, + "loss": 0.0089, + "step": 208830 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014195629909540843, + "loss": 0.0094, + "step": 208840 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001419487314023944, + "loss": 0.0091, + "step": 208850 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001419411637093804, + "loss": 0.0089, + "step": 208860 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001419335960163664, + "loss": 0.0081, + "step": 208870 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014192602832335238, + "loss": 0.0148, + "step": 208880 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014191846063033836, + "loss": 0.0094, + "step": 208890 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014191089293732437, + "loss": 0.0084, + "step": 208900 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014190332524431035, + "loss": 0.0106, + "step": 208910 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014189575755129633, + "loss": 0.0091, + "step": 208920 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014188818985828234, + "loss": 0.0083, + "step": 208930 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014188062216526832, + "loss": 0.0083, + "step": 208940 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001418730544722543, + "loss": 0.01, + "step": 208950 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001418654867792403, + "loss": 0.0115, + "step": 208960 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014185791908622627, + "loss": 0.008, + "step": 208970 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014185035139321228, + "loss": 0.0119, + "step": 208980 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014184278370019826, + "loss": 0.0087, + "step": 208990 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014183521600718424, + "loss": 0.0099, + "step": 209000 + }, + { + "epoch": 1.05, + "eval_cer": 0.9144392032271493, + "eval_loss": 0.007373651955276728, + "eval_runtime": 116.5945, + "eval_samples_per_second": 17.153, + "eval_steps_per_second": 4.288, + "step": 209000 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014182764831417022, + "loss": 0.0091, + "step": 209010 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014182008062115623, + "loss": 0.0088, + "step": 209020 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001418125129281422, + "loss": 0.0083, + "step": 209030 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001418049452351282, + "loss": 0.0102, + "step": 209040 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001417973775421142, + "loss": 0.0074, + "step": 209050 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014178980984910018, + "loss": 0.009, + "step": 209060 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014178224215608616, + "loss": 0.009, + "step": 209070 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014177467446307217, + "loss": 0.013, + "step": 209080 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014176710677005815, + "loss": 0.0084, + "step": 209090 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014175953907704414, + "loss": 0.011, + "step": 209100 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014175197138403014, + "loss": 0.0112, + "step": 209110 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014174440369101613, + "loss": 0.0117, + "step": 209120 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001417368359980021, + "loss": 0.0101, + "step": 209130 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014172926830498812, + "loss": 0.0091, + "step": 209140 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001417217006119741, + "loss": 0.0108, + "step": 209150 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014171413291896008, + "loss": 0.0111, + "step": 209160 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014170656522594606, + "loss": 0.0086, + "step": 209170 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014169899753293207, + "loss": 0.0101, + "step": 209180 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014169142983991805, + "loss": 0.0112, + "step": 209190 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014168386214690403, + "loss": 0.009, + "step": 209200 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014167629445389004, + "loss": 0.0101, + "step": 209210 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014166872676087602, + "loss": 0.0079, + "step": 209220 + }, + { + "epoch": 1.06, + "learning_rate": 0.000141661159067862, + "loss": 0.0108, + "step": 209230 + }, + { + "epoch": 1.06, + "learning_rate": 0.000141653591374848, + "loss": 0.0091, + "step": 209240 + }, + { + "epoch": 1.06, + "learning_rate": 0.000141646023681834, + "loss": 0.0077, + "step": 209250 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014163845598881997, + "loss": 0.0073, + "step": 209260 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014163088829580598, + "loss": 0.0113, + "step": 209270 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014162332060279196, + "loss": 0.0108, + "step": 209280 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014161575290977795, + "loss": 0.0126, + "step": 209290 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014160818521676395, + "loss": 0.0086, + "step": 209300 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014160061752374994, + "loss": 0.0106, + "step": 209310 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014159304983073592, + "loss": 0.0108, + "step": 209320 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014158548213772193, + "loss": 0.0098, + "step": 209330 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415779144447079, + "loss": 0.0079, + "step": 209340 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415703467516939, + "loss": 0.0123, + "step": 209350 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014156277905867987, + "loss": 0.0092, + "step": 209360 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014155521136566588, + "loss": 0.009, + "step": 209370 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014154764367265186, + "loss": 0.0084, + "step": 209380 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014154007597963784, + "loss": 0.0098, + "step": 209390 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014153250828662385, + "loss": 0.0075, + "step": 209400 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014152494059360983, + "loss": 0.0126, + "step": 209410 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415173729005958, + "loss": 0.0083, + "step": 209420 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014150980520758182, + "loss": 0.0083, + "step": 209430 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415022375145678, + "loss": 0.0101, + "step": 209440 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014149466982155378, + "loss": 0.0079, + "step": 209450 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414871021285398, + "loss": 0.0138, + "step": 209460 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014147953443552577, + "loss": 0.0088, + "step": 209470 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014147196674251176, + "loss": 0.0156, + "step": 209480 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014146439904949776, + "loss": 0.0086, + "step": 209490 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014145683135648375, + "loss": 0.0108, + "step": 209500 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014144926366346973, + "loss": 0.009, + "step": 209510 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414416959704557, + "loss": 0.0106, + "step": 209520 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014143412827744172, + "loss": 0.0093, + "step": 209530 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414265605844277, + "loss": 0.0105, + "step": 209540 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014141899289141368, + "loss": 0.0113, + "step": 209550 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414114251983997, + "loss": 0.0101, + "step": 209560 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014140385750538567, + "loss": 0.0099, + "step": 209570 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014139628981237165, + "loss": 0.0094, + "step": 209580 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014138872211935763, + "loss": 0.0097, + "step": 209590 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014138115442634361, + "loss": 0.0095, + "step": 209600 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014137358673332962, + "loss": 0.0104, + "step": 209610 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001413660190403156, + "loss": 0.0102, + "step": 209620 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014135845134730159, + "loss": 0.009, + "step": 209630 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001413508836542876, + "loss": 0.0112, + "step": 209640 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014134331596127358, + "loss": 0.0083, + "step": 209650 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014133574826825956, + "loss": 0.0105, + "step": 209660 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014132818057524557, + "loss": 0.0095, + "step": 209670 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014132061288223155, + "loss": 0.0081, + "step": 209680 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014131304518921753, + "loss": 0.0107, + "step": 209690 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001413054774962035, + "loss": 0.0095, + "step": 209700 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014129790980318952, + "loss": 0.0076, + "step": 209710 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001412903421101755, + "loss": 0.0125, + "step": 209720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014128277441716148, + "loss": 0.0078, + "step": 209730 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001412752067241475, + "loss": 0.0087, + "step": 209740 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014126763903113347, + "loss": 0.0124, + "step": 209750 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014126007133811945, + "loss": 0.0092, + "step": 209760 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014125250364510546, + "loss": 0.0086, + "step": 209770 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014124493595209144, + "loss": 0.01, + "step": 209780 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014123736825907742, + "loss": 0.0099, + "step": 209790 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014122980056606343, + "loss": 0.0079, + "step": 209800 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014122223287304941, + "loss": 0.0103, + "step": 209810 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001412146651800354, + "loss": 0.0087, + "step": 209820 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001412070974870214, + "loss": 0.0104, + "step": 209830 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014119952979400739, + "loss": 0.0092, + "step": 209840 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014119196210099337, + "loss": 0.0096, + "step": 209850 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014118439440797938, + "loss": 0.0099, + "step": 209860 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014117682671496536, + "loss": 0.0093, + "step": 209870 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014116925902195134, + "loss": 0.0096, + "step": 209880 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014116169132893732, + "loss": 0.0094, + "step": 209890 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014115412363592333, + "loss": 0.0088, + "step": 209900 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001411465559429093, + "loss": 0.0095, + "step": 209910 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001411389882498953, + "loss": 0.0077, + "step": 209920 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001411314205568813, + "loss": 0.0087, + "step": 209930 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014112385286386728, + "loss": 0.0095, + "step": 209940 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014111628517085326, + "loss": 0.0092, + "step": 209950 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014110871747783927, + "loss": 0.0087, + "step": 209960 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014110114978482525, + "loss": 0.0097, + "step": 209970 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014109358209181123, + "loss": 0.01, + "step": 209980 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014108601439879724, + "loss": 0.0225, + "step": 209990 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014107844670578322, + "loss": 0.0091, + "step": 210000 + }, + { + "epoch": 1.06, + "eval_cer": 0.9144906342217957, + "eval_loss": 0.007647486869245768, + "eval_runtime": 116.648, + "eval_samples_per_second": 17.146, + "eval_steps_per_second": 4.286, + "step": 210000 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001410708790127692, + "loss": 0.0109, + "step": 210010 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014106331131975521, + "loss": 0.0083, + "step": 210020 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001410557436267412, + "loss": 0.0113, + "step": 210030 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014104817593372718, + "loss": 0.0092, + "step": 210040 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014104060824071316, + "loss": 0.0101, + "step": 210050 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014103304054769917, + "loss": 0.0109, + "step": 210060 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014102547285468515, + "loss": 0.0098, + "step": 210070 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014101790516167113, + "loss": 0.0081, + "step": 210080 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014101033746865714, + "loss": 0.0111, + "step": 210090 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014100276977564312, + "loss": 0.0109, + "step": 210100 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001409952020826291, + "loss": 0.0108, + "step": 210110 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001409876343896151, + "loss": 0.0102, + "step": 210120 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001409800666966011, + "loss": 0.0094, + "step": 210130 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014097249900358707, + "loss": 0.0098, + "step": 210140 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014096493131057308, + "loss": 0.0104, + "step": 210150 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014095736361755906, + "loss": 0.01, + "step": 210160 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014094979592454504, + "loss": 0.0112, + "step": 210170 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014094222823153105, + "loss": 0.0093, + "step": 210180 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014093466053851703, + "loss": 0.0105, + "step": 210190 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014092709284550302, + "loss": 0.0095, + "step": 210200 + }, + { + "epoch": 1.06, + "learning_rate": 0.000140919525152489, + "loss": 0.0093, + "step": 210210 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014091195745947498, + "loss": 0.0089, + "step": 210220 + }, + { + "epoch": 1.06, + "learning_rate": 0.000140904389766461, + "loss": 0.0156, + "step": 210230 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014089682207344697, + "loss": 0.0098, + "step": 210240 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014088925438043295, + "loss": 0.01, + "step": 210250 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014088168668741893, + "loss": 0.0125, + "step": 210260 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014087411899440494, + "loss": 0.0105, + "step": 210270 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014086655130139092, + "loss": 0.0102, + "step": 210280 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001408589836083769, + "loss": 0.01, + "step": 210290 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001408514159153629, + "loss": 0.0079, + "step": 210300 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001408438482223489, + "loss": 0.0105, + "step": 210310 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014083628052933487, + "loss": 0.009, + "step": 210320 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014082871283632088, + "loss": 0.0118, + "step": 210330 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014082114514330686, + "loss": 0.0084, + "step": 210340 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014081357745029285, + "loss": 0.0083, + "step": 210350 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014080600975727885, + "loss": 0.0102, + "step": 210360 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014079844206426484, + "loss": 0.0113, + "step": 210370 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014079087437125082, + "loss": 0.0101, + "step": 210380 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014078330667823683, + "loss": 0.0134, + "step": 210390 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001407757389852228, + "loss": 0.011, + "step": 210400 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001407681712922088, + "loss": 0.0121, + "step": 210410 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014076060359919477, + "loss": 0.0101, + "step": 210420 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014075303590618078, + "loss": 0.0126, + "step": 210430 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014074546821316676, + "loss": 0.0097, + "step": 210440 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014073790052015274, + "loss": 0.0095, + "step": 210450 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014073033282713875, + "loss": 0.0101, + "step": 210460 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014072276513412473, + "loss": 0.01, + "step": 210470 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001407151974411107, + "loss": 0.0102, + "step": 210480 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014070762974809672, + "loss": 0.0087, + "step": 210490 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001407000620550827, + "loss": 0.0109, + "step": 210500 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014069249436206868, + "loss": 0.0092, + "step": 210510 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001406849266690547, + "loss": 0.0097, + "step": 210520 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014067735897604067, + "loss": 0.013, + "step": 210530 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014066979128302666, + "loss": 0.0165, + "step": 210540 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014066222359001266, + "loss": 0.0072, + "step": 210550 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014065465589699865, + "loss": 0.0083, + "step": 210560 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014064708820398463, + "loss": 0.0121, + "step": 210570 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001406395205109706, + "loss": 0.015, + "step": 210580 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014063195281795662, + "loss": 0.0078, + "step": 210590 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001406243851249426, + "loss": 0.0099, + "step": 210600 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014061681743192858, + "loss": 0.0099, + "step": 210610 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001406092497389146, + "loss": 0.014, + "step": 210620 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014060168204590057, + "loss": 0.0131, + "step": 210630 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014059411435288655, + "loss": 0.0093, + "step": 210640 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014058654665987256, + "loss": 0.0087, + "step": 210650 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014057897896685854, + "loss": 0.0119, + "step": 210660 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014057141127384452, + "loss": 0.0101, + "step": 210670 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014056384358083053, + "loss": 0.0075, + "step": 210680 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001405562758878165, + "loss": 0.0092, + "step": 210690 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001405487081948025, + "loss": 0.0096, + "step": 210700 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001405411405017885, + "loss": 0.0082, + "step": 210710 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014053357280877448, + "loss": 0.0101, + "step": 210720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014052600511576047, + "loss": 0.0101, + "step": 210730 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014051843742274645, + "loss": 0.0113, + "step": 210740 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014051086972973246, + "loss": 0.0096, + "step": 210750 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014050330203671844, + "loss": 0.0093, + "step": 210760 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014049573434370442, + "loss": 0.0104, + "step": 210770 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014048816665069043, + "loss": 0.0125, + "step": 210780 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001404805989576764, + "loss": 0.0119, + "step": 210790 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001404730312646624, + "loss": 0.0085, + "step": 210800 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001404654635716484, + "loss": 0.0099, + "step": 210810 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014045789587863438, + "loss": 0.0119, + "step": 210820 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014045032818562036, + "loss": 0.0098, + "step": 210830 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014044276049260637, + "loss": 0.0094, + "step": 210840 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014043519279959232, + "loss": 0.01, + "step": 210850 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014042762510657833, + "loss": 0.0094, + "step": 210860 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014042005741356431, + "loss": 0.0128, + "step": 210870 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001404124897205503, + "loss": 0.0098, + "step": 210880 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001404049220275363, + "loss": 0.0099, + "step": 210890 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014039735433452229, + "loss": 0.0095, + "step": 210900 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014038978664150827, + "loss": 0.0107, + "step": 210910 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014038221894849428, + "loss": 0.0099, + "step": 210920 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014037465125548026, + "loss": 0.0076, + "step": 210930 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014036708356246624, + "loss": 0.0091, + "step": 210940 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014035951586945222, + "loss": 0.0105, + "step": 210950 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014035194817643823, + "loss": 0.0111, + "step": 210960 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001403443804834242, + "loss": 0.009, + "step": 210970 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001403368127904102, + "loss": 0.0084, + "step": 210980 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001403292450973962, + "loss": 0.0102, + "step": 210990 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014032167740438218, + "loss": 0.0079, + "step": 211000 + }, + { + "epoch": 1.06, + "eval_cer": 0.9144489071884033, + "eval_loss": 0.007559832185506821, + "eval_runtime": 116.7132, + "eval_samples_per_second": 17.136, + "eval_steps_per_second": 4.284, + "step": 211000 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014031410971136816, + "loss": 0.0094, + "step": 211010 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014030654201835417, + "loss": 0.007, + "step": 211020 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014029897432534015, + "loss": 0.0098, + "step": 211030 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014029140663232613, + "loss": 0.0085, + "step": 211040 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014028383893931214, + "loss": 0.0104, + "step": 211050 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014027627124629812, + "loss": 0.0095, + "step": 211060 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001402687035532841, + "loss": 0.0108, + "step": 211070 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014026113586027011, + "loss": 0.0105, + "step": 211080 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001402535681672561, + "loss": 0.0102, + "step": 211090 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014024600047424208, + "loss": 0.0092, + "step": 211100 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014023843278122806, + "loss": 0.0088, + "step": 211110 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014023086508821407, + "loss": 0.0097, + "step": 211120 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014022329739520005, + "loss": 0.0097, + "step": 211130 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014021572970218603, + "loss": 0.0087, + "step": 211140 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014020816200917204, + "loss": 0.0081, + "step": 211150 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014020059431615802, + "loss": 0.0103, + "step": 211160 + }, + { + "epoch": 1.07, + "learning_rate": 0.000140193026623144, + "loss": 0.0095, + "step": 211170 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014018545893013, + "loss": 0.0075, + "step": 211180 + }, + { + "epoch": 1.07, + "learning_rate": 0.000140177891237116, + "loss": 0.0091, + "step": 211190 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014017032354410197, + "loss": 0.0087, + "step": 211200 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014016275585108798, + "loss": 0.0076, + "step": 211210 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014015518815807396, + "loss": 0.0115, + "step": 211220 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014014762046505994, + "loss": 0.0077, + "step": 211230 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014014005277204595, + "loss": 0.0172, + "step": 211240 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014013248507903193, + "loss": 0.0111, + "step": 211250 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014012491738601792, + "loss": 0.0101, + "step": 211260 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014011734969300392, + "loss": 0.009, + "step": 211270 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001401097819999899, + "loss": 0.0107, + "step": 211280 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001401022143069759, + "loss": 0.0101, + "step": 211290 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014009464661396187, + "loss": 0.013, + "step": 211300 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014008707892094788, + "loss": 0.0092, + "step": 211310 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014007951122793386, + "loss": 0.0118, + "step": 211320 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014007194353491984, + "loss": 0.0099, + "step": 211330 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014006437584190585, + "loss": 0.0117, + "step": 211340 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014005680814889183, + "loss": 0.0106, + "step": 211350 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001400492404558778, + "loss": 0.0111, + "step": 211360 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014004167276286382, + "loss": 0.0088, + "step": 211370 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001400341050698498, + "loss": 0.0115, + "step": 211380 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014002653737683578, + "loss": 0.007, + "step": 211390 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001400189696838218, + "loss": 0.0085, + "step": 211400 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014001140199080777, + "loss": 0.0162, + "step": 211410 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014000383429779375, + "loss": 0.0088, + "step": 211420 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013999626660477976, + "loss": 0.0105, + "step": 211430 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013998869891176574, + "loss": 0.0104, + "step": 211440 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013998113121875173, + "loss": 0.0086, + "step": 211450 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001399735635257377, + "loss": 0.0093, + "step": 211460 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013996599583272372, + "loss": 0.0095, + "step": 211470 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013995842813970967, + "loss": 0.0097, + "step": 211480 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013995086044669568, + "loss": 0.0084, + "step": 211490 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013994329275368166, + "loss": 0.0121, + "step": 211500 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013993572506066764, + "loss": 0.0091, + "step": 211510 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013992815736765365, + "loss": 0.0091, + "step": 211520 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013992058967463963, + "loss": 0.0084, + "step": 211530 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001399130219816256, + "loss": 0.0105, + "step": 211540 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013990545428861162, + "loss": 0.0091, + "step": 211550 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001398978865955976, + "loss": 0.0082, + "step": 211560 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013989031890258358, + "loss": 0.0087, + "step": 211570 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001398827512095696, + "loss": 0.0094, + "step": 211580 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013987518351655557, + "loss": 0.0098, + "step": 211590 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013986761582354156, + "loss": 0.0127, + "step": 211600 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013986004813052756, + "loss": 0.0097, + "step": 211610 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013985248043751355, + "loss": 0.0116, + "step": 211620 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013984491274449953, + "loss": 0.0083, + "step": 211630 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001398373450514855, + "loss": 0.0101, + "step": 211640 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013982977735847152, + "loss": 0.0079, + "step": 211650 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001398222096654575, + "loss": 0.0109, + "step": 211660 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013981464197244348, + "loss": 0.0093, + "step": 211670 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001398070742794295, + "loss": 0.0078, + "step": 211680 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013979950658641547, + "loss": 0.0087, + "step": 211690 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013979193889340145, + "loss": 0.0092, + "step": 211700 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013978437120038746, + "loss": 0.0094, + "step": 211710 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013977680350737344, + "loss": 0.0116, + "step": 211720 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013976923581435942, + "loss": 0.0111, + "step": 211730 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013976166812134543, + "loss": 0.0111, + "step": 211740 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001397541004283314, + "loss": 0.0112, + "step": 211750 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001397465327353174, + "loss": 0.0094, + "step": 211760 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001397389650423034, + "loss": 0.0097, + "step": 211770 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013973139734928938, + "loss": 0.0104, + "step": 211780 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013972382965627537, + "loss": 0.0141, + "step": 211790 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013971626196326137, + "loss": 0.0092, + "step": 211800 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013970869427024736, + "loss": 0.0089, + "step": 211810 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013970112657723334, + "loss": 0.0092, + "step": 211820 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013969355888421932, + "loss": 0.0103, + "step": 211830 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013968599119120533, + "loss": 0.011, + "step": 211840 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001396784234981913, + "loss": 0.0109, + "step": 211850 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001396708558051773, + "loss": 0.0123, + "step": 211860 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001396632881121633, + "loss": 0.0113, + "step": 211870 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013965572041914928, + "loss": 0.0112, + "step": 211880 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013964815272613526, + "loss": 0.0076, + "step": 211890 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013964058503312127, + "loss": 0.0117, + "step": 211900 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013963301734010725, + "loss": 0.0105, + "step": 211910 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013962544964709323, + "loss": 0.0103, + "step": 211920 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013961788195407924, + "loss": 0.0105, + "step": 211930 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013961031426106522, + "loss": 0.0103, + "step": 211940 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001396027465680512, + "loss": 0.0091, + "step": 211950 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001395951788750372, + "loss": 0.0099, + "step": 211960 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001395876111820232, + "loss": 0.0086, + "step": 211970 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013958004348900918, + "loss": 0.0117, + "step": 211980 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013957247579599516, + "loss": 0.0097, + "step": 211990 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013956490810298117, + "loss": 0.009, + "step": 212000 + }, + { + "epoch": 1.07, + "eval_cer": 0.9144615223380336, + "eval_loss": 0.007792965974658728, + "eval_runtime": 116.6797, + "eval_samples_per_second": 17.141, + "eval_steps_per_second": 4.285, + "step": 212000 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013955734040996715, + "loss": 0.01, + "step": 212010 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013954977271695313, + "loss": 0.0111, + "step": 212020 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013954220502393914, + "loss": 0.0078, + "step": 212030 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013953463733092512, + "loss": 0.0154, + "step": 212040 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001395270696379111, + "loss": 0.009, + "step": 212050 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001395195019448971, + "loss": 0.0109, + "step": 212060 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001395119342518831, + "loss": 0.0071, + "step": 212070 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013950436655886907, + "loss": 0.0102, + "step": 212080 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013949679886585508, + "loss": 0.0083, + "step": 212090 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013948923117284103, + "loss": 0.0074, + "step": 212100 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013948166347982704, + "loss": 0.0102, + "step": 212110 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013947409578681302, + "loss": 0.0092, + "step": 212120 + }, + { + "epoch": 1.07, + "learning_rate": 0.000139466528093799, + "loss": 0.0087, + "step": 212130 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013945896040078501, + "loss": 0.0122, + "step": 212140 + }, + { + "epoch": 1.07, + "learning_rate": 0.000139451392707771, + "loss": 0.0086, + "step": 212150 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013944382501475698, + "loss": 0.0102, + "step": 212160 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013943625732174299, + "loss": 0.0089, + "step": 212170 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013942868962872897, + "loss": 0.0081, + "step": 212180 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013942112193571495, + "loss": 0.0097, + "step": 212190 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013941355424270093, + "loss": 0.0098, + "step": 212200 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013940598654968694, + "loss": 0.0124, + "step": 212210 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013939841885667292, + "loss": 0.011, + "step": 212220 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001393908511636589, + "loss": 0.0101, + "step": 212230 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001393832834706449, + "loss": 0.0108, + "step": 212240 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001393757157776309, + "loss": 0.0095, + "step": 212250 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013936814808461687, + "loss": 0.0105, + "step": 212260 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013936058039160288, + "loss": 0.0098, + "step": 212270 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013935301269858886, + "loss": 0.0075, + "step": 212280 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013934544500557484, + "loss": 0.0106, + "step": 212290 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013933787731256085, + "loss": 0.0093, + "step": 212300 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013933030961954683, + "loss": 0.008, + "step": 212310 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013932274192653282, + "loss": 0.0113, + "step": 212320 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013931517423351882, + "loss": 0.0079, + "step": 212330 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001393076065405048, + "loss": 0.0082, + "step": 212340 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001393000388474908, + "loss": 0.0122, + "step": 212350 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013929247115447677, + "loss": 0.0092, + "step": 212360 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013928490346146278, + "loss": 0.0092, + "step": 212370 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013927733576844876, + "loss": 0.0103, + "step": 212380 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013926976807543474, + "loss": 0.0097, + "step": 212390 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013926220038242075, + "loss": 0.0068, + "step": 212400 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013925463268940673, + "loss": 0.0106, + "step": 212410 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001392470649963927, + "loss": 0.0112, + "step": 212420 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013923949730337872, + "loss": 0.0102, + "step": 212430 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001392319296103647, + "loss": 0.0103, + "step": 212440 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013922436191735068, + "loss": 0.0139, + "step": 212450 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001392167942243367, + "loss": 0.0087, + "step": 212460 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013920922653132267, + "loss": 0.0097, + "step": 212470 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013920165883830865, + "loss": 0.0112, + "step": 212480 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013919409114529466, + "loss": 0.01, + "step": 212490 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013918652345228064, + "loss": 0.0118, + "step": 212500 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013917895575926663, + "loss": 0.0118, + "step": 212510 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001391713880662526, + "loss": 0.0086, + "step": 212520 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013916382037323862, + "loss": 0.0085, + "step": 212530 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001391562526802246, + "loss": 0.011, + "step": 212540 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013914868498721058, + "loss": 0.0089, + "step": 212550 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001391411172941966, + "loss": 0.01, + "step": 212560 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013913354960118257, + "loss": 0.0079, + "step": 212570 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013912598190816855, + "loss": 0.0084, + "step": 212580 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013911841421515456, + "loss": 0.0101, + "step": 212590 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013911084652214054, + "loss": 0.0097, + "step": 212600 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013910327882912652, + "loss": 0.0119, + "step": 212610 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013909571113611253, + "loss": 0.0095, + "step": 212620 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001390881434430985, + "loss": 0.0101, + "step": 212630 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001390805757500845, + "loss": 0.0093, + "step": 212640 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001390730080570705, + "loss": 0.0093, + "step": 212650 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013906544036405648, + "loss": 0.0098, + "step": 212660 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013905787267104246, + "loss": 0.0101, + "step": 212670 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013905030497802845, + "loss": 0.011, + "step": 212680 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013904273728501445, + "loss": 0.0094, + "step": 212690 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013903516959200044, + "loss": 0.0106, + "step": 212700 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013902760189898642, + "loss": 0.0072, + "step": 212710 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013902003420597243, + "loss": 0.0092, + "step": 212720 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013901246651295838, + "loss": 0.0094, + "step": 212730 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001390048988199444, + "loss": 0.0127, + "step": 212740 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013899733112693037, + "loss": 0.0099, + "step": 212750 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013898976343391635, + "loss": 0.009, + "step": 212760 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013898219574090236, + "loss": 0.0123, + "step": 212770 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013897462804788834, + "loss": 0.0099, + "step": 212780 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013896706035487432, + "loss": 0.0091, + "step": 212790 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013895949266186033, + "loss": 0.011, + "step": 212800 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001389519249688463, + "loss": 0.0112, + "step": 212810 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001389443572758323, + "loss": 0.0082, + "step": 212820 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001389367895828183, + "loss": 0.0075, + "step": 212830 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013892922188980428, + "loss": 0.0085, + "step": 212840 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013892165419679027, + "loss": 0.0108, + "step": 212850 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013891408650377627, + "loss": 0.0089, + "step": 212860 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013890651881076226, + "loss": 0.0096, + "step": 212870 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013889895111774824, + "loss": 0.0092, + "step": 212880 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013889138342473422, + "loss": 0.0083, + "step": 212890 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013888381573172023, + "loss": 0.0085, + "step": 212900 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001388762480387062, + "loss": 0.011, + "step": 212910 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001388686803456922, + "loss": 0.0089, + "step": 212920 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001388611126526782, + "loss": 0.0129, + "step": 212930 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013885354495966418, + "loss": 0.0093, + "step": 212940 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013884597726665016, + "loss": 0.0101, + "step": 212950 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013883840957363617, + "loss": 0.0133, + "step": 212960 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013883084188062215, + "loss": 0.0119, + "step": 212970 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013882327418760813, + "loss": 0.0106, + "step": 212980 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013881570649459414, + "loss": 0.0077, + "step": 212990 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013880813880158012, + "loss": 0.0184, + "step": 213000 + }, + { + "epoch": 1.07, + "eval_cer": 0.914481900656667, + "eval_loss": 0.007489955984055996, + "eval_runtime": 116.6491, + "eval_samples_per_second": 17.145, + "eval_steps_per_second": 4.286, + "step": 213000 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001388005711085661, + "loss": 0.011, + "step": 213010 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001387930034155521, + "loss": 0.0117, + "step": 213020 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001387854357225381, + "loss": 0.0105, + "step": 213030 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013877786802952408, + "loss": 0.0092, + "step": 213040 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013877030033651006, + "loss": 0.0097, + "step": 213050 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013876273264349607, + "loss": 0.0091, + "step": 213060 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013875516495048205, + "loss": 0.0091, + "step": 213070 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013874759725746803, + "loss": 0.0087, + "step": 213080 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013874002956445404, + "loss": 0.0087, + "step": 213090 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013873246187144002, + "loss": 0.0103, + "step": 213100 + }, + { + "epoch": 1.08, + "learning_rate": 0.000138724894178426, + "loss": 0.0094, + "step": 213110 + }, + { + "epoch": 1.08, + "learning_rate": 0.000138717326485412, + "loss": 0.0111, + "step": 213120 + }, + { + "epoch": 1.08, + "learning_rate": 0.000138709758792398, + "loss": 0.0108, + "step": 213130 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013870219109938397, + "loss": 0.0071, + "step": 213140 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013869462340636998, + "loss": 0.0082, + "step": 213150 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013868705571335596, + "loss": 0.0103, + "step": 213160 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013867948802034194, + "loss": 0.0134, + "step": 213170 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013867192032732795, + "loss": 0.0127, + "step": 213180 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013866435263431393, + "loss": 0.0096, + "step": 213190 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013865678494129991, + "loss": 0.0091, + "step": 213200 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013864921724828592, + "loss": 0.0071, + "step": 213210 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001386416495552719, + "loss": 0.0107, + "step": 213220 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013863408186225789, + "loss": 0.0083, + "step": 213230 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013862651416924387, + "loss": 0.0122, + "step": 213240 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013861894647622988, + "loss": 0.0085, + "step": 213250 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013861137878321586, + "loss": 0.0061, + "step": 213260 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013860381109020184, + "loss": 0.0101, + "step": 213270 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013859624339718785, + "loss": 0.0075, + "step": 213280 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013858867570417383, + "loss": 0.0109, + "step": 213290 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001385811080111598, + "loss": 0.0111, + "step": 213300 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013857354031814582, + "loss": 0.0097, + "step": 213310 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001385659726251318, + "loss": 0.0098, + "step": 213320 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013855840493211778, + "loss": 0.0103, + "step": 213330 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001385508372391038, + "loss": 0.0092, + "step": 213340 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013854326954608977, + "loss": 0.0097, + "step": 213350 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013853570185307575, + "loss": 0.0083, + "step": 213360 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013852813416006173, + "loss": 0.0097, + "step": 213370 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013852056646704772, + "loss": 0.0107, + "step": 213380 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013851299877403372, + "loss": 0.0112, + "step": 213390 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001385054310810197, + "loss": 0.0116, + "step": 213400 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001384978633880057, + "loss": 0.0087, + "step": 213410 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013849029569499167, + "loss": 0.0097, + "step": 213420 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013848272800197768, + "loss": 0.0118, + "step": 213430 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013847516030896366, + "loss": 0.0093, + "step": 213440 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013846759261594964, + "loss": 0.0105, + "step": 213450 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013846002492293565, + "loss": 0.0084, + "step": 213460 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013845245722992163, + "loss": 0.0083, + "step": 213470 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001384448895369076, + "loss": 0.0076, + "step": 213480 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013843732184389362, + "loss": 0.0096, + "step": 213490 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001384297541508796, + "loss": 0.0099, + "step": 213500 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013842218645786558, + "loss": 0.0102, + "step": 213510 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001384146187648516, + "loss": 0.0087, + "step": 213520 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013840705107183757, + "loss": 0.0092, + "step": 213530 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013839948337882355, + "loss": 0.0075, + "step": 213540 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013839191568580956, + "loss": 0.0081, + "step": 213550 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013838434799279554, + "loss": 0.0093, + "step": 213560 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013837678029978153, + "loss": 0.01, + "step": 213570 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001383692126067675, + "loss": 0.01, + "step": 213580 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013836164491375352, + "loss": 0.011, + "step": 213590 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001383540772207395, + "loss": 0.0079, + "step": 213600 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013834650952772548, + "loss": 0.0096, + "step": 213610 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001383389418347115, + "loss": 0.0082, + "step": 213620 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013833137414169747, + "loss": 0.0092, + "step": 213630 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013832380644868345, + "loss": 0.008, + "step": 213640 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013831623875566946, + "loss": 0.0092, + "step": 213650 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013830867106265544, + "loss": 0.0097, + "step": 213660 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013830110336964142, + "loss": 0.0099, + "step": 213670 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013829353567662743, + "loss": 0.0108, + "step": 213680 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001382859679836134, + "loss": 0.0082, + "step": 213690 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001382784002905994, + "loss": 0.0095, + "step": 213700 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001382708325975854, + "loss": 0.0093, + "step": 213710 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013826326490457138, + "loss": 0.009, + "step": 213720 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013825569721155736, + "loss": 0.0087, + "step": 213730 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013824812951854337, + "loss": 0.0094, + "step": 213740 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013824056182552935, + "loss": 0.0098, + "step": 213750 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013823299413251534, + "loss": 0.0118, + "step": 213760 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013822542643950132, + "loss": 0.0106, + "step": 213770 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013821785874648733, + "loss": 0.0091, + "step": 213780 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001382102910534733, + "loss": 0.01, + "step": 213790 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001382027233604593, + "loss": 0.0074, + "step": 213800 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001381951556674453, + "loss": 0.0104, + "step": 213810 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013818758797443128, + "loss": 0.0124, + "step": 213820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013818002028141726, + "loss": 0.0092, + "step": 213830 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013817245258840327, + "loss": 0.0077, + "step": 213840 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013816488489538925, + "loss": 0.0114, + "step": 213850 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013815731720237523, + "loss": 0.0116, + "step": 213860 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013814974950936124, + "loss": 0.0092, + "step": 213870 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013814218181634722, + "loss": 0.0102, + "step": 213880 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001381346141233332, + "loss": 0.0085, + "step": 213890 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001381270464303192, + "loss": 0.0094, + "step": 213900 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001381194787373052, + "loss": 0.0079, + "step": 213910 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013811191104429117, + "loss": 0.011, + "step": 213920 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013810434335127716, + "loss": 0.0097, + "step": 213930 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013809677565826316, + "loss": 0.009, + "step": 213940 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013808920796524915, + "loss": 0.0091, + "step": 213950 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013808164027223513, + "loss": 0.0104, + "step": 213960 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013807407257922114, + "loss": 0.0152, + "step": 213970 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013806650488620712, + "loss": 0.0104, + "step": 213980 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001380589371931931, + "loss": 0.0146, + "step": 213990 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013805136950017908, + "loss": 0.0098, + "step": 214000 + }, + { + "epoch": 1.08, + "eval_cer": 0.9144392032271493, + "eval_loss": 0.0074865869246423244, + "eval_runtime": 116.6822, + "eval_samples_per_second": 17.141, + "eval_steps_per_second": 4.285, + "step": 214000 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013804380180716506, + "loss": 0.0103, + "step": 214010 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013803623411415107, + "loss": 0.0094, + "step": 214020 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013802866642113705, + "loss": 0.0128, + "step": 214030 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013802109872812303, + "loss": 0.011, + "step": 214040 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013801353103510904, + "loss": 0.0086, + "step": 214050 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013800596334209502, + "loss": 0.01, + "step": 214060 + }, + { + "epoch": 1.08, + "learning_rate": 0.000137998395649081, + "loss": 0.0124, + "step": 214070 + }, + { + "epoch": 1.08, + "learning_rate": 0.000137990827956067, + "loss": 0.0109, + "step": 214080 + }, + { + "epoch": 1.08, + "learning_rate": 0.000137983260263053, + "loss": 0.0105, + "step": 214090 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013797569257003898, + "loss": 0.0111, + "step": 214100 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013796812487702498, + "loss": 0.0144, + "step": 214110 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013796055718401097, + "loss": 0.0105, + "step": 214120 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013795298949099695, + "loss": 0.008, + "step": 214130 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013794542179798293, + "loss": 0.0092, + "step": 214140 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013793785410496894, + "loss": 0.0135, + "step": 214150 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013793028641195492, + "loss": 0.0098, + "step": 214160 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001379227187189409, + "loss": 0.0086, + "step": 214170 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001379151510259269, + "loss": 0.0082, + "step": 214180 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001379075833329129, + "loss": 0.0113, + "step": 214190 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013790001563989887, + "loss": 0.0094, + "step": 214200 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013789244794688488, + "loss": 0.0099, + "step": 214210 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013788488025387086, + "loss": 0.0116, + "step": 214220 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013787731256085684, + "loss": 0.0084, + "step": 214230 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013786974486784285, + "loss": 0.0087, + "step": 214240 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013786217717482883, + "loss": 0.0097, + "step": 214250 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013785460948181481, + "loss": 0.0086, + "step": 214260 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013784704178880082, + "loss": 0.0096, + "step": 214270 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001378394740957868, + "loss": 0.0099, + "step": 214280 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013783190640277279, + "loss": 0.007, + "step": 214290 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013782433870975877, + "loss": 0.0097, + "step": 214300 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013781677101674478, + "loss": 0.0114, + "step": 214310 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013780920332373076, + "loss": 0.01, + "step": 214320 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013780163563071674, + "loss": 0.0089, + "step": 214330 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013779406793770275, + "loss": 0.009, + "step": 214340 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013778650024468873, + "loss": 0.0087, + "step": 214350 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001377789325516747, + "loss": 0.0122, + "step": 214360 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013777136485866072, + "loss": 0.0096, + "step": 214370 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001377637971656467, + "loss": 0.0093, + "step": 214380 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013775622947263268, + "loss": 0.0081, + "step": 214390 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001377486617796187, + "loss": 0.0103, + "step": 214400 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013774109408660467, + "loss": 0.0087, + "step": 214410 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013773352639359065, + "loss": 0.0113, + "step": 214420 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013772595870057666, + "loss": 0.0092, + "step": 214430 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013771839100756264, + "loss": 0.008, + "step": 214440 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013771082331454862, + "loss": 0.0075, + "step": 214450 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001377032556215346, + "loss": 0.01, + "step": 214460 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013769568792852061, + "loss": 0.0104, + "step": 214470 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001376881202355066, + "loss": 0.0086, + "step": 214480 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013768055254249258, + "loss": 0.0102, + "step": 214490 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013767298484947859, + "loss": 0.014, + "step": 214500 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013766541715646457, + "loss": 0.0109, + "step": 214510 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013765784946345055, + "loss": 0.0106, + "step": 214520 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013765028177043656, + "loss": 0.009, + "step": 214530 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013764271407742254, + "loss": 0.0089, + "step": 214540 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013763514638440852, + "loss": 0.0108, + "step": 214550 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013762757869139453, + "loss": 0.0069, + "step": 214560 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001376200109983805, + "loss": 0.009, + "step": 214570 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001376124433053665, + "loss": 0.0082, + "step": 214580 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001376048756123525, + "loss": 0.011, + "step": 214590 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013759730791933848, + "loss": 0.0095, + "step": 214600 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013758974022632446, + "loss": 0.0083, + "step": 214610 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013758217253331045, + "loss": 0.0088, + "step": 214620 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013757460484029643, + "loss": 0.0087, + "step": 214630 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013756703714728244, + "loss": 0.0103, + "step": 214640 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013755946945426842, + "loss": 0.0119, + "step": 214650 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001375519017612544, + "loss": 0.0121, + "step": 214660 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013754433406824038, + "loss": 0.0101, + "step": 214670 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001375367663752264, + "loss": 0.0107, + "step": 214680 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013752919868221237, + "loss": 0.0103, + "step": 214690 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013752163098919835, + "loss": 0.0136, + "step": 214700 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013751406329618436, + "loss": 0.009, + "step": 214710 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013750649560317034, + "loss": 0.0119, + "step": 214720 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013749892791015632, + "loss": 0.0089, + "step": 214730 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013749136021714233, + "loss": 0.0116, + "step": 214740 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001374837925241283, + "loss": 0.0084, + "step": 214750 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001374762248311143, + "loss": 0.0111, + "step": 214760 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001374686571381003, + "loss": 0.0124, + "step": 214770 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013746108944508628, + "loss": 0.0078, + "step": 214780 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013745352175207227, + "loss": 0.0073, + "step": 214790 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013744595405905827, + "loss": 0.0096, + "step": 214800 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013743838636604426, + "loss": 0.0097, + "step": 214810 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013743081867303024, + "loss": 0.0107, + "step": 214820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013742325098001622, + "loss": 0.0073, + "step": 214830 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013741568328700223, + "loss": 0.0113, + "step": 214840 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001374081155939882, + "loss": 0.0089, + "step": 214850 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001374005479009742, + "loss": 0.0104, + "step": 214860 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001373929802079602, + "loss": 0.0089, + "step": 214870 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013738541251494618, + "loss": 0.0081, + "step": 214880 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013737784482193216, + "loss": 0.0087, + "step": 214890 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013737027712891817, + "loss": 0.0083, + "step": 214900 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013736270943590415, + "loss": 0.0077, + "step": 214910 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013735514174289013, + "loss": 0.0095, + "step": 214920 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013734757404987614, + "loss": 0.0098, + "step": 214930 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013734000635686212, + "loss": 0.0137, + "step": 214940 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001373324386638481, + "loss": 0.0117, + "step": 214950 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001373248709708341, + "loss": 0.0105, + "step": 214960 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001373173032778201, + "loss": 0.0105, + "step": 214970 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013730973558480608, + "loss": 0.0104, + "step": 214980 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013730216789179206, + "loss": 0.0088, + "step": 214990 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013729460019877807, + "loss": 0.0132, + "step": 215000 + }, + { + "epoch": 1.08, + "eval_cer": 0.9144809302605417, + "eval_loss": 0.0071860929019749165, + "eval_runtime": 116.5447, + "eval_samples_per_second": 17.161, + "eval_steps_per_second": 4.29, + "step": 215000 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013728703250576405, + "loss": 0.013, + "step": 215010 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013727946481275003, + "loss": 0.011, + "step": 215020 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013727189711973604, + "loss": 0.0118, + "step": 215030 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013726432942672202, + "loss": 0.0071, + "step": 215040 + }, + { + "epoch": 1.08, + "learning_rate": 0.000137256761733708, + "loss": 0.009, + "step": 215050 + }, + { + "epoch": 1.09, + "learning_rate": 0.000137249194040694, + "loss": 0.0086, + "step": 215060 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013724162634768, + "loss": 0.0097, + "step": 215070 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013723405865466597, + "loss": 0.0097, + "step": 215080 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013722649096165198, + "loss": 0.0091, + "step": 215090 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013721892326863796, + "loss": 0.0101, + "step": 215100 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013721135557562394, + "loss": 0.009, + "step": 215110 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013720378788260995, + "loss": 0.0098, + "step": 215120 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013719622018959593, + "loss": 0.0091, + "step": 215130 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013718865249658191, + "loss": 0.0101, + "step": 215140 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013718108480356792, + "loss": 0.0105, + "step": 215150 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001371735171105539, + "loss": 0.0113, + "step": 215160 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013716594941753989, + "loss": 0.0086, + "step": 215170 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013715838172452587, + "loss": 0.0079, + "step": 215180 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013715081403151188, + "loss": 0.0093, + "step": 215190 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013714324633849786, + "loss": 0.0104, + "step": 215200 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013713567864548384, + "loss": 0.0091, + "step": 215210 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013712811095246985, + "loss": 0.0082, + "step": 215220 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013712054325945583, + "loss": 0.0078, + "step": 215230 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001371129755664418, + "loss": 0.0113, + "step": 215240 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001371054078734278, + "loss": 0.0091, + "step": 215250 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013709784018041377, + "loss": 0.0109, + "step": 215260 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013709027248739978, + "loss": 0.0121, + "step": 215270 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013708270479438576, + "loss": 0.0096, + "step": 215280 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013707513710137174, + "loss": 0.0102, + "step": 215290 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013706756940835775, + "loss": 0.0075, + "step": 215300 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013706000171534373, + "loss": 0.0089, + "step": 215310 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013705243402232972, + "loss": 0.009, + "step": 215320 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013704486632931572, + "loss": 0.0069, + "step": 215330 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001370372986363017, + "loss": 0.0092, + "step": 215340 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001370297309432877, + "loss": 0.0125, + "step": 215350 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013702216325027367, + "loss": 0.0107, + "step": 215360 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013701459555725968, + "loss": 0.0099, + "step": 215370 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013700702786424566, + "loss": 0.0116, + "step": 215380 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013699946017123164, + "loss": 0.0101, + "step": 215390 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013699189247821765, + "loss": 0.009, + "step": 215400 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013698432478520363, + "loss": 0.0079, + "step": 215410 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001369767570921896, + "loss": 0.014, + "step": 215420 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013696918939917562, + "loss": 0.0104, + "step": 215430 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001369616217061616, + "loss": 0.0123, + "step": 215440 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013695405401314758, + "loss": 0.0127, + "step": 215450 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001369464863201336, + "loss": 0.0098, + "step": 215460 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013693891862711957, + "loss": 0.0119, + "step": 215470 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013693135093410555, + "loss": 0.0069, + "step": 215480 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013692378324109156, + "loss": 0.0138, + "step": 215490 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013691621554807754, + "loss": 0.0085, + "step": 215500 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013690864785506353, + "loss": 0.0105, + "step": 215510 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001369010801620495, + "loss": 0.0083, + "step": 215520 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013689351246903552, + "loss": 0.0092, + "step": 215530 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001368859447760215, + "loss": 0.0088, + "step": 215540 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013687837708300748, + "loss": 0.0083, + "step": 215550 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001368708093899935, + "loss": 0.0084, + "step": 215560 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013686324169697947, + "loss": 0.0087, + "step": 215570 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013685567400396545, + "loss": 0.0096, + "step": 215580 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013684810631095146, + "loss": 0.0116, + "step": 215590 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013684053861793744, + "loss": 0.0082, + "step": 215600 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013683297092492342, + "loss": 0.0095, + "step": 215610 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013682540323190943, + "loss": 0.009, + "step": 215620 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001368178355388954, + "loss": 0.0098, + "step": 215630 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001368102678458814, + "loss": 0.0116, + "step": 215640 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001368027001528674, + "loss": 0.0128, + "step": 215650 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013679513245985338, + "loss": 0.0094, + "step": 215660 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013678756476683936, + "loss": 0.0093, + "step": 215670 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013677999707382537, + "loss": 0.0112, + "step": 215680 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013677242938081135, + "loss": 0.0098, + "step": 215690 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013676486168779734, + "loss": 0.0089, + "step": 215700 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013675729399478332, + "loss": 0.0084, + "step": 215710 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013674972630176933, + "loss": 0.0109, + "step": 215720 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001367421586087553, + "loss": 0.012, + "step": 215730 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001367345909157413, + "loss": 0.0104, + "step": 215740 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001367270232227273, + "loss": 0.0097, + "step": 215750 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013671945552971328, + "loss": 0.0086, + "step": 215760 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013671188783669926, + "loss": 0.0112, + "step": 215770 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013670432014368527, + "loss": 0.0066, + "step": 215780 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013669675245067125, + "loss": 0.0102, + "step": 215790 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013668918475765723, + "loss": 0.0091, + "step": 215800 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013668161706464324, + "loss": 0.0097, + "step": 215810 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013667404937162922, + "loss": 0.0108, + "step": 215820 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001366664816786152, + "loss": 0.0092, + "step": 215830 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001366589139856012, + "loss": 0.0093, + "step": 215840 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001366513462925872, + "loss": 0.0085, + "step": 215850 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013664377859957317, + "loss": 0.0086, + "step": 215860 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013663621090655916, + "loss": 0.0104, + "step": 215870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013662864321354514, + "loss": 0.0084, + "step": 215880 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013662107552053112, + "loss": 0.0091, + "step": 215890 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013661350782751713, + "loss": 0.0086, + "step": 215900 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001366059401345031, + "loss": 0.0145, + "step": 215910 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001365983724414891, + "loss": 0.0091, + "step": 215920 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001365908047484751, + "loss": 0.0084, + "step": 215930 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013658323705546108, + "loss": 0.0079, + "step": 215940 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013657566936244706, + "loss": 0.0074, + "step": 215950 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013656810166943307, + "loss": 0.009, + "step": 215960 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013656053397641905, + "loss": 0.0076, + "step": 215970 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013655296628340503, + "loss": 0.0079, + "step": 215980 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013654539859039104, + "loss": 0.0081, + "step": 215990 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013653783089737702, + "loss": 0.0104, + "step": 216000 + }, + { + "epoch": 1.09, + "eval_cer": 0.9144760782799146, + "eval_loss": 0.0073201656341552734, + "eval_runtime": 116.5986, + "eval_samples_per_second": 17.153, + "eval_steps_per_second": 4.288, + "step": 216000 + }, + { + "epoch": 1.09, + "learning_rate": 0.000136530263204363, + "loss": 0.0089, + "step": 216010 + }, + { + "epoch": 1.09, + "learning_rate": 0.000136522695511349, + "loss": 0.0088, + "step": 216020 + }, + { + "epoch": 1.09, + "learning_rate": 0.000136515127818335, + "loss": 0.0064, + "step": 216030 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013650756012532098, + "loss": 0.008, + "step": 216040 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013649999243230698, + "loss": 0.0087, + "step": 216050 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013649242473929297, + "loss": 0.0104, + "step": 216060 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013648485704627895, + "loss": 0.0128, + "step": 216070 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013647728935326493, + "loss": 0.012, + "step": 216080 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013646972166025094, + "loss": 0.0097, + "step": 216090 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013646215396723692, + "loss": 0.0101, + "step": 216100 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001364545862742229, + "loss": 0.008, + "step": 216110 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001364470185812089, + "loss": 0.0097, + "step": 216120 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001364394508881949, + "loss": 0.0081, + "step": 216130 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013643188319518087, + "loss": 0.0068, + "step": 216140 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013642431550216688, + "loss": 0.012, + "step": 216150 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013641674780915286, + "loss": 0.0083, + "step": 216160 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013640918011613884, + "loss": 0.0109, + "step": 216170 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013640161242312485, + "loss": 0.0092, + "step": 216180 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013639404473011083, + "loss": 0.0109, + "step": 216190 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013638647703709681, + "loss": 0.0068, + "step": 216200 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013637890934408282, + "loss": 0.0082, + "step": 216210 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001363713416510688, + "loss": 0.0089, + "step": 216220 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013636377395805479, + "loss": 0.0087, + "step": 216230 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013635620626504077, + "loss": 0.0083, + "step": 216240 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013634863857202678, + "loss": 0.0084, + "step": 216250 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013634107087901276, + "loss": 0.0103, + "step": 216260 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013633350318599874, + "loss": 0.0107, + "step": 216270 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013632593549298475, + "loss": 0.0097, + "step": 216280 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013631836779997073, + "loss": 0.0096, + "step": 216290 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001363108001069567, + "loss": 0.0129, + "step": 216300 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013630323241394272, + "loss": 0.0097, + "step": 216310 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001362956647209287, + "loss": 0.0076, + "step": 216320 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013628809702791468, + "loss": 0.0112, + "step": 216330 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001362805293349007, + "loss": 0.0075, + "step": 216340 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013627296164188667, + "loss": 0.0076, + "step": 216350 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013626539394887265, + "loss": 0.0081, + "step": 216360 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013625782625585866, + "loss": 0.0106, + "step": 216370 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013625025856284464, + "loss": 0.0091, + "step": 216380 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013624269086983062, + "loss": 0.0091, + "step": 216390 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001362351231768166, + "loss": 0.011, + "step": 216400 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013622755548380261, + "loss": 0.0085, + "step": 216410 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001362199877907886, + "loss": 0.0091, + "step": 216420 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013621242009777458, + "loss": 0.0099, + "step": 216430 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013620485240476059, + "loss": 0.0086, + "step": 216440 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013619728471174657, + "loss": 0.0095, + "step": 216450 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013618971701873255, + "loss": 0.0067, + "step": 216460 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013618214932571856, + "loss": 0.0089, + "step": 216470 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013617458163270454, + "loss": 0.0074, + "step": 216480 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013616701393969052, + "loss": 0.0127, + "step": 216490 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001361594462466765, + "loss": 0.0083, + "step": 216500 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013615187855366248, + "loss": 0.01, + "step": 216510 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001361443108606485, + "loss": 0.0095, + "step": 216520 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013613674316763447, + "loss": 0.0108, + "step": 216530 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013612917547462045, + "loss": 0.008, + "step": 216540 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013612160778160646, + "loss": 0.0097, + "step": 216550 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013611404008859244, + "loss": 0.0084, + "step": 216560 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013610647239557843, + "loss": 0.007, + "step": 216570 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013609890470256443, + "loss": 0.0082, + "step": 216580 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013609133700955042, + "loss": 0.0122, + "step": 216590 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360837693165364, + "loss": 0.0085, + "step": 216600 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013607620162352238, + "loss": 0.0103, + "step": 216610 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360686339305084, + "loss": 0.0084, + "step": 216620 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013606106623749437, + "loss": 0.0075, + "step": 216630 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013605349854448035, + "loss": 0.0124, + "step": 216640 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013604593085146636, + "loss": 0.0092, + "step": 216650 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013603836315845234, + "loss": 0.0107, + "step": 216660 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013603079546543832, + "loss": 0.0087, + "step": 216670 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013602322777242433, + "loss": 0.0093, + "step": 216680 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360156600794103, + "loss": 0.0093, + "step": 216690 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360080923863963, + "loss": 0.0127, + "step": 216700 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360005246933823, + "loss": 0.0101, + "step": 216710 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013599295700036828, + "loss": 0.0108, + "step": 216720 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013598538930735426, + "loss": 0.0153, + "step": 216730 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013597782161434027, + "loss": 0.0084, + "step": 216740 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013597025392132625, + "loss": 0.0112, + "step": 216750 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013596268622831224, + "loss": 0.0092, + "step": 216760 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013595511853529822, + "loss": 0.0076, + "step": 216770 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013594755084228423, + "loss": 0.0112, + "step": 216780 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001359399831492702, + "loss": 0.009, + "step": 216790 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001359324154562562, + "loss": 0.0123, + "step": 216800 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001359248477632422, + "loss": 0.0071, + "step": 216810 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013591728007022818, + "loss": 0.0074, + "step": 216820 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013590971237721416, + "loss": 0.0093, + "step": 216830 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013590214468420017, + "loss": 0.0099, + "step": 216840 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013589457699118615, + "loss": 0.0078, + "step": 216850 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013588700929817213, + "loss": 0.0086, + "step": 216860 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013587944160515814, + "loss": 0.012, + "step": 216870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013587187391214412, + "loss": 0.0089, + "step": 216880 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001358643062191301, + "loss": 0.0098, + "step": 216890 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001358567385261161, + "loss": 0.0094, + "step": 216900 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001358491708331021, + "loss": 0.0097, + "step": 216910 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013584160314008807, + "loss": 0.0092, + "step": 216920 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013583403544707406, + "loss": 0.0104, + "step": 216930 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013582646775406006, + "loss": 0.0083, + "step": 216940 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013581890006104605, + "loss": 0.011, + "step": 216950 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013581133236803203, + "loss": 0.008, + "step": 216960 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013580376467501804, + "loss": 0.01, + "step": 216970 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013579619698200402, + "loss": 0.0111, + "step": 216980 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013578862928899, + "loss": 0.0122, + "step": 216990 + }, + { + "epoch": 1.09, + "learning_rate": 0.000135781061595976, + "loss": 0.0094, + "step": 217000 + }, + { + "epoch": 1.09, + "eval_cer": 0.9144741374876638, + "eval_loss": 0.007423856761306524, + "eval_runtime": 116.6037, + "eval_samples_per_second": 17.152, + "eval_steps_per_second": 4.288, + "step": 217000 + }, + { + "epoch": 1.09, + "learning_rate": 0.000135773493902962, + "loss": 0.0097, + "step": 217010 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013576592620994797, + "loss": 0.0098, + "step": 217020 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013575835851693398, + "loss": 0.0105, + "step": 217030 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013575079082391996, + "loss": 0.0095, + "step": 217040 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013574322313090594, + "loss": 0.0086, + "step": 217050 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013573565543789195, + "loss": 0.0081, + "step": 217060 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013572808774487793, + "loss": 0.0093, + "step": 217070 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001357205200518639, + "loss": 0.0081, + "step": 217080 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013571295235884992, + "loss": 0.0072, + "step": 217090 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001357053846658359, + "loss": 0.0104, + "step": 217100 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013569781697282188, + "loss": 0.0097, + "step": 217110 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013569024927980787, + "loss": 0.0078, + "step": 217120 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013568268158679385, + "loss": 0.0118, + "step": 217130 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013567511389377983, + "loss": 0.0099, + "step": 217140 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013566754620076584, + "loss": 0.0103, + "step": 217150 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013565997850775182, + "loss": 0.0102, + "step": 217160 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001356524108147378, + "loss": 0.0114, + "step": 217170 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001356448431217238, + "loss": 0.0079, + "step": 217180 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001356372754287098, + "loss": 0.0094, + "step": 217190 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013562970773569577, + "loss": 0.0087, + "step": 217200 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013562214004268178, + "loss": 0.0098, + "step": 217210 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013561457234966776, + "loss": 0.0094, + "step": 217220 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013560700465665374, + "loss": 0.0133, + "step": 217230 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013559943696363975, + "loss": 0.0093, + "step": 217240 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013559186927062573, + "loss": 0.0103, + "step": 217250 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013558430157761171, + "loss": 0.0103, + "step": 217260 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013557673388459772, + "loss": 0.0091, + "step": 217270 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001355691661915837, + "loss": 0.0085, + "step": 217280 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013556159849856969, + "loss": 0.0069, + "step": 217290 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013555403080555567, + "loss": 0.0086, + "step": 217300 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013554646311254168, + "loss": 0.0092, + "step": 217310 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013553889541952766, + "loss": 0.0106, + "step": 217320 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013553132772651364, + "loss": 0.0092, + "step": 217330 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013552376003349965, + "loss": 0.0103, + "step": 217340 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013551619234048563, + "loss": 0.0091, + "step": 217350 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001355086246474716, + "loss": 0.0086, + "step": 217360 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013550105695445762, + "loss": 0.0098, + "step": 217370 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001354934892614436, + "loss": 0.0083, + "step": 217380 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013548592156842958, + "loss": 0.007, + "step": 217390 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001354783538754156, + "loss": 0.0106, + "step": 217400 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013547078618240157, + "loss": 0.0085, + "step": 217410 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013546321848938755, + "loss": 0.0073, + "step": 217420 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013545565079637356, + "loss": 0.0098, + "step": 217430 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013544808310335954, + "loss": 0.0106, + "step": 217440 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013544051541034552, + "loss": 0.0093, + "step": 217450 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001354329477173315, + "loss": 0.0114, + "step": 217460 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013542538002431751, + "loss": 0.0099, + "step": 217470 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001354178123313035, + "loss": 0.0094, + "step": 217480 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013541024463828948, + "loss": 0.008, + "step": 217490 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013540267694527549, + "loss": 0.0104, + "step": 217500 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013539510925226147, + "loss": 0.0103, + "step": 217510 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013538754155924745, + "loss": 0.0081, + "step": 217520 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013537997386623346, + "loss": 0.0128, + "step": 217530 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013537240617321944, + "loss": 0.0082, + "step": 217540 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013536483848020542, + "loss": 0.008, + "step": 217550 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013535727078719143, + "loss": 0.0124, + "step": 217560 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001353497030941774, + "loss": 0.0071, + "step": 217570 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001353421354011634, + "loss": 0.0103, + "step": 217580 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001353345677081494, + "loss": 0.0128, + "step": 217590 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013532700001513538, + "loss": 0.0081, + "step": 217600 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013531943232212136, + "loss": 0.0111, + "step": 217610 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013531186462910737, + "loss": 0.0084, + "step": 217620 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013530429693609335, + "loss": 0.0103, + "step": 217630 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013529672924307933, + "loss": 0.0095, + "step": 217640 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013528916155006532, + "loss": 0.0091, + "step": 217650 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013528159385705132, + "loss": 0.0094, + "step": 217660 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001352740261640373, + "loss": 0.0109, + "step": 217670 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001352664584710233, + "loss": 0.0111, + "step": 217680 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001352588907780093, + "loss": 0.01, + "step": 217690 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013525132308499528, + "loss": 0.009, + "step": 217700 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013524375539198126, + "loss": 0.0098, + "step": 217710 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013523618769896727, + "loss": 0.0101, + "step": 217720 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013522862000595325, + "loss": 0.0089, + "step": 217730 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013522105231293923, + "loss": 0.0077, + "step": 217740 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013521348461992524, + "loss": 0.0105, + "step": 217750 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001352059169269112, + "loss": 0.0074, + "step": 217760 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351983492338972, + "loss": 0.0105, + "step": 217770 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013519078154088318, + "loss": 0.0108, + "step": 217780 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013518321384786916, + "loss": 0.0096, + "step": 217790 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013517564615485517, + "loss": 0.0089, + "step": 217800 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013516807846184115, + "loss": 0.0099, + "step": 217810 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013516051076882714, + "loss": 0.0099, + "step": 217820 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013515294307581312, + "loss": 0.0188, + "step": 217830 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013514537538279913, + "loss": 0.0099, + "step": 217840 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351378076897851, + "loss": 0.0119, + "step": 217850 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351302399967711, + "loss": 0.0089, + "step": 217860 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351226723037571, + "loss": 0.0105, + "step": 217870 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013511510461074308, + "loss": 0.0073, + "step": 217880 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013510753691772906, + "loss": 0.0088, + "step": 217890 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013509996922471507, + "loss": 0.011, + "step": 217900 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013509240153170105, + "loss": 0.0088, + "step": 217910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013508483383868703, + "loss": 0.0103, + "step": 217920 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013507726614567304, + "loss": 0.008, + "step": 217930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013506969845265902, + "loss": 0.0104, + "step": 217940 + }, + { + "epoch": 1.1, + "learning_rate": 0.000135062130759645, + "loss": 0.0087, + "step": 217950 + }, + { + "epoch": 1.1, + "learning_rate": 0.000135054563066631, + "loss": 0.0111, + "step": 217960 + }, + { + "epoch": 1.1, + "learning_rate": 0.000135046995373617, + "loss": 0.0104, + "step": 217970 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013503942768060297, + "loss": 0.0133, + "step": 217980 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013503185998758898, + "loss": 0.011, + "step": 217990 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013502429229457496, + "loss": 0.0077, + "step": 218000 + }, + { + "epoch": 1.1, + "eval_cer": 0.9144867526372941, + "eval_loss": 0.006999760400503874, + "eval_runtime": 116.2125, + "eval_samples_per_second": 17.21, + "eval_steps_per_second": 4.302, + "step": 218000 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013501672460156095, + "loss": 0.0123, + "step": 218010 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013500915690854693, + "loss": 0.0082, + "step": 218020 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013500158921553294, + "loss": 0.0101, + "step": 218030 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013499402152251892, + "loss": 0.0102, + "step": 218040 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349864538295049, + "loss": 0.0086, + "step": 218050 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349788861364909, + "loss": 0.0095, + "step": 218060 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349713184434769, + "loss": 0.0087, + "step": 218070 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013496375075046287, + "loss": 0.0114, + "step": 218080 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013495618305744888, + "loss": 0.0101, + "step": 218090 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013494861536443486, + "loss": 0.0098, + "step": 218100 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013494104767142084, + "loss": 0.0096, + "step": 218110 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013493347997840685, + "loss": 0.0094, + "step": 218120 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013492591228539283, + "loss": 0.0113, + "step": 218130 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349183445923788, + "loss": 0.0129, + "step": 218140 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013491077689936482, + "loss": 0.0101, + "step": 218150 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349032092063508, + "loss": 0.0094, + "step": 218160 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013489564151333678, + "loss": 0.0102, + "step": 218170 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013488807382032277, + "loss": 0.0104, + "step": 218180 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013488050612730877, + "loss": 0.0099, + "step": 218190 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013487293843429476, + "loss": 0.0096, + "step": 218200 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013486537074128074, + "loss": 0.0102, + "step": 218210 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013485780304826675, + "loss": 0.008, + "step": 218220 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013485023535525273, + "loss": 0.0105, + "step": 218230 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348426676622387, + "loss": 0.0093, + "step": 218240 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013483509996922472, + "loss": 0.0104, + "step": 218250 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348275322762107, + "loss": 0.0102, + "step": 218260 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013481996458319668, + "loss": 0.0083, + "step": 218270 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348123968901827, + "loss": 0.0104, + "step": 218280 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013480482919716867, + "loss": 0.0097, + "step": 218290 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013479726150415465, + "loss": 0.009, + "step": 218300 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013478969381114066, + "loss": 0.0086, + "step": 218310 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013478212611812664, + "loss": 0.0106, + "step": 218320 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013477455842511262, + "loss": 0.0099, + "step": 218330 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001347669907320986, + "loss": 0.0108, + "step": 218340 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001347594230390846, + "loss": 0.0112, + "step": 218350 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001347518553460706, + "loss": 0.0106, + "step": 218360 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013474428765305658, + "loss": 0.0077, + "step": 218370 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013473671996004258, + "loss": 0.014, + "step": 218380 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013472915226702854, + "loss": 0.0105, + "step": 218390 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013472158457401455, + "loss": 0.0139, + "step": 218400 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013471401688100053, + "loss": 0.0107, + "step": 218410 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001347064491879865, + "loss": 0.0074, + "step": 218420 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013469888149497252, + "loss": 0.0088, + "step": 218430 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001346913138019585, + "loss": 0.0103, + "step": 218440 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013468374610894448, + "loss": 0.0088, + "step": 218450 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001346761784159305, + "loss": 0.009, + "step": 218460 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013466861072291647, + "loss": 0.0099, + "step": 218470 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013466104302990245, + "loss": 0.0084, + "step": 218480 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013465347533688846, + "loss": 0.0127, + "step": 218490 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013464590764387444, + "loss": 0.0092, + "step": 218500 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013463833995086042, + "loss": 0.0089, + "step": 218510 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013463077225784643, + "loss": 0.0079, + "step": 218520 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013462320456483241, + "loss": 0.0104, + "step": 218530 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001346156368718184, + "loss": 0.0113, + "step": 218540 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013460806917880438, + "loss": 0.0096, + "step": 218550 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013460050148579039, + "loss": 0.0077, + "step": 218560 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013459293379277637, + "loss": 0.0077, + "step": 218570 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013458536609976235, + "loss": 0.0096, + "step": 218580 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013457779840674836, + "loss": 0.009, + "step": 218590 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013457023071373434, + "loss": 0.0087, + "step": 218600 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013456266302072032, + "loss": 0.0112, + "step": 218610 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013455509532770633, + "loss": 0.0089, + "step": 218620 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001345475276346923, + "loss": 0.0107, + "step": 218630 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001345399599416783, + "loss": 0.0085, + "step": 218640 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001345323922486643, + "loss": 0.0083, + "step": 218650 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013452482455565028, + "loss": 0.009, + "step": 218660 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013451725686263626, + "loss": 0.0094, + "step": 218670 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013450968916962227, + "loss": 0.01, + "step": 218680 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013450212147660825, + "loss": 0.0082, + "step": 218690 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013449455378359423, + "loss": 0.0097, + "step": 218700 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013448698609058022, + "loss": 0.0128, + "step": 218710 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013447941839756622, + "loss": 0.0085, + "step": 218720 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344718507045522, + "loss": 0.009, + "step": 218730 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344642830115382, + "loss": 0.009, + "step": 218740 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344567153185242, + "loss": 0.009, + "step": 218750 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013444914762551018, + "loss": 0.0075, + "step": 218760 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013444157993249616, + "loss": 0.0114, + "step": 218770 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013443401223948217, + "loss": 0.01, + "step": 218780 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013442644454646815, + "loss": 0.01, + "step": 218790 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013441887685345413, + "loss": 0.0095, + "step": 218800 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013441130916044014, + "loss": 0.01, + "step": 218810 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013440374146742612, + "loss": 0.0119, + "step": 218820 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001343961737744121, + "loss": 0.0094, + "step": 218830 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001343886060813981, + "loss": 0.0081, + "step": 218840 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001343810383883841, + "loss": 0.0083, + "step": 218850 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013437347069537007, + "loss": 0.0105, + "step": 218860 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013436590300235605, + "loss": 0.0095, + "step": 218870 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013435833530934206, + "loss": 0.0111, + "step": 218880 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013435076761632804, + "loss": 0.0072, + "step": 218890 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013434319992331403, + "loss": 0.0123, + "step": 218900 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013433563223030003, + "loss": 0.0066, + "step": 218910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013432806453728602, + "loss": 0.0082, + "step": 218920 + }, + { + "epoch": 1.1, + "learning_rate": 0.000134320496844272, + "loss": 0.0085, + "step": 218930 + }, + { + "epoch": 1.1, + "learning_rate": 0.000134312929151258, + "loss": 0.0088, + "step": 218940 + }, + { + "epoch": 1.1, + "learning_rate": 0.000134305361458244, + "loss": 0.0115, + "step": 218950 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013429779376522997, + "loss": 0.0093, + "step": 218960 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013429022607221598, + "loss": 0.0127, + "step": 218970 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013428265837920196, + "loss": 0.0107, + "step": 218980 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013427509068618794, + "loss": 0.0085, + "step": 218990 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013426752299317395, + "loss": 0.0087, + "step": 219000 + }, + { + "epoch": 1.1, + "eval_cer": 0.9144799598644162, + "eval_loss": 0.007354082074016333, + "eval_runtime": 116.3343, + "eval_samples_per_second": 17.192, + "eval_steps_per_second": 4.298, + "step": 219000 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013425995530015993, + "loss": 0.0105, + "step": 219010 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001342523876071459, + "loss": 0.0091, + "step": 219020 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001342448199141319, + "loss": 0.0087, + "step": 219030 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013423725222111787, + "loss": 0.0103, + "step": 219040 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013422968452810388, + "loss": 0.0114, + "step": 219050 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013422211683508986, + "loss": 0.0088, + "step": 219060 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013421454914207585, + "loss": 0.0107, + "step": 219070 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013420698144906183, + "loss": 0.0094, + "step": 219080 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013419941375604784, + "loss": 0.0085, + "step": 219090 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013419184606303382, + "loss": 0.0095, + "step": 219100 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341842783700198, + "loss": 0.0109, + "step": 219110 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341767106770058, + "loss": 0.0102, + "step": 219120 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341691429839918, + "loss": 0.0099, + "step": 219130 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013416157529097777, + "loss": 0.0104, + "step": 219140 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013415400759796378, + "loss": 0.0083, + "step": 219150 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013414643990494976, + "loss": 0.0103, + "step": 219160 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013413887221193574, + "loss": 0.0093, + "step": 219170 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013413130451892175, + "loss": 0.0116, + "step": 219180 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013412373682590773, + "loss": 0.0088, + "step": 219190 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341161691328937, + "loss": 0.01, + "step": 219200 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013410860143987972, + "loss": 0.0094, + "step": 219210 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341010337468657, + "loss": 0.0103, + "step": 219220 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013409346605385168, + "loss": 0.009, + "step": 219230 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013408589836083767, + "loss": 0.0087, + "step": 219240 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013407833066782367, + "loss": 0.0076, + "step": 219250 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013407076297480966, + "loss": 0.012, + "step": 219260 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013406319528179564, + "loss": 0.0097, + "step": 219270 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013405562758878165, + "loss": 0.0075, + "step": 219280 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013404805989576763, + "loss": 0.0094, + "step": 219290 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001340404922027536, + "loss": 0.0104, + "step": 219300 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013403292450973962, + "loss": 0.0083, + "step": 219310 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001340253568167256, + "loss": 0.0069, + "step": 219320 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013401778912371158, + "loss": 0.0084, + "step": 219330 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001340102214306976, + "loss": 0.0097, + "step": 219340 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013400265373768357, + "loss": 0.0106, + "step": 219350 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013399508604466955, + "loss": 0.0071, + "step": 219360 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013398751835165556, + "loss": 0.0117, + "step": 219370 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013397995065864154, + "loss": 0.0129, + "step": 219380 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013397238296562752, + "loss": 0.0094, + "step": 219390 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339648152726135, + "loss": 0.0109, + "step": 219400 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339572475795995, + "loss": 0.0082, + "step": 219410 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339496798865855, + "loss": 0.0105, + "step": 219420 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013394211219357148, + "loss": 0.0107, + "step": 219430 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013393454450055748, + "loss": 0.0119, + "step": 219440 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013392697680754347, + "loss": 0.0087, + "step": 219450 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013391940911452945, + "loss": 0.0096, + "step": 219460 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013391184142151546, + "loss": 0.0096, + "step": 219470 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013390427372850144, + "loss": 0.009, + "step": 219480 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013389670603548742, + "loss": 0.0097, + "step": 219490 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013388913834247343, + "loss": 0.0098, + "step": 219500 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338815706494594, + "loss": 0.0128, + "step": 219510 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338740029564454, + "loss": 0.0071, + "step": 219520 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338664352634314, + "loss": 0.0075, + "step": 219530 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013385886757041738, + "loss": 0.0092, + "step": 219540 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013385129987740336, + "loss": 0.0089, + "step": 219550 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013384373218438937, + "loss": 0.007, + "step": 219560 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013383616449137535, + "loss": 0.0099, + "step": 219570 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013382859679836133, + "loss": 0.0118, + "step": 219580 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013382102910534731, + "loss": 0.0098, + "step": 219590 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013381346141233332, + "loss": 0.0089, + "step": 219600 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338058937193193, + "loss": 0.0128, + "step": 219610 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013379832602630529, + "loss": 0.0091, + "step": 219620 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001337907583332913, + "loss": 0.0083, + "step": 219630 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013378319064027728, + "loss": 0.0102, + "step": 219640 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013377562294726326, + "loss": 0.0078, + "step": 219650 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013376805525424924, + "loss": 0.0108, + "step": 219660 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013376048756123522, + "loss": 0.0106, + "step": 219670 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013375291986822123, + "loss": 0.0112, + "step": 219680 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001337453521752072, + "loss": 0.0094, + "step": 219690 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001337377844821932, + "loss": 0.012, + "step": 219700 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001337302167891792, + "loss": 0.009, + "step": 219710 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013372264909616518, + "loss": 0.0107, + "step": 219720 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013371508140315116, + "loss": 0.0093, + "step": 219730 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013370751371013717, + "loss": 0.0103, + "step": 219740 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013369994601712315, + "loss": 0.0088, + "step": 219750 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013369237832410913, + "loss": 0.0083, + "step": 219760 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013368481063109512, + "loss": 0.0103, + "step": 219770 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013367724293808112, + "loss": 0.0084, + "step": 219780 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001336696752450671, + "loss": 0.0073, + "step": 219790 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001336621075520531, + "loss": 0.0089, + "step": 219800 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001336545398590391, + "loss": 0.0086, + "step": 219810 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013364697216602508, + "loss": 0.0094, + "step": 219820 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013363940447301106, + "loss": 0.0112, + "step": 219830 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013363183677999707, + "loss": 0.0078, + "step": 219840 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013362426908698305, + "loss": 0.0078, + "step": 219850 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013361670139396903, + "loss": 0.0094, + "step": 219860 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013360913370095504, + "loss": 0.0101, + "step": 219870 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013360156600794102, + "loss": 0.0114, + "step": 219880 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133593998314927, + "loss": 0.0088, + "step": 219890 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133586430621913, + "loss": 0.0088, + "step": 219900 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133578862928899, + "loss": 0.0094, + "step": 219910 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013357129523588497, + "loss": 0.0079, + "step": 219920 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013356372754287098, + "loss": 0.0105, + "step": 219930 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013355615984985696, + "loss": 0.0113, + "step": 219940 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013354859215684294, + "loss": 0.0113, + "step": 219950 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013354102446382893, + "loss": 0.0084, + "step": 219960 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013353345677081493, + "loss": 0.0104, + "step": 219970 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013352588907780092, + "loss": 0.0082, + "step": 219980 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001335183213847869, + "loss": 0.0096, + "step": 219990 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001335107536917729, + "loss": 0.0092, + "step": 220000 + }, + { + "epoch": 1.11, + "eval_cer": 0.9144450256039017, + "eval_loss": 0.007259270641952753, + "eval_runtime": 116.3674, + "eval_samples_per_second": 17.187, + "eval_steps_per_second": 4.297, + "step": 220000 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001335031859987589, + "loss": 0.0095, + "step": 220010 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013349561830574487, + "loss": 0.0124, + "step": 220020 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013348805061273088, + "loss": 0.0093, + "step": 220030 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013348048291971686, + "loss": 0.0102, + "step": 220040 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013347291522670284, + "loss": 0.0096, + "step": 220050 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013346534753368885, + "loss": 0.0121, + "step": 220060 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013345777984067483, + "loss": 0.0112, + "step": 220070 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001334502121476608, + "loss": 0.0094, + "step": 220080 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013344264445464682, + "loss": 0.0098, + "step": 220090 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001334350767616328, + "loss": 0.0092, + "step": 220100 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013342750906861878, + "loss": 0.0078, + "step": 220110 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013341994137560476, + "loss": 0.0092, + "step": 220120 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013341237368259077, + "loss": 0.0097, + "step": 220130 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013340480598957675, + "loss": 0.0094, + "step": 220140 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013339723829656274, + "loss": 0.0084, + "step": 220150 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013338967060354874, + "loss": 0.0096, + "step": 220160 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013338210291053473, + "loss": 0.0096, + "step": 220170 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001333745352175207, + "loss": 0.0081, + "step": 220180 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013336696752450672, + "loss": 0.0096, + "step": 220190 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001333593998314927, + "loss": 0.0102, + "step": 220200 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013335183213847868, + "loss": 0.0093, + "step": 220210 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001333442644454647, + "loss": 0.0077, + "step": 220220 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013333669675245067, + "loss": 0.0108, + "step": 220230 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013332912905943665, + "loss": 0.011, + "step": 220240 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013332156136642266, + "loss": 0.009, + "step": 220250 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013331399367340864, + "loss": 0.007, + "step": 220260 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013330642598039462, + "loss": 0.013, + "step": 220270 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332988582873806, + "loss": 0.0085, + "step": 220280 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013329129059436659, + "loss": 0.0093, + "step": 220290 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013328372290135257, + "loss": 0.0092, + "step": 220300 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013327615520833858, + "loss": 0.0104, + "step": 220310 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013326858751532456, + "loss": 0.0087, + "step": 220320 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013326101982231054, + "loss": 0.0099, + "step": 220330 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013325345212929655, + "loss": 0.0113, + "step": 220340 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013324588443628253, + "loss": 0.0104, + "step": 220350 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332383167432685, + "loss": 0.0099, + "step": 220360 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013323074905025452, + "loss": 0.01, + "step": 220370 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332231813572405, + "loss": 0.008, + "step": 220380 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013321561366422648, + "loss": 0.0114, + "step": 220390 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332080459712125, + "loss": 0.0097, + "step": 220400 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013320047827819847, + "loss": 0.0095, + "step": 220410 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013319291058518445, + "loss": 0.0094, + "step": 220420 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013318534289217046, + "loss": 0.011, + "step": 220430 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013317777519915644, + "loss": 0.0086, + "step": 220440 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013317020750614242, + "loss": 0.009, + "step": 220450 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013316263981312843, + "loss": 0.0088, + "step": 220460 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013315507212011441, + "loss": 0.0078, + "step": 220470 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001331475044271004, + "loss": 0.0084, + "step": 220480 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013313993673408638, + "loss": 0.0082, + "step": 220490 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013313236904107239, + "loss": 0.0111, + "step": 220500 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013312480134805837, + "loss": 0.0086, + "step": 220510 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013311723365504435, + "loss": 0.0101, + "step": 220520 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013310966596203036, + "loss": 0.008, + "step": 220530 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013310209826901634, + "loss": 0.0089, + "step": 220540 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013309453057600232, + "loss": 0.0103, + "step": 220550 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013308696288298833, + "loss": 0.0094, + "step": 220560 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330793951899743, + "loss": 0.0106, + "step": 220570 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330718274969603, + "loss": 0.0099, + "step": 220580 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330642598039463, + "loss": 0.0099, + "step": 220590 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013305669211093228, + "loss": 0.0103, + "step": 220600 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013304912441791826, + "loss": 0.0095, + "step": 220610 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013304155672490427, + "loss": 0.0079, + "step": 220620 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013303398903189025, + "loss": 0.0076, + "step": 220630 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013302642133887623, + "loss": 0.0089, + "step": 220640 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013301885364586222, + "loss": 0.0085, + "step": 220650 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013301128595284822, + "loss": 0.0098, + "step": 220660 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330037182598342, + "loss": 0.0098, + "step": 220670 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329961505668202, + "loss": 0.0089, + "step": 220680 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329885828738062, + "loss": 0.0122, + "step": 220690 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013298101518079218, + "loss": 0.01, + "step": 220700 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013297344748777816, + "loss": 0.0098, + "step": 220710 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013296587979476417, + "loss": 0.0101, + "step": 220720 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013295831210175015, + "loss": 0.009, + "step": 220730 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013295074440873613, + "loss": 0.009, + "step": 220740 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013294317671572214, + "loss": 0.009, + "step": 220750 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013293560902270812, + "loss": 0.0099, + "step": 220760 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329280413296941, + "loss": 0.011, + "step": 220770 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329204736366801, + "loss": 0.0127, + "step": 220780 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329129059436661, + "loss": 0.0095, + "step": 220790 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013290533825065207, + "loss": 0.0071, + "step": 220800 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013289777055763805, + "loss": 0.0084, + "step": 220810 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013289020286462406, + "loss": 0.0088, + "step": 220820 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013288263517161004, + "loss": 0.0083, + "step": 220830 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013287506747859603, + "loss": 0.0131, + "step": 220840 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013286749978558203, + "loss": 0.0084, + "step": 220850 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013285993209256802, + "loss": 0.0099, + "step": 220860 + }, + { + "epoch": 1.11, + "learning_rate": 0.000132852364399554, + "loss": 0.0098, + "step": 220870 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013284479670654, + "loss": 0.0118, + "step": 220880 + }, + { + "epoch": 1.11, + "learning_rate": 0.000132837229013526, + "loss": 0.0085, + "step": 220890 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013282966132051197, + "loss": 0.0095, + "step": 220900 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013282209362749795, + "loss": 0.0106, + "step": 220910 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013281452593448393, + "loss": 0.0097, + "step": 220920 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013280695824146994, + "loss": 0.0087, + "step": 220930 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013279939054845592, + "loss": 0.008, + "step": 220940 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001327918228554419, + "loss": 0.0089, + "step": 220950 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001327842551624279, + "loss": 0.008, + "step": 220960 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001327766874694139, + "loss": 0.0092, + "step": 220970 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013276911977639987, + "loss": 0.0084, + "step": 220980 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013276155208338588, + "loss": 0.0084, + "step": 220990 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013275398439037186, + "loss": 0.0098, + "step": 221000 + }, + { + "epoch": 1.11, + "eval_cer": 0.9144712262992877, + "eval_loss": 0.007316153962165117, + "eval_runtime": 116.2409, + "eval_samples_per_second": 17.206, + "eval_steps_per_second": 4.301, + "step": 221000 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013274641669735785, + "loss": 0.0087, + "step": 221010 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013273884900434383, + "loss": 0.0087, + "step": 221020 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013273128131132984, + "loss": 0.0086, + "step": 221030 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013272371361831582, + "loss": 0.0081, + "step": 221040 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001327161459253018, + "loss": 0.0073, + "step": 221050 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001327085782322878, + "loss": 0.0095, + "step": 221060 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001327010105392738, + "loss": 0.0076, + "step": 221070 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013269344284625977, + "loss": 0.0102, + "step": 221080 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013268587515324578, + "loss": 0.007, + "step": 221090 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013267830746023176, + "loss": 0.0085, + "step": 221100 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013267073976721774, + "loss": 0.0145, + "step": 221110 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013266317207420375, + "loss": 0.0096, + "step": 221120 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013265560438118973, + "loss": 0.0093, + "step": 221130 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001326480366881757, + "loss": 0.0106, + "step": 221140 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013264046899516172, + "loss": 0.0105, + "step": 221150 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001326329013021477, + "loss": 0.0187, + "step": 221160 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013262533360913368, + "loss": 0.013, + "step": 221170 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013261776591611967, + "loss": 0.0105, + "step": 221180 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013261019822310567, + "loss": 0.0121, + "step": 221190 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013260263053009166, + "loss": 0.0089, + "step": 221200 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013259506283707764, + "loss": 0.0107, + "step": 221210 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013258749514406365, + "loss": 0.0065, + "step": 221220 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013257992745104963, + "loss": 0.0099, + "step": 221230 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325723597580356, + "loss": 0.0102, + "step": 221240 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013256479206502162, + "loss": 0.0107, + "step": 221250 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325572243720076, + "loss": 0.0095, + "step": 221260 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013254965667899358, + "loss": 0.0091, + "step": 221270 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325420889859796, + "loss": 0.0111, + "step": 221280 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013253452129296557, + "loss": 0.009, + "step": 221290 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013252695359995155, + "loss": 0.0087, + "step": 221300 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013251938590693756, + "loss": 0.0098, + "step": 221310 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013251181821392354, + "loss": 0.0087, + "step": 221320 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013250425052090952, + "loss": 0.0082, + "step": 221330 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324966828278955, + "loss": 0.0081, + "step": 221340 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324891151348815, + "loss": 0.008, + "step": 221350 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324815474418675, + "loss": 0.0102, + "step": 221360 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013247397974885348, + "loss": 0.0129, + "step": 221370 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013246641205583948, + "loss": 0.0084, + "step": 221380 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013245884436282547, + "loss": 0.0082, + "step": 221390 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013245127666981145, + "loss": 0.0102, + "step": 221400 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013244370897679746, + "loss": 0.01, + "step": 221410 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013243614128378344, + "loss": 0.0097, + "step": 221420 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013242857359076942, + "loss": 0.0104, + "step": 221430 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013242100589775543, + "loss": 0.0088, + "step": 221440 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324134382047414, + "loss": 0.0119, + "step": 221450 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324058705117274, + "loss": 0.0087, + "step": 221460 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323983028187134, + "loss": 0.0078, + "step": 221470 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013239073512569938, + "loss": 0.0089, + "step": 221480 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013238316743268536, + "loss": 0.0096, + "step": 221490 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013237559973967137, + "loss": 0.0075, + "step": 221500 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013236803204665735, + "loss": 0.0108, + "step": 221510 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013236046435364333, + "loss": 0.0104, + "step": 221520 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013235289666062931, + "loss": 0.0085, + "step": 221530 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323453289676153, + "loss": 0.0081, + "step": 221540 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013233776127460128, + "loss": 0.0098, + "step": 221550 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013233019358158729, + "loss": 0.0075, + "step": 221560 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013232262588857327, + "loss": 0.0104, + "step": 221570 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013231505819555925, + "loss": 0.0073, + "step": 221580 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013230749050254526, + "loss": 0.0135, + "step": 221590 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013229992280953124, + "loss": 0.009, + "step": 221600 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013229235511651722, + "loss": 0.0072, + "step": 221610 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013228478742350323, + "loss": 0.0124, + "step": 221620 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322772197304892, + "loss": 0.0096, + "step": 221630 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322696520374752, + "loss": 0.0099, + "step": 221640 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322620843444612, + "loss": 0.0104, + "step": 221650 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013225451665144718, + "loss": 0.0086, + "step": 221660 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013224694895843316, + "loss": 0.0111, + "step": 221670 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013223938126541917, + "loss": 0.009, + "step": 221680 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013223181357240515, + "loss": 0.0112, + "step": 221690 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013222424587939113, + "loss": 0.0302, + "step": 221700 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013221667818637712, + "loss": 0.0137, + "step": 221710 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013220911049336312, + "loss": 0.0125, + "step": 221720 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322015428003491, + "loss": 0.0086, + "step": 221730 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001321939751073351, + "loss": 0.0094, + "step": 221740 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001321864074143211, + "loss": 0.0084, + "step": 221750 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013217883972130708, + "loss": 0.0071, + "step": 221760 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013217127202829306, + "loss": 0.0095, + "step": 221770 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013216370433527907, + "loss": 0.0073, + "step": 221780 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013215613664226505, + "loss": 0.0099, + "step": 221790 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013214856894925103, + "loss": 0.011, + "step": 221800 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013214100125623704, + "loss": 0.009, + "step": 221810 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013213343356322302, + "loss": 0.0075, + "step": 221820 + }, + { + "epoch": 1.12, + "learning_rate": 0.000132125865870209, + "loss": 0.0103, + "step": 221830 + }, + { + "epoch": 1.12, + "learning_rate": 0.000132118298177195, + "loss": 0.0093, + "step": 221840 + }, + { + "epoch": 1.12, + "learning_rate": 0.000132110730484181, + "loss": 0.0083, + "step": 221850 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013210316279116697, + "loss": 0.0093, + "step": 221860 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013209559509815298, + "loss": 0.0126, + "step": 221870 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013208802740513896, + "loss": 0.0078, + "step": 221880 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013208045971212494, + "loss": 0.0089, + "step": 221890 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013207289201911093, + "loss": 0.0084, + "step": 221900 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013206532432609693, + "loss": 0.0099, + "step": 221910 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013205775663308292, + "loss": 0.0114, + "step": 221920 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001320501889400689, + "loss": 0.0092, + "step": 221930 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001320426212470549, + "loss": 0.0119, + "step": 221940 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001320350535540409, + "loss": 0.0091, + "step": 221950 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013202748586102687, + "loss": 0.0094, + "step": 221960 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013201991816801288, + "loss": 0.012, + "step": 221970 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013201235047499886, + "loss": 0.0083, + "step": 221980 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013200478278198484, + "loss": 0.0094, + "step": 221990 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013199721508897085, + "loss": 0.0103, + "step": 222000 + }, + { + "epoch": 1.12, + "eval_cer": 0.9144731670915385, + "eval_loss": 0.007101530209183693, + "eval_runtime": 116.3424, + "eval_samples_per_second": 17.191, + "eval_steps_per_second": 4.298, + "step": 222000 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013198964739595683, + "loss": 0.0095, + "step": 222010 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319820797029428, + "loss": 0.0094, + "step": 222020 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013197451200992882, + "loss": 0.0088, + "step": 222030 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319669443169148, + "loss": 0.0095, + "step": 222040 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013195937662390078, + "loss": 0.0087, + "step": 222050 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013195180893088676, + "loss": 0.0114, + "step": 222060 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013194424123787277, + "loss": 0.0078, + "step": 222070 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013193667354485875, + "loss": 0.0081, + "step": 222080 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013192910585184474, + "loss": 0.0105, + "step": 222090 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013192153815883074, + "loss": 0.0084, + "step": 222100 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013191397046581673, + "loss": 0.01, + "step": 222110 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319064027728027, + "loss": 0.0105, + "step": 222120 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013189883507978872, + "loss": 0.0105, + "step": 222130 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001318912673867747, + "loss": 0.0071, + "step": 222140 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013188369969376068, + "loss": 0.0094, + "step": 222150 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013187613200074666, + "loss": 0.0093, + "step": 222160 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013186856430773264, + "loss": 0.0089, + "step": 222170 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013186099661471865, + "loss": 0.0107, + "step": 222180 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013185342892170463, + "loss": 0.0089, + "step": 222190 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001318458612286906, + "loss": 0.0093, + "step": 222200 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013183829353567662, + "loss": 0.0074, + "step": 222210 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001318307258426626, + "loss": 0.0089, + "step": 222220 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013182315814964858, + "loss": 0.0118, + "step": 222230 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013181559045663457, + "loss": 0.0085, + "step": 222240 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013180802276362057, + "loss": 0.0081, + "step": 222250 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013180045507060656, + "loss": 0.009, + "step": 222260 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013179288737759254, + "loss": 0.0072, + "step": 222270 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013178531968457855, + "loss": 0.0102, + "step": 222280 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013177775199156453, + "loss": 0.0092, + "step": 222290 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001317701842985505, + "loss": 0.0082, + "step": 222300 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013176261660553652, + "loss": 0.0091, + "step": 222310 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001317550489125225, + "loss": 0.0101, + "step": 222320 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013174748121950848, + "loss": 0.0113, + "step": 222330 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001317399135264945, + "loss": 0.0099, + "step": 222340 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013173234583348047, + "loss": 0.0085, + "step": 222350 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013172477814046645, + "loss": 0.0106, + "step": 222360 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013171721044745246, + "loss": 0.0095, + "step": 222370 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013170964275443844, + "loss": 0.0089, + "step": 222380 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013170207506142442, + "loss": 0.0093, + "step": 222390 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013169450736841043, + "loss": 0.0096, + "step": 222400 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316869396753964, + "loss": 0.0082, + "step": 222410 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316793719823824, + "loss": 0.0072, + "step": 222420 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013167180428936838, + "loss": 0.0077, + "step": 222430 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013166423659635438, + "loss": 0.0091, + "step": 222440 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013165666890334037, + "loss": 0.0082, + "step": 222450 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013164910121032635, + "loss": 0.0086, + "step": 222460 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013164153351731236, + "loss": 0.0079, + "step": 222470 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013163396582429834, + "loss": 0.0102, + "step": 222480 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013162639813128432, + "loss": 0.0084, + "step": 222490 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013161883043827033, + "loss": 0.0121, + "step": 222500 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316112627452563, + "loss": 0.0152, + "step": 222510 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316036950522423, + "loss": 0.0075, + "step": 222520 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315961273592283, + "loss": 0.0107, + "step": 222530 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013158855966621428, + "loss": 0.0099, + "step": 222540 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013158099197320026, + "loss": 0.0087, + "step": 222550 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013157342428018627, + "loss": 0.0084, + "step": 222560 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013156585658717225, + "loss": 0.0113, + "step": 222570 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013155828889415823, + "loss": 0.0103, + "step": 222580 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013155072120114421, + "loss": 0.0104, + "step": 222590 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013154315350813022, + "loss": 0.0076, + "step": 222600 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315355858151162, + "loss": 0.0112, + "step": 222610 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013152801812210219, + "loss": 0.0108, + "step": 222620 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315204504290882, + "loss": 0.0074, + "step": 222630 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013151288273607418, + "loss": 0.0091, + "step": 222640 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013150531504306016, + "loss": 0.0092, + "step": 222650 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013149774735004617, + "loss": 0.009, + "step": 222660 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013149017965703215, + "loss": 0.009, + "step": 222670 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013148261196401813, + "loss": 0.0082, + "step": 222680 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013147504427100414, + "loss": 0.0082, + "step": 222690 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013146747657799012, + "loss": 0.0085, + "step": 222700 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001314599088849761, + "loss": 0.0082, + "step": 222710 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001314523411919621, + "loss": 0.0091, + "step": 222720 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001314447734989481, + "loss": 0.0064, + "step": 222730 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013143720580593407, + "loss": 0.01, + "step": 222740 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013142963811292005, + "loss": 0.0119, + "step": 222750 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013142207041990606, + "loss": 0.0101, + "step": 222760 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013141450272689204, + "loss": 0.0104, + "step": 222770 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013140693503387802, + "loss": 0.0101, + "step": 222780 + }, + { + "epoch": 1.12, + "learning_rate": 0.000131399367340864, + "loss": 0.0091, + "step": 222790 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013139179964785, + "loss": 0.0079, + "step": 222800 + }, + { + "epoch": 1.12, + "learning_rate": 0.000131384231954836, + "loss": 0.009, + "step": 222810 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013137666426182198, + "loss": 0.0082, + "step": 222820 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013136909656880796, + "loss": 0.0085, + "step": 222830 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013136152887579397, + "loss": 0.0119, + "step": 222840 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013135396118277995, + "loss": 0.0116, + "step": 222850 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013134639348976593, + "loss": 0.0094, + "step": 222860 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013133882579675194, + "loss": 0.0086, + "step": 222870 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013133125810373792, + "loss": 0.0081, + "step": 222880 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313236904107239, + "loss": 0.0104, + "step": 222890 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313161227177099, + "loss": 0.009, + "step": 222900 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313085550246959, + "loss": 0.0121, + "step": 222910 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013130098733168187, + "loss": 0.0112, + "step": 222920 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013129341963866788, + "loss": 0.0097, + "step": 222930 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013128585194565386, + "loss": 0.0086, + "step": 222940 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013127828425263984, + "loss": 0.0101, + "step": 222950 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013127071655962583, + "loss": 0.0072, + "step": 222960 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013126314886661183, + "loss": 0.0111, + "step": 222970 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013125558117359782, + "loss": 0.0117, + "step": 222980 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001312480134805838, + "loss": 0.0076, + "step": 222990 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001312404457875698, + "loss": 0.0088, + "step": 223000 + }, + { + "epoch": 1.13, + "eval_cer": 0.9144547295651558, + "eval_loss": 0.006930416449904442, + "eval_runtime": 115.5739, + "eval_samples_per_second": 17.305, + "eval_steps_per_second": 4.326, + "step": 223000 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001312328780945558, + "loss": 0.009, + "step": 223010 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013122531040154177, + "loss": 0.0118, + "step": 223020 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013121774270852778, + "loss": 0.0107, + "step": 223030 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013121017501551376, + "loss": 0.0117, + "step": 223040 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013120260732249974, + "loss": 0.0103, + "step": 223050 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013119503962948575, + "loss": 0.0108, + "step": 223060 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013118747193647173, + "loss": 0.0086, + "step": 223070 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001311799042434577, + "loss": 0.0081, + "step": 223080 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013117233655044372, + "loss": 0.0077, + "step": 223090 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001311647688574297, + "loss": 0.0115, + "step": 223100 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013115720116441568, + "loss": 0.0079, + "step": 223110 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013114963347140166, + "loss": 0.0118, + "step": 223120 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013114206577838767, + "loss": 0.0116, + "step": 223130 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013113449808537365, + "loss": 0.01, + "step": 223140 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013112693039235964, + "loss": 0.0072, + "step": 223150 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013111936269934564, + "loss": 0.012, + "step": 223160 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013111179500633163, + "loss": 0.0078, + "step": 223170 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001311042273133176, + "loss": 0.0077, + "step": 223180 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013109665962030362, + "loss": 0.009, + "step": 223190 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310890919272896, + "loss": 0.0083, + "step": 223200 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013108152423427558, + "loss": 0.0121, + "step": 223210 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310739565412616, + "loss": 0.0085, + "step": 223220 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013106638884824757, + "loss": 0.009, + "step": 223230 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013105882115523355, + "loss": 0.0099, + "step": 223240 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013105125346221956, + "loss": 0.0082, + "step": 223250 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013104368576920554, + "loss": 0.0086, + "step": 223260 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013103611807619152, + "loss": 0.0098, + "step": 223270 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310285503831775, + "loss": 0.0096, + "step": 223280 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310209826901635, + "loss": 0.0103, + "step": 223290 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310134149971495, + "loss": 0.011, + "step": 223300 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013100584730413547, + "loss": 0.0114, + "step": 223310 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013099827961112148, + "loss": 0.0086, + "step": 223320 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013099071191810746, + "loss": 0.0088, + "step": 223330 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013098314422509345, + "loss": 0.0116, + "step": 223340 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013097557653207945, + "loss": 0.0083, + "step": 223350 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013096800883906544, + "loss": 0.0092, + "step": 223360 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013096044114605142, + "loss": 0.012, + "step": 223370 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013095287345303743, + "loss": 0.0089, + "step": 223380 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001309453057600234, + "loss": 0.0112, + "step": 223390 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001309377380670094, + "loss": 0.0111, + "step": 223400 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001309301703739954, + "loss": 0.0077, + "step": 223410 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013092260268098135, + "loss": 0.0126, + "step": 223420 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013091503498796736, + "loss": 0.0121, + "step": 223430 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013090746729495334, + "loss": 0.0072, + "step": 223440 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013089989960193932, + "loss": 0.0083, + "step": 223450 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013089233190892533, + "loss": 0.0126, + "step": 223460 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001308847642159113, + "loss": 0.0103, + "step": 223470 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001308771965228973, + "loss": 0.0099, + "step": 223480 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013086962882988328, + "loss": 0.0099, + "step": 223490 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013086206113686928, + "loss": 0.009, + "step": 223500 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013085449344385527, + "loss": 0.0093, + "step": 223510 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013084692575084125, + "loss": 0.01, + "step": 223520 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013083935805782726, + "loss": 0.0125, + "step": 223530 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013083179036481324, + "loss": 0.0083, + "step": 223540 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013082422267179922, + "loss": 0.0111, + "step": 223550 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013081665497878523, + "loss": 0.0122, + "step": 223560 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001308090872857712, + "loss": 0.0079, + "step": 223570 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001308015195927572, + "loss": 0.0098, + "step": 223580 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001307939518997432, + "loss": 0.0146, + "step": 223590 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013078638420672918, + "loss": 0.0137, + "step": 223600 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013077881651371516, + "loss": 0.0081, + "step": 223610 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013077124882070117, + "loss": 0.0081, + "step": 223620 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013076368112768715, + "loss": 0.0092, + "step": 223630 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013075611343467313, + "loss": 0.0093, + "step": 223640 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013074854574165911, + "loss": 0.0117, + "step": 223650 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013074097804864512, + "loss": 0.0087, + "step": 223660 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001307334103556311, + "loss": 0.0096, + "step": 223670 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013072584266261709, + "loss": 0.0091, + "step": 223680 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001307182749696031, + "loss": 0.0078, + "step": 223690 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013071070727658908, + "loss": 0.0094, + "step": 223700 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013070313958357506, + "loss": 0.0096, + "step": 223710 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013069557189056107, + "loss": 0.0084, + "step": 223720 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013068800419754705, + "loss": 0.0095, + "step": 223730 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013068043650453303, + "loss": 0.0259, + "step": 223740 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013067286881151904, + "loss": 0.011, + "step": 223750 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013066530111850502, + "loss": 0.0127, + "step": 223760 + }, + { + "epoch": 1.13, + "learning_rate": 0.000130657733425491, + "loss": 0.012, + "step": 223770 + }, + { + "epoch": 1.13, + "learning_rate": 0.000130650165732477, + "loss": 0.0083, + "step": 223780 + }, + { + "epoch": 1.13, + "learning_rate": 0.000130642598039463, + "loss": 0.0106, + "step": 223790 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013063503034644897, + "loss": 0.0088, + "step": 223800 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013062746265343498, + "loss": 0.0082, + "step": 223810 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013061989496042096, + "loss": 0.012, + "step": 223820 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013061232726740694, + "loss": 0.0106, + "step": 223830 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013060475957439292, + "loss": 0.0098, + "step": 223840 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013059719188137893, + "loss": 0.0101, + "step": 223850 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013058962418836491, + "loss": 0.0092, + "step": 223860 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001305820564953509, + "loss": 0.0091, + "step": 223870 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001305744888023369, + "loss": 0.0098, + "step": 223880 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013056692110932289, + "loss": 0.0071, + "step": 223890 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013055935341630887, + "loss": 0.0095, + "step": 223900 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013055178572329488, + "loss": 0.007, + "step": 223910 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013054421803028086, + "loss": 0.0089, + "step": 223920 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013053665033726684, + "loss": 0.009, + "step": 223930 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013052908264425285, + "loss": 0.0078, + "step": 223940 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013052151495123883, + "loss": 0.0081, + "step": 223950 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001305139472582248, + "loss": 0.0079, + "step": 223960 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013050637956521082, + "loss": 0.0088, + "step": 223970 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001304988118721968, + "loss": 0.0096, + "step": 223980 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013049124417918278, + "loss": 0.0079, + "step": 223990 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013048367648616876, + "loss": 0.0089, + "step": 224000 + }, + { + "epoch": 1.13, + "eval_cer": 0.9144683151109114, + "eval_loss": 0.007022760342806578, + "eval_runtime": 115.4845, + "eval_samples_per_second": 17.318, + "eval_steps_per_second": 4.33, + "step": 224000 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013047610879315477, + "loss": 0.0131, + "step": 224010 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013046854110014075, + "loss": 0.0086, + "step": 224020 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013046097340712673, + "loss": 0.0072, + "step": 224030 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013045340571411274, + "loss": 0.0101, + "step": 224040 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001304458380210987, + "loss": 0.0081, + "step": 224050 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001304382703280847, + "loss": 0.0085, + "step": 224060 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001304307026350707, + "loss": 0.0097, + "step": 224070 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013042313494205667, + "loss": 0.0085, + "step": 224080 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013041556724904268, + "loss": 0.0082, + "step": 224090 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013040799955602866, + "loss": 0.0082, + "step": 224100 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013040043186301464, + "loss": 0.0101, + "step": 224110 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013039286417000065, + "loss": 0.0106, + "step": 224120 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013038529647698663, + "loss": 0.0105, + "step": 224130 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001303777287839726, + "loss": 0.0115, + "step": 224140 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013037016109095862, + "loss": 0.013, + "step": 224150 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001303625933979446, + "loss": 0.0121, + "step": 224160 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013035502570493058, + "loss": 0.0091, + "step": 224170 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013034745801191656, + "loss": 0.008, + "step": 224180 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013033989031890257, + "loss": 0.0067, + "step": 224190 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013033232262588855, + "loss": 0.0079, + "step": 224200 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013032475493287454, + "loss": 0.0096, + "step": 224210 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013031718723986054, + "loss": 0.0095, + "step": 224220 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013030961954684653, + "loss": 0.0086, + "step": 224230 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001303020518538325, + "loss": 0.009, + "step": 224240 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013029448416081852, + "loss": 0.0074, + "step": 224250 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001302869164678045, + "loss": 0.0104, + "step": 224260 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013027934877479048, + "loss": 0.0072, + "step": 224270 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001302717810817765, + "loss": 0.0088, + "step": 224280 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013026421338876247, + "loss": 0.0122, + "step": 224290 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013025664569574845, + "loss": 0.011, + "step": 224300 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013024907800273446, + "loss": 0.0093, + "step": 224310 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013024151030972044, + "loss": 0.0076, + "step": 224320 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013023394261670642, + "loss": 0.0088, + "step": 224330 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013022637492369243, + "loss": 0.009, + "step": 224340 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001302188072306784, + "loss": 0.0111, + "step": 224350 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001302112395376644, + "loss": 0.0088, + "step": 224360 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013020367184465037, + "loss": 0.0117, + "step": 224370 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013019610415163638, + "loss": 0.0087, + "step": 224380 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013018853645862236, + "loss": 0.0086, + "step": 224390 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013018096876560835, + "loss": 0.013, + "step": 224400 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013017340107259435, + "loss": 0.008, + "step": 224410 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013016583337958034, + "loss": 0.0078, + "step": 224420 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013015826568656632, + "loss": 0.0096, + "step": 224430 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013015069799355233, + "loss": 0.0102, + "step": 224440 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001301431303005383, + "loss": 0.0078, + "step": 224450 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001301355626075243, + "loss": 0.0093, + "step": 224460 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001301279949145103, + "loss": 0.0104, + "step": 224470 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013012042722149628, + "loss": 0.01, + "step": 224480 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013011285952848226, + "loss": 0.0085, + "step": 224490 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013010529183546827, + "loss": 0.009, + "step": 224500 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013009772414245425, + "loss": 0.0089, + "step": 224510 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013009015644944023, + "loss": 0.0078, + "step": 224520 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001300825887564262, + "loss": 0.0086, + "step": 224530 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013007502106341222, + "loss": 0.0079, + "step": 224540 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001300674533703982, + "loss": 0.0083, + "step": 224550 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013005988567738418, + "loss": 0.0106, + "step": 224560 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001300523179843702, + "loss": 0.0106, + "step": 224570 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013004475029135617, + "loss": 0.009, + "step": 224580 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013003718259834216, + "loss": 0.0079, + "step": 224590 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013002961490532816, + "loss": 0.0089, + "step": 224600 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013002204721231415, + "loss": 0.0081, + "step": 224610 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013001447951930013, + "loss": 0.0082, + "step": 224620 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013000691182628614, + "loss": 0.0067, + "step": 224630 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012999934413327212, + "loss": 0.0099, + "step": 224640 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001299917764402581, + "loss": 0.0121, + "step": 224650 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001299842087472441, + "loss": 0.0113, + "step": 224660 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012997664105423006, + "loss": 0.0089, + "step": 224670 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012996907336121607, + "loss": 0.009, + "step": 224680 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012996150566820205, + "loss": 0.0098, + "step": 224690 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012995393797518803, + "loss": 0.0091, + "step": 224700 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012994637028217404, + "loss": 0.0101, + "step": 224710 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012993880258916002, + "loss": 0.0115, + "step": 224720 + }, + { + "epoch": 1.13, + "learning_rate": 0.000129931234896146, + "loss": 0.0072, + "step": 224730 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012992366720313199, + "loss": 0.0087, + "step": 224740 + }, + { + "epoch": 1.13, + "learning_rate": 0.000129916099510118, + "loss": 0.0091, + "step": 224750 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012990853181710398, + "loss": 0.0079, + "step": 224760 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012990096412408996, + "loss": 0.0114, + "step": 224770 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012989339643107597, + "loss": 0.0084, + "step": 224780 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012988582873806195, + "loss": 0.007, + "step": 224790 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012987826104504793, + "loss": 0.008, + "step": 224800 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012987069335203394, + "loss": 0.0068, + "step": 224810 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012986312565901992, + "loss": 0.0076, + "step": 224820 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001298555579660059, + "loss": 0.009, + "step": 224830 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001298479902729919, + "loss": 0.0108, + "step": 224840 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001298404225799779, + "loss": 0.0086, + "step": 224850 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012983285488696387, + "loss": 0.0129, + "step": 224860 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012982528719394988, + "loss": 0.0081, + "step": 224870 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012981771950093586, + "loss": 0.009, + "step": 224880 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012981015180792184, + "loss": 0.0093, + "step": 224890 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012980258411490782, + "loss": 0.0103, + "step": 224900 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012979501642189383, + "loss": 0.0129, + "step": 224910 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012978744872887981, + "loss": 0.0069, + "step": 224920 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001297798810358658, + "loss": 0.0105, + "step": 224930 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001297723133428518, + "loss": 0.008, + "step": 224940 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012976474564983779, + "loss": 0.0154, + "step": 224950 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012975717795682377, + "loss": 0.0076, + "step": 224960 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012974961026380978, + "loss": 0.0084, + "step": 224970 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012974204257079576, + "loss": 0.011, + "step": 224980 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012973447487778174, + "loss": 0.0082, + "step": 224990 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012972690718476775, + "loss": 0.0074, + "step": 225000 + }, + { + "epoch": 1.14, + "eval_cer": 0.9144644335264098, + "eval_loss": 0.007108866702765226, + "eval_runtime": 116.0265, + "eval_samples_per_second": 17.237, + "eval_steps_per_second": 4.309, + "step": 225000 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012971933949175373, + "loss": 0.0077, + "step": 225010 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001297117717987397, + "loss": 0.009, + "step": 225020 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012970420410572572, + "loss": 0.0086, + "step": 225030 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001296966364127117, + "loss": 0.0085, + "step": 225040 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012968906871969768, + "loss": 0.0083, + "step": 225050 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012968150102668366, + "loss": 0.0086, + "step": 225060 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012967393333366967, + "loss": 0.0077, + "step": 225070 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012966636564065565, + "loss": 0.0087, + "step": 225080 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012965879794764163, + "loss": 0.0076, + "step": 225090 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012965123025462764, + "loss": 0.0082, + "step": 225100 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012964366256161362, + "loss": 0.0099, + "step": 225110 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001296360948685996, + "loss": 0.0135, + "step": 225120 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012962852717558561, + "loss": 0.012, + "step": 225130 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001296209594825716, + "loss": 0.0091, + "step": 225140 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012961339178955758, + "loss": 0.0111, + "step": 225150 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012960582409654359, + "loss": 0.0098, + "step": 225160 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012959825640352957, + "loss": 0.0105, + "step": 225170 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012959068871051555, + "loss": 0.0087, + "step": 225180 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012958312101750156, + "loss": 0.0121, + "step": 225190 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012957555332448754, + "loss": 0.0088, + "step": 225200 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012956798563147352, + "loss": 0.0115, + "step": 225210 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001295604179384595, + "loss": 0.0086, + "step": 225220 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001295528502454455, + "loss": 0.0118, + "step": 225230 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001295452825524315, + "loss": 0.0105, + "step": 225240 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012953771485941747, + "loss": 0.0082, + "step": 225250 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012953014716640348, + "loss": 0.008, + "step": 225260 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012952257947338946, + "loss": 0.0093, + "step": 225270 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012951501178037544, + "loss": 0.0091, + "step": 225280 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012950744408736145, + "loss": 0.0122, + "step": 225290 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294998763943474, + "loss": 0.01, + "step": 225300 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012949230870133342, + "loss": 0.0081, + "step": 225310 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294847410083194, + "loss": 0.0091, + "step": 225320 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012947717331530538, + "loss": 0.0101, + "step": 225330 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294696056222914, + "loss": 0.0096, + "step": 225340 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012946203792927737, + "loss": 0.0116, + "step": 225350 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012945447023626335, + "loss": 0.0079, + "step": 225360 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012944690254324936, + "loss": 0.0092, + "step": 225370 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012943933485023534, + "loss": 0.0092, + "step": 225380 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012943176715722132, + "loss": 0.0096, + "step": 225390 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012942419946420733, + "loss": 0.0118, + "step": 225400 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294166317711933, + "loss": 0.0089, + "step": 225410 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294090640781793, + "loss": 0.0092, + "step": 225420 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012940149638516527, + "loss": 0.009, + "step": 225430 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012939392869215128, + "loss": 0.0094, + "step": 225440 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012938636099913726, + "loss": 0.0091, + "step": 225450 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012937879330612325, + "loss": 0.0091, + "step": 225460 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012937122561310925, + "loss": 0.0101, + "step": 225470 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012936365792009524, + "loss": 0.0081, + "step": 225480 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012935609022708122, + "loss": 0.0083, + "step": 225490 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012934852253406723, + "loss": 0.0105, + "step": 225500 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001293409548410532, + "loss": 0.0084, + "step": 225510 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001293333871480392, + "loss": 0.0075, + "step": 225520 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001293258194550252, + "loss": 0.0081, + "step": 225530 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012931825176201118, + "loss": 0.0094, + "step": 225540 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012931068406899716, + "loss": 0.0112, + "step": 225550 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012930311637598317, + "loss": 0.0153, + "step": 225560 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012929554868296915, + "loss": 0.0082, + "step": 225570 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012928798098995513, + "loss": 0.0086, + "step": 225580 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001292804132969411, + "loss": 0.0088, + "step": 225590 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012927284560392712, + "loss": 0.0086, + "step": 225600 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001292652779109131, + "loss": 0.0094, + "step": 225610 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012925771021789908, + "loss": 0.0094, + "step": 225620 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001292501425248851, + "loss": 0.0077, + "step": 225630 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012924257483187107, + "loss": 0.0112, + "step": 225640 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012923500713885706, + "loss": 0.0068, + "step": 225650 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012922743944584306, + "loss": 0.0075, + "step": 225660 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012921987175282905, + "loss": 0.0083, + "step": 225670 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012921230405981503, + "loss": 0.011, + "step": 225680 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012920473636680104, + "loss": 0.0087, + "step": 225690 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012919716867378702, + "loss": 0.01, + "step": 225700 + }, + { + "epoch": 1.14, + "learning_rate": 0.000129189600980773, + "loss": 0.0077, + "step": 225710 + }, + { + "epoch": 1.14, + "learning_rate": 0.000129182033287759, + "loss": 0.0101, + "step": 225720 + }, + { + "epoch": 1.14, + "learning_rate": 0.000129174465594745, + "loss": 0.0098, + "step": 225730 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012916689790173097, + "loss": 0.0105, + "step": 225740 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012915933020871698, + "loss": 0.0081, + "step": 225750 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012915176251570296, + "loss": 0.0075, + "step": 225760 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012914419482268894, + "loss": 0.0094, + "step": 225770 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012913662712967492, + "loss": 0.0095, + "step": 225780 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012912905943666093, + "loss": 0.0097, + "step": 225790 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001291214917436469, + "loss": 0.0092, + "step": 225800 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001291139240506329, + "loss": 0.0091, + "step": 225810 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001291063563576189, + "loss": 0.0093, + "step": 225820 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012909878866460488, + "loss": 0.0086, + "step": 225830 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012909122097159087, + "loss": 0.0094, + "step": 225840 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012908365327857687, + "loss": 0.0072, + "step": 225850 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012907608558556286, + "loss": 0.0085, + "step": 225860 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012906851789254884, + "loss": 0.0095, + "step": 225870 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012906095019953485, + "loss": 0.0098, + "step": 225880 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012905338250652083, + "loss": 0.0067, + "step": 225890 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001290458148135068, + "loss": 0.0075, + "step": 225900 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012903824712049282, + "loss": 0.0074, + "step": 225910 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001290306794274788, + "loss": 0.0108, + "step": 225920 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012902311173446478, + "loss": 0.008, + "step": 225930 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012901554404145076, + "loss": 0.0089, + "step": 225940 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012900797634843674, + "loss": 0.0117, + "step": 225950 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012900040865542272, + "loss": 0.0077, + "step": 225960 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012899284096240873, + "loss": 0.0078, + "step": 225970 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012898527326939471, + "loss": 0.0114, + "step": 225980 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001289777055763807, + "loss": 0.0074, + "step": 225990 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001289701378833667, + "loss": 0.0092, + "step": 226000 + }, + { + "epoch": 1.14, + "eval_cer": 0.9144498775845288, + "eval_loss": 0.007178218103945255, + "eval_runtime": 116.0384, + "eval_samples_per_second": 17.236, + "eval_steps_per_second": 4.309, + "step": 226000 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012896257019035269, + "loss": 0.006, + "step": 226010 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012895500249733867, + "loss": 0.0088, + "step": 226020 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012894743480432468, + "loss": 0.0089, + "step": 226030 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012893986711131066, + "loss": 0.0095, + "step": 226040 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012893229941829664, + "loss": 0.0088, + "step": 226050 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012892473172528265, + "loss": 0.0087, + "step": 226060 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012891716403226863, + "loss": 0.0116, + "step": 226070 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001289095963392546, + "loss": 0.0094, + "step": 226080 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012890202864624062, + "loss": 0.0082, + "step": 226090 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001288944609532266, + "loss": 0.0103, + "step": 226100 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012888689326021258, + "loss": 0.0094, + "step": 226110 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012887932556719856, + "loss": 0.0097, + "step": 226120 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012887175787418457, + "loss": 0.0091, + "step": 226130 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012886419018117055, + "loss": 0.0082, + "step": 226140 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012885662248815654, + "loss": 0.011, + "step": 226150 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012884905479514254, + "loss": 0.0077, + "step": 226160 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012884148710212853, + "loss": 0.0134, + "step": 226170 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001288339194091145, + "loss": 0.007, + "step": 226180 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012882635171610052, + "loss": 0.0082, + "step": 226190 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001288187840230865, + "loss": 0.0114, + "step": 226200 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012881121633007248, + "loss": 0.009, + "step": 226210 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012880364863705849, + "loss": 0.0069, + "step": 226220 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012879608094404447, + "loss": 0.0091, + "step": 226230 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012878851325103045, + "loss": 0.0078, + "step": 226240 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012878094555801646, + "loss": 0.012, + "step": 226250 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012877337786500244, + "loss": 0.0071, + "step": 226260 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012876581017198842, + "loss": 0.0089, + "step": 226270 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012875824247897443, + "loss": 0.0102, + "step": 226280 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001287506747859604, + "loss": 0.0094, + "step": 226290 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001287431070929464, + "loss": 0.0088, + "step": 226300 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012873553939993237, + "loss": 0.0113, + "step": 226310 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012872797170691838, + "loss": 0.0083, + "step": 226320 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012872040401390436, + "loss": 0.0103, + "step": 226330 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012871283632089035, + "loss": 0.01, + "step": 226340 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012870526862787635, + "loss": 0.0095, + "step": 226350 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012869770093486234, + "loss": 0.0085, + "step": 226360 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012869013324184832, + "loss": 0.0115, + "step": 226370 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012868256554883433, + "loss": 0.0099, + "step": 226380 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001286749978558203, + "loss": 0.0094, + "step": 226390 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001286674301628063, + "loss": 0.0069, + "step": 226400 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001286598624697923, + "loss": 0.0081, + "step": 226410 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012865229477677828, + "loss": 0.0096, + "step": 226420 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012864472708376426, + "loss": 0.0083, + "step": 226430 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012863715939075027, + "loss": 0.0077, + "step": 226440 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012862959169773625, + "loss": 0.0088, + "step": 226450 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012862202400472223, + "loss": 0.0088, + "step": 226460 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001286144563117082, + "loss": 0.0068, + "step": 226470 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012860688861869422, + "loss": 0.0081, + "step": 226480 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285993209256802, + "loss": 0.0078, + "step": 226490 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012859175323266618, + "loss": 0.0094, + "step": 226500 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285841855396522, + "loss": 0.0092, + "step": 226510 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012857661784663817, + "loss": 0.0079, + "step": 226520 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012856905015362416, + "loss": 0.008, + "step": 226530 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012856148246061016, + "loss": 0.0087, + "step": 226540 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012855391476759615, + "loss": 0.008, + "step": 226550 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012854634707458213, + "loss": 0.009, + "step": 226560 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285387793815681, + "loss": 0.0106, + "step": 226570 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285312116885541, + "loss": 0.0087, + "step": 226580 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285236439955401, + "loss": 0.0092, + "step": 226590 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012851607630252608, + "loss": 0.0093, + "step": 226600 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012850850860951206, + "loss": 0.0084, + "step": 226610 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012850094091649807, + "loss": 0.0093, + "step": 226620 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012849337322348405, + "loss": 0.0081, + "step": 226630 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012848580553047003, + "loss": 0.0101, + "step": 226640 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012847823783745601, + "loss": 0.0121, + "step": 226650 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012847067014444202, + "loss": 0.0102, + "step": 226660 + }, + { + "epoch": 1.14, + "learning_rate": 0.000128463102451428, + "loss": 0.0096, + "step": 226670 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012845553475841399, + "loss": 0.0103, + "step": 226680 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001284479670654, + "loss": 0.0079, + "step": 226690 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012844039937238598, + "loss": 0.0078, + "step": 226700 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012843283167937196, + "loss": 0.0084, + "step": 226710 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012842526398635797, + "loss": 0.009, + "step": 226720 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012841769629334395, + "loss": 0.0095, + "step": 226730 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012841012860032993, + "loss": 0.0099, + "step": 226740 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012840256090731594, + "loss": 0.0079, + "step": 226750 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012839499321430192, + "loss": 0.0107, + "step": 226760 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001283874255212879, + "loss": 0.0114, + "step": 226770 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001283798578282739, + "loss": 0.0083, + "step": 226780 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001283722901352599, + "loss": 0.0077, + "step": 226790 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012836472244224587, + "loss": 0.0083, + "step": 226800 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012835715474923188, + "loss": 0.0076, + "step": 226810 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012834958705621786, + "loss": 0.01, + "step": 226820 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012834201936320384, + "loss": 0.0064, + "step": 226830 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012833445167018982, + "loss": 0.0086, + "step": 226840 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012832688397717583, + "loss": 0.0109, + "step": 226850 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012831931628416181, + "loss": 0.0107, + "step": 226860 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001283117485911478, + "loss": 0.0101, + "step": 226870 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001283041808981338, + "loss": 0.0068, + "step": 226880 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012829661320511979, + "loss": 0.0079, + "step": 226890 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012828904551210577, + "loss": 0.0086, + "step": 226900 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012828147781909178, + "loss": 0.0079, + "step": 226910 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012827391012607776, + "loss": 0.0089, + "step": 226920 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012826634243306374, + "loss": 0.0103, + "step": 226930 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012825877474004975, + "loss": 0.0083, + "step": 226940 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012825120704703573, + "loss": 0.0097, + "step": 226950 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001282436393540217, + "loss": 0.008, + "step": 226960 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012823607166100772, + "loss": 0.0086, + "step": 226970 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001282285039679937, + "loss": 0.0114, + "step": 226980 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012822093627497968, + "loss": 0.0095, + "step": 226990 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012821336858196566, + "loss": 0.0074, + "step": 227000 + }, + { + "epoch": 1.15, + "eval_cer": 0.9144663743186606, + "eval_loss": 0.006952292751520872, + "eval_runtime": 116.2021, + "eval_samples_per_second": 17.211, + "eval_steps_per_second": 4.303, + "step": 227000 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012820580088895167, + "loss": 0.0068, + "step": 227010 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012819823319593765, + "loss": 0.0086, + "step": 227020 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012819066550292363, + "loss": 0.0077, + "step": 227030 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012818309780990964, + "loss": 0.0083, + "step": 227040 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012817553011689562, + "loss": 0.0087, + "step": 227050 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001281679624238816, + "loss": 0.0063, + "step": 227060 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012816039473086761, + "loss": 0.0083, + "step": 227070 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001281528270378536, + "loss": 0.0101, + "step": 227080 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012814525934483958, + "loss": 0.01, + "step": 227090 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012813769165182559, + "loss": 0.0098, + "step": 227100 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012813012395881157, + "loss": 0.0088, + "step": 227110 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012812255626579755, + "loss": 0.0124, + "step": 227120 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012811498857278356, + "loss": 0.0077, + "step": 227130 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012810742087976954, + "loss": 0.0105, + "step": 227140 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012809985318675552, + "loss": 0.0085, + "step": 227150 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001280922854937415, + "loss": 0.0082, + "step": 227160 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001280847178007275, + "loss": 0.0095, + "step": 227170 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001280771501077135, + "loss": 0.0094, + "step": 227180 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012806958241469947, + "loss": 0.0075, + "step": 227190 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012806201472168545, + "loss": 0.0111, + "step": 227200 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012805444702867144, + "loss": 0.0101, + "step": 227210 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012804687933565744, + "loss": 0.01, + "step": 227220 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012803931164264343, + "loss": 0.0095, + "step": 227230 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001280317439496294, + "loss": 0.0096, + "step": 227240 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012802417625661542, + "loss": 0.0091, + "step": 227250 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001280166085636014, + "loss": 0.0092, + "step": 227260 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012800904087058738, + "loss": 0.0089, + "step": 227270 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001280014731775734, + "loss": 0.0103, + "step": 227280 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012799390548455937, + "loss": 0.0104, + "step": 227290 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012798633779154535, + "loss": 0.0072, + "step": 227300 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012797877009853136, + "loss": 0.0116, + "step": 227310 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012797120240551734, + "loss": 0.0076, + "step": 227320 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012796363471250332, + "loss": 0.0103, + "step": 227330 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012795606701948933, + "loss": 0.0084, + "step": 227340 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001279484993264753, + "loss": 0.0089, + "step": 227350 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001279409316334613, + "loss": 0.0075, + "step": 227360 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012793336394044727, + "loss": 0.0091, + "step": 227370 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012792579624743328, + "loss": 0.0087, + "step": 227380 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012791822855441926, + "loss": 0.0073, + "step": 227390 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012791066086140525, + "loss": 0.007, + "step": 227400 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012790309316839125, + "loss": 0.0067, + "step": 227410 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012789552547537724, + "loss": 0.0072, + "step": 227420 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012788795778236322, + "loss": 0.0095, + "step": 227430 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012788039008934923, + "loss": 0.0097, + "step": 227440 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001278728223963352, + "loss": 0.0094, + "step": 227450 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001278652547033212, + "loss": 0.0094, + "step": 227460 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001278576870103072, + "loss": 0.0078, + "step": 227470 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012785011931729318, + "loss": 0.0113, + "step": 227480 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012784255162427916, + "loss": 0.0086, + "step": 227490 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012783498393126517, + "loss": 0.0073, + "step": 227500 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012782741623825115, + "loss": 0.0085, + "step": 227510 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012781984854523713, + "loss": 0.0104, + "step": 227520 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001278122808522231, + "loss": 0.011, + "step": 227530 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012780471315920912, + "loss": 0.011, + "step": 227540 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001277971454661951, + "loss": 0.008, + "step": 227550 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012778957777318108, + "loss": 0.009, + "step": 227560 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001277820100801671, + "loss": 0.0086, + "step": 227570 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012777444238715307, + "loss": 0.0079, + "step": 227580 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012776687469413906, + "loss": 0.0089, + "step": 227590 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012775930700112506, + "loss": 0.0087, + "step": 227600 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012775173930811105, + "loss": 0.0076, + "step": 227610 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012774417161509703, + "loss": 0.0092, + "step": 227620 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012773660392208304, + "loss": 0.0105, + "step": 227630 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012772903622906902, + "loss": 0.0095, + "step": 227640 + }, + { + "epoch": 1.15, + "learning_rate": 0.000127721468536055, + "loss": 0.011, + "step": 227650 + }, + { + "epoch": 1.15, + "learning_rate": 0.000127713900843041, + "loss": 0.007, + "step": 227660 + }, + { + "epoch": 1.15, + "learning_rate": 0.000127706333150027, + "loss": 0.0082, + "step": 227670 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012769876545701297, + "loss": 0.0079, + "step": 227680 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012769119776399898, + "loss": 0.0091, + "step": 227690 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012768363007098496, + "loss": 0.0096, + "step": 227700 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012767606237797094, + "loss": 0.0094, + "step": 227710 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012766849468495692, + "loss": 0.0096, + "step": 227720 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012766092699194293, + "loss": 0.0127, + "step": 227730 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001276533592989289, + "loss": 0.0061, + "step": 227740 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001276457916059149, + "loss": 0.0086, + "step": 227750 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001276382239129009, + "loss": 0.0079, + "step": 227760 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012763065621988688, + "loss": 0.0089, + "step": 227770 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012762308852687287, + "loss": 0.0094, + "step": 227780 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012761552083385887, + "loss": 0.0085, + "step": 227790 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012760795314084486, + "loss": 0.0083, + "step": 227800 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012760038544783084, + "loss": 0.009, + "step": 227810 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012759281775481682, + "loss": 0.0076, + "step": 227820 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001275852500618028, + "loss": 0.0082, + "step": 227830 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001275776823687888, + "loss": 0.0093, + "step": 227840 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001275701146757748, + "loss": 0.0074, + "step": 227850 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012756254698276077, + "loss": 0.0084, + "step": 227860 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012755497928974678, + "loss": 0.0079, + "step": 227870 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012754741159673276, + "loss": 0.012, + "step": 227880 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012753984390371874, + "loss": 0.0094, + "step": 227890 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012753227621070472, + "loss": 0.011, + "step": 227900 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012752470851769073, + "loss": 0.0079, + "step": 227910 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012751714082467671, + "loss": 0.0091, + "step": 227920 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001275095731316627, + "loss": 0.0087, + "step": 227930 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001275020054386487, + "loss": 0.0082, + "step": 227940 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012749443774563469, + "loss": 0.011, + "step": 227950 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012748687005262067, + "loss": 0.009, + "step": 227960 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012747930235960668, + "loss": 0.0077, + "step": 227970 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012747173466659266, + "loss": 0.0086, + "step": 227980 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012746416697357864, + "loss": 0.0083, + "step": 227990 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012745659928056465, + "loss": 0.01, + "step": 228000 + }, + { + "epoch": 1.15, + "eval_cer": 0.9144615223380336, + "eval_loss": 0.006729237735271454, + "eval_runtime": 116.2506, + "eval_samples_per_second": 17.204, + "eval_steps_per_second": 4.301, + "step": 228000 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012744903158755063, + "loss": 0.0105, + "step": 228010 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001274414638945366, + "loss": 0.0093, + "step": 228020 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012743389620152262, + "loss": 0.0093, + "step": 228030 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001274263285085086, + "loss": 0.0105, + "step": 228040 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012741876081549458, + "loss": 0.0092, + "step": 228050 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012741119312248056, + "loss": 0.0112, + "step": 228060 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012740362542946657, + "loss": 0.0099, + "step": 228070 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012739605773645255, + "loss": 0.0103, + "step": 228080 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012738849004343853, + "loss": 0.0118, + "step": 228090 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012738092235042454, + "loss": 0.0098, + "step": 228100 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012737335465741052, + "loss": 0.0103, + "step": 228110 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001273657869643965, + "loss": 0.0094, + "step": 228120 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012735821927138251, + "loss": 0.0074, + "step": 228130 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001273506515783685, + "loss": 0.0091, + "step": 228140 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012734308388535448, + "loss": 0.0078, + "step": 228150 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012733551619234049, + "loss": 0.0086, + "step": 228160 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012732794849932647, + "loss": 0.0077, + "step": 228170 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012732038080631245, + "loss": 0.0083, + "step": 228180 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012731281311329846, + "loss": 0.0091, + "step": 228190 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012730524542028444, + "loss": 0.0107, + "step": 228200 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012729767772727042, + "loss": 0.0082, + "step": 228210 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012729011003425643, + "loss": 0.0076, + "step": 228220 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001272825423412424, + "loss": 0.0093, + "step": 228230 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001272749746482284, + "loss": 0.0085, + "step": 228240 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012726740695521437, + "loss": 0.0081, + "step": 228250 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012725983926220038, + "loss": 0.0083, + "step": 228260 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012725227156918636, + "loss": 0.0116, + "step": 228270 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012724470387617234, + "loss": 0.011, + "step": 228280 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012723713618315835, + "loss": 0.0086, + "step": 228290 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012722956849014433, + "loss": 0.0093, + "step": 228300 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012722200079713032, + "loss": 0.0098, + "step": 228310 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012721443310411632, + "loss": 0.0075, + "step": 228320 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001272068654111023, + "loss": 0.0087, + "step": 228330 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001271992977180883, + "loss": 0.009, + "step": 228340 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001271917300250743, + "loss": 0.0091, + "step": 228350 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012718416233206028, + "loss": 0.0102, + "step": 228360 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012717659463904626, + "loss": 0.0104, + "step": 228370 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012716902694603227, + "loss": 0.0101, + "step": 228380 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012716145925301825, + "loss": 0.0098, + "step": 228390 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012715389156000423, + "loss": 0.0093, + "step": 228400 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001271463238669902, + "loss": 0.0094, + "step": 228410 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012713875617397622, + "loss": 0.0075, + "step": 228420 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001271311884809622, + "loss": 0.0095, + "step": 228430 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012712362078794818, + "loss": 0.0075, + "step": 228440 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012711605309493416, + "loss": 0.0139, + "step": 228450 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012710848540192015, + "loss": 0.0092, + "step": 228460 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012710091770890615, + "loss": 0.0095, + "step": 228470 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012709335001589214, + "loss": 0.0104, + "step": 228480 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012708578232287812, + "loss": 0.0096, + "step": 228490 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012707821462986413, + "loss": 0.008, + "step": 228500 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001270706469368501, + "loss": 0.0101, + "step": 228510 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001270630792438361, + "loss": 0.0122, + "step": 228520 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001270555115508221, + "loss": 0.0087, + "step": 228530 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012704794385780808, + "loss": 0.012, + "step": 228540 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012704037616479406, + "loss": 0.0111, + "step": 228550 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012703280847178007, + "loss": 0.0089, + "step": 228560 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012702524077876605, + "loss": 0.0123, + "step": 228570 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012701767308575203, + "loss": 0.0096, + "step": 228580 + }, + { + "epoch": 1.15, + "learning_rate": 0.000127010105392738, + "loss": 0.0085, + "step": 228590 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012700253769972402, + "loss": 0.0111, + "step": 228600 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012699497000671, + "loss": 0.0111, + "step": 228610 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012698740231369598, + "loss": 0.0104, + "step": 228620 + }, + { + "epoch": 1.15, + "learning_rate": 0.000126979834620682, + "loss": 0.0139, + "step": 228630 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012697226692766797, + "loss": 0.0102, + "step": 228640 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012696469923465396, + "loss": 0.0087, + "step": 228650 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012695713154163996, + "loss": 0.0096, + "step": 228660 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012694956384862595, + "loss": 0.0107, + "step": 228670 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012694199615561193, + "loss": 0.0118, + "step": 228680 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012693442846259794, + "loss": 0.0087, + "step": 228690 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012692686076958392, + "loss": 0.0079, + "step": 228700 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001269192930765699, + "loss": 0.0089, + "step": 228710 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001269117253835559, + "loss": 0.0096, + "step": 228720 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001269041576905419, + "loss": 0.0091, + "step": 228730 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012689658999752787, + "loss": 0.0082, + "step": 228740 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012688902230451388, + "loss": 0.0101, + "step": 228750 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012688145461149986, + "loss": 0.0091, + "step": 228760 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012687388691848584, + "loss": 0.0097, + "step": 228770 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012686631922547182, + "loss": 0.0088, + "step": 228780 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012685875153245783, + "loss": 0.0108, + "step": 228790 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001268511838394438, + "loss": 0.0119, + "step": 228800 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001268436161464298, + "loss": 0.0088, + "step": 228810 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001268360484534158, + "loss": 0.0076, + "step": 228820 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012682848076040178, + "loss": 0.0075, + "step": 228830 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012682091306738777, + "loss": 0.0106, + "step": 228840 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012681334537437377, + "loss": 0.0087, + "step": 228850 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012680577768135976, + "loss": 0.0092, + "step": 228860 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012679820998834574, + "loss": 0.0083, + "step": 228870 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012679064229533175, + "loss": 0.0073, + "step": 228880 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012678307460231773, + "loss": 0.0096, + "step": 228890 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001267755069093037, + "loss": 0.009, + "step": 228900 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012676793921628972, + "loss": 0.0089, + "step": 228910 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001267603715232757, + "loss": 0.0073, + "step": 228920 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012675280383026168, + "loss": 0.0102, + "step": 228930 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012674523613724766, + "loss": 0.0092, + "step": 228940 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012673766844423367, + "loss": 0.0095, + "step": 228950 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012673010075121965, + "loss": 0.0089, + "step": 228960 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012672253305820563, + "loss": 0.0099, + "step": 228970 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012671496536519164, + "loss": 0.0077, + "step": 228980 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012670739767217762, + "loss": 0.0103, + "step": 228990 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266998299791636, + "loss": 0.0086, + "step": 229000 + }, + { + "epoch": 1.16, + "eval_cer": 0.9144634631302844, + "eval_loss": 0.006603468209505081, + "eval_runtime": 116.4012, + "eval_samples_per_second": 17.182, + "eval_steps_per_second": 4.295, + "step": 229000 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266922622861496, + "loss": 0.0089, + "step": 229010 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266846945931356, + "loss": 0.0089, + "step": 229020 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012667712690012158, + "loss": 0.0081, + "step": 229030 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012666955920710758, + "loss": 0.0099, + "step": 229040 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012666199151409357, + "loss": 0.0112, + "step": 229050 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012665442382107955, + "loss": 0.0097, + "step": 229060 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012664685612806553, + "loss": 0.0077, + "step": 229070 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266392884350515, + "loss": 0.0085, + "step": 229080 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012663172074203752, + "loss": 0.0088, + "step": 229090 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266241530490235, + "loss": 0.0101, + "step": 229100 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012661658535600948, + "loss": 0.0067, + "step": 229110 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266090176629955, + "loss": 0.008, + "step": 229120 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012660144996998147, + "loss": 0.0105, + "step": 229130 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012659388227696745, + "loss": 0.01, + "step": 229140 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012658631458395343, + "loss": 0.0112, + "step": 229150 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012657874689093944, + "loss": 0.0082, + "step": 229160 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012657117919792542, + "loss": 0.0089, + "step": 229170 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001265636115049114, + "loss": 0.0076, + "step": 229180 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012655604381189741, + "loss": 0.0096, + "step": 229190 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001265484761188834, + "loss": 0.0082, + "step": 229200 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012654090842586938, + "loss": 0.0065, + "step": 229210 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012653334073285539, + "loss": 0.008, + "step": 229220 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012652577303984137, + "loss": 0.0093, + "step": 229230 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012651820534682735, + "loss": 0.0096, + "step": 229240 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012651063765381336, + "loss": 0.0096, + "step": 229250 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012650306996079934, + "loss": 0.0091, + "step": 229260 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012649550226778532, + "loss": 0.0103, + "step": 229270 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012648793457477133, + "loss": 0.0085, + "step": 229280 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001264803668817573, + "loss": 0.0099, + "step": 229290 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001264727991887433, + "loss": 0.0084, + "step": 229300 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012646523149572927, + "loss": 0.0087, + "step": 229310 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012645766380271528, + "loss": 0.0095, + "step": 229320 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012645009610970126, + "loss": 0.0078, + "step": 229330 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012644252841668724, + "loss": 0.0091, + "step": 229340 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012643496072367325, + "loss": 0.0093, + "step": 229350 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012642739303065923, + "loss": 0.0098, + "step": 229360 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012641982533764522, + "loss": 0.0091, + "step": 229370 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012641225764463122, + "loss": 0.01, + "step": 229380 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001264046899516172, + "loss": 0.0087, + "step": 229390 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001263971222586032, + "loss": 0.0095, + "step": 229400 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001263895545655892, + "loss": 0.0086, + "step": 229410 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012638198687257518, + "loss": 0.0078, + "step": 229420 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012637441917956116, + "loss": 0.0087, + "step": 229430 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012636685148654717, + "loss": 0.0092, + "step": 229440 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012635928379353315, + "loss": 0.0091, + "step": 229450 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012635171610051913, + "loss": 0.01, + "step": 229460 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001263441484075051, + "loss": 0.0087, + "step": 229470 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012633658071449112, + "loss": 0.009, + "step": 229480 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001263290130214771, + "loss": 0.0101, + "step": 229490 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012632144532846308, + "loss": 0.0087, + "step": 229500 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001263138776354491, + "loss": 0.0084, + "step": 229510 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012630630994243507, + "loss": 0.011, + "step": 229520 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012629874224942105, + "loss": 0.0068, + "step": 229530 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012629117455640706, + "loss": 0.0084, + "step": 229540 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012628360686339304, + "loss": 0.0082, + "step": 229550 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012627603917037903, + "loss": 0.011, + "step": 229560 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012626847147736503, + "loss": 0.0095, + "step": 229570 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012626090378435102, + "loss": 0.0086, + "step": 229580 + }, + { + "epoch": 1.16, + "learning_rate": 0.000126253336091337, + "loss": 0.009, + "step": 229590 + }, + { + "epoch": 1.16, + "learning_rate": 0.000126245768398323, + "loss": 0.0087, + "step": 229600 + }, + { + "epoch": 1.16, + "learning_rate": 0.000126238200705309, + "loss": 0.0083, + "step": 229610 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012623063301229497, + "loss": 0.0085, + "step": 229620 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012622306531928098, + "loss": 0.0097, + "step": 229630 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012621549762626696, + "loss": 0.0085, + "step": 229640 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012620792993325294, + "loss": 0.0085, + "step": 229650 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012620036224023892, + "loss": 0.0098, + "step": 229660 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012619279454722493, + "loss": 0.008, + "step": 229670 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261852268542109, + "loss": 0.0111, + "step": 229680 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261776591611969, + "loss": 0.0098, + "step": 229690 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012617009146818287, + "loss": 0.0089, + "step": 229700 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012616252377516886, + "loss": 0.01, + "step": 229710 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012615495608215486, + "loss": 0.009, + "step": 229720 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012614738838914085, + "loss": 0.009, + "step": 229730 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012613982069612683, + "loss": 0.0105, + "step": 229740 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012613225300311284, + "loss": 0.0089, + "step": 229750 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012612468531009882, + "loss": 0.0082, + "step": 229760 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261171176170848, + "loss": 0.0098, + "step": 229770 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261095499240708, + "loss": 0.0083, + "step": 229780 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261019822310568, + "loss": 0.0099, + "step": 229790 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012609441453804277, + "loss": 0.0088, + "step": 229800 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012608684684502878, + "loss": 0.009, + "step": 229810 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012607927915201476, + "loss": 0.0074, + "step": 229820 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012607171145900074, + "loss": 0.0109, + "step": 229830 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012606414376598672, + "loss": 0.0135, + "step": 229840 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012605657607297273, + "loss": 0.008, + "step": 229850 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001260490083799587, + "loss": 0.0105, + "step": 229860 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001260414406869447, + "loss": 0.0221, + "step": 229870 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001260338729939307, + "loss": 0.0097, + "step": 229880 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012602630530091668, + "loss": 0.0112, + "step": 229890 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012601873760790267, + "loss": 0.0123, + "step": 229900 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012601116991488867, + "loss": 0.0098, + "step": 229910 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012600360222187466, + "loss": 0.0086, + "step": 229920 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012599603452886064, + "loss": 0.0069, + "step": 229930 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012598846683584665, + "loss": 0.0107, + "step": 229940 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012598089914283263, + "loss": 0.0074, + "step": 229950 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001259733314498186, + "loss": 0.0074, + "step": 229960 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012596576375680462, + "loss": 0.0097, + "step": 229970 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001259581960637906, + "loss": 0.0084, + "step": 229980 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012595062837077658, + "loss": 0.0106, + "step": 229990 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012594306067776256, + "loss": 0.0113, + "step": 230000 + }, + { + "epoch": 1.16, + "eval_cer": 0.9144556999612812, + "eval_loss": 0.006792085710912943, + "eval_runtime": 116.2077, + "eval_samples_per_second": 17.211, + "eval_steps_per_second": 4.303, + "step": 230000 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012593549298474857, + "loss": 0.0083, + "step": 230010 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012592792529173455, + "loss": 0.0075, + "step": 230020 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012592035759872053, + "loss": 0.0076, + "step": 230030 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012591278990570654, + "loss": 0.0087, + "step": 230040 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012590522221269252, + "loss": 0.01, + "step": 230050 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001258976545196785, + "loss": 0.0086, + "step": 230060 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001258900868266645, + "loss": 0.0101, + "step": 230070 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001258825191336505, + "loss": 0.0084, + "step": 230080 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012587495144063648, + "loss": 0.0099, + "step": 230090 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012586738374762248, + "loss": 0.0115, + "step": 230100 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012585981605460847, + "loss": 0.0099, + "step": 230110 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012585224836159445, + "loss": 0.0105, + "step": 230120 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012584468066858046, + "loss": 0.0122, + "step": 230130 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012583711297556644, + "loss": 0.0108, + "step": 230140 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012582954528255242, + "loss": 0.0096, + "step": 230150 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012582197758953843, + "loss": 0.0129, + "step": 230160 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001258144098965244, + "loss": 0.0109, + "step": 230170 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001258068422035104, + "loss": 0.0096, + "step": 230180 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012579927451049637, + "loss": 0.0087, + "step": 230190 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012579170681748238, + "loss": 0.0108, + "step": 230200 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012578413912446836, + "loss": 0.0094, + "step": 230210 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012577657143145434, + "loss": 0.0093, + "step": 230220 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012576900373844035, + "loss": 0.0077, + "step": 230230 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012576143604542633, + "loss": 0.0082, + "step": 230240 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012575386835241231, + "loss": 0.0085, + "step": 230250 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012574630065939832, + "loss": 0.0093, + "step": 230260 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001257387329663843, + "loss": 0.0091, + "step": 230270 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012573116527337029, + "loss": 0.0075, + "step": 230280 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001257235975803563, + "loss": 0.0077, + "step": 230290 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012571602988734228, + "loss": 0.011, + "step": 230300 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012570846219432826, + "loss": 0.0095, + "step": 230310 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012570089450131427, + "loss": 0.0092, + "step": 230320 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012569332680830022, + "loss": 0.0094, + "step": 230330 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012568575911528623, + "loss": 0.0081, + "step": 230340 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001256781914222722, + "loss": 0.0111, + "step": 230350 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001256706237292582, + "loss": 0.0098, + "step": 230360 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012566305603624417, + "loss": 0.0103, + "step": 230370 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012565548834323018, + "loss": 0.008, + "step": 230380 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012564792065021616, + "loss": 0.0081, + "step": 230390 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012564035295720214, + "loss": 0.0104, + "step": 230400 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012563278526418815, + "loss": 0.0068, + "step": 230410 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012562521757117413, + "loss": 0.0089, + "step": 230420 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012561764987816012, + "loss": 0.0094, + "step": 230430 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012561008218514612, + "loss": 0.0086, + "step": 230440 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001256025144921321, + "loss": 0.0087, + "step": 230450 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001255949467991181, + "loss": 0.008, + "step": 230460 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001255873791061041, + "loss": 0.0102, + "step": 230470 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012557981141309008, + "loss": 0.0112, + "step": 230480 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012557224372007606, + "loss": 0.0086, + "step": 230490 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012556467602706207, + "loss": 0.0109, + "step": 230500 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012555710833404805, + "loss": 0.0084, + "step": 230510 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012554954064103403, + "loss": 0.0119, + "step": 230520 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012554197294802, + "loss": 0.0083, + "step": 230530 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012553440525500602, + "loss": 0.0087, + "step": 230540 + }, + { + "epoch": 1.16, + "learning_rate": 0.000125526837561992, + "loss": 0.0077, + "step": 230550 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012551926986897798, + "loss": 0.0076, + "step": 230560 + }, + { + "epoch": 1.16, + "learning_rate": 0.000125511702175964, + "loss": 0.0078, + "step": 230570 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012550413448294997, + "loss": 0.0095, + "step": 230580 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012549656678993595, + "loss": 0.0087, + "step": 230590 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012548899909692196, + "loss": 0.0073, + "step": 230600 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012548143140390794, + "loss": 0.0111, + "step": 230610 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012547386371089393, + "loss": 0.0086, + "step": 230620 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012546629601787993, + "loss": 0.0093, + "step": 230630 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012545872832486592, + "loss": 0.0071, + "step": 230640 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001254511606318519, + "loss": 0.0083, + "step": 230650 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001254435929388379, + "loss": 0.008, + "step": 230660 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001254360252458239, + "loss": 0.0096, + "step": 230670 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012542845755280987, + "loss": 0.0096, + "step": 230680 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012542088985979588, + "loss": 0.0103, + "step": 230690 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012541332216678186, + "loss": 0.0094, + "step": 230700 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012540575447376784, + "loss": 0.0089, + "step": 230710 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012539818678075382, + "loss": 0.0085, + "step": 230720 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012539061908773983, + "loss": 0.0097, + "step": 230730 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001253830513947258, + "loss": 0.0086, + "step": 230740 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001253754837017118, + "loss": 0.0119, + "step": 230750 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001253679160086978, + "loss": 0.0081, + "step": 230760 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012536034831568378, + "loss": 0.009, + "step": 230770 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012535278062266976, + "loss": 0.0098, + "step": 230780 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012534521292965577, + "loss": 0.0086, + "step": 230790 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012533764523664175, + "loss": 0.01, + "step": 230800 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012533007754362774, + "loss": 0.0098, + "step": 230810 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012532250985061374, + "loss": 0.0077, + "step": 230820 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012531494215759973, + "loss": 0.0089, + "step": 230830 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001253073744645857, + "loss": 0.0085, + "step": 230840 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012529980677157172, + "loss": 0.0081, + "step": 230850 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001252922390785577, + "loss": 0.0079, + "step": 230860 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012528467138554368, + "loss": 0.0089, + "step": 230870 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012527710369252966, + "loss": 0.0089, + "step": 230880 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012526953599951567, + "loss": 0.0092, + "step": 230890 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012526196830650165, + "loss": 0.0082, + "step": 230900 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012525440061348763, + "loss": 0.0087, + "step": 230910 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012524683292047364, + "loss": 0.0097, + "step": 230920 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012523926522745962, + "loss": 0.012, + "step": 230930 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001252316975344456, + "loss": 0.0091, + "step": 230940 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001252241298414316, + "loss": 0.0108, + "step": 230950 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012521656214841757, + "loss": 0.0088, + "step": 230960 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012520899445540357, + "loss": 0.0124, + "step": 230970 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012520142676238956, + "loss": 0.0096, + "step": 230980 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012519385906937554, + "loss": 0.011, + "step": 230990 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012518629137636155, + "loss": 0.0086, + "step": 231000 + }, + { + "epoch": 1.17, + "eval_cer": 0.9144353216426477, + "eval_loss": 0.006772263906896114, + "eval_runtime": 116.0719, + "eval_samples_per_second": 17.231, + "eval_steps_per_second": 4.308, + "step": 231000 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012517872368334753, + "loss": 0.0083, + "step": 231010 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001251711559903335, + "loss": 0.008, + "step": 231020 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012516358829731952, + "loss": 0.0109, + "step": 231030 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001251560206043055, + "loss": 0.01, + "step": 231040 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012514845291129148, + "loss": 0.0098, + "step": 231050 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001251408852182775, + "loss": 0.0091, + "step": 231060 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012513331752526347, + "loss": 0.0108, + "step": 231070 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012512574983224945, + "loss": 0.009, + "step": 231080 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012511818213923543, + "loss": 0.0086, + "step": 231090 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012511061444622144, + "loss": 0.0091, + "step": 231100 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012510304675320742, + "loss": 0.0078, + "step": 231110 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250954790601934, + "loss": 0.0135, + "step": 231120 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250879113671794, + "loss": 0.0079, + "step": 231130 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250803436741654, + "loss": 0.0119, + "step": 231140 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012507277598115138, + "loss": 0.0098, + "step": 231150 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012506520828813738, + "loss": 0.0115, + "step": 231160 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012505764059512337, + "loss": 0.009, + "step": 231170 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012505007290210935, + "loss": 0.0071, + "step": 231180 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012504250520909536, + "loss": 0.0081, + "step": 231190 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012503493751608134, + "loss": 0.0099, + "step": 231200 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012502736982306732, + "loss": 0.0095, + "step": 231210 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012501980213005333, + "loss": 0.0116, + "step": 231220 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250122344370393, + "loss": 0.01, + "step": 231230 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250046667440253, + "loss": 0.0102, + "step": 231240 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012499709905101127, + "loss": 0.0093, + "step": 231250 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012498953135799728, + "loss": 0.0079, + "step": 231260 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012498196366498326, + "loss": 0.0094, + "step": 231270 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012497439597196924, + "loss": 0.0112, + "step": 231280 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012496682827895525, + "loss": 0.0115, + "step": 231290 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012495926058594123, + "loss": 0.0113, + "step": 231300 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012495169289292721, + "loss": 0.0109, + "step": 231310 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012494412519991322, + "loss": 0.013, + "step": 231320 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001249365575068992, + "loss": 0.0074, + "step": 231330 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012492898981388519, + "loss": 0.0101, + "step": 231340 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001249214221208712, + "loss": 0.0109, + "step": 231350 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012491385442785718, + "loss": 0.0095, + "step": 231360 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012490628673484316, + "loss": 0.0136, + "step": 231370 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012489871904182917, + "loss": 0.0108, + "step": 231380 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012489115134881515, + "loss": 0.0081, + "step": 231390 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012488358365580113, + "loss": 0.0073, + "step": 231400 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248760159627871, + "loss": 0.008, + "step": 231410 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012486844826977312, + "loss": 0.0077, + "step": 231420 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248608805767591, + "loss": 0.0097, + "step": 231430 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012485331288374508, + "loss": 0.0078, + "step": 231440 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248457451907311, + "loss": 0.0106, + "step": 231450 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012483817749771707, + "loss": 0.0092, + "step": 231460 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012483060980470305, + "loss": 0.008, + "step": 231470 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012482304211168906, + "loss": 0.0072, + "step": 231480 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012481547441867504, + "loss": 0.0098, + "step": 231490 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012480790672566102, + "loss": 0.0118, + "step": 231500 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012480033903264703, + "loss": 0.0113, + "step": 231510 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012479277133963301, + "loss": 0.0099, + "step": 231520 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124785203646619, + "loss": 0.0086, + "step": 231530 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124777635953605, + "loss": 0.007, + "step": 231540 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012477006826059099, + "loss": 0.0115, + "step": 231550 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012476250056757697, + "loss": 0.0116, + "step": 231560 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012475493287456298, + "loss": 0.0101, + "step": 231570 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012474736518154896, + "loss": 0.0103, + "step": 231580 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012473979748853494, + "loss": 0.0077, + "step": 231590 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012473222979552092, + "loss": 0.008, + "step": 231600 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001247246621025069, + "loss": 0.0131, + "step": 231610 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012471709440949288, + "loss": 0.0092, + "step": 231620 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001247095267164789, + "loss": 0.0094, + "step": 231630 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012470195902346487, + "loss": 0.0097, + "step": 231640 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012469439133045085, + "loss": 0.0077, + "step": 231650 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012468682363743686, + "loss": 0.0087, + "step": 231660 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012467925594442284, + "loss": 0.0095, + "step": 231670 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012467168825140883, + "loss": 0.009, + "step": 231680 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012466412055839483, + "loss": 0.0098, + "step": 231690 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012465655286538082, + "loss": 0.011, + "step": 231700 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001246489851723668, + "loss": 0.0084, + "step": 231710 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001246414174793528, + "loss": 0.0109, + "step": 231720 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001246338497863388, + "loss": 0.009, + "step": 231730 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012462628209332477, + "loss": 0.0078, + "step": 231740 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012461871440031078, + "loss": 0.0093, + "step": 231750 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012461114670729676, + "loss": 0.0083, + "step": 231760 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012460357901428274, + "loss": 0.0066, + "step": 231770 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012459601132126872, + "loss": 0.0083, + "step": 231780 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012458844362825473, + "loss": 0.0077, + "step": 231790 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001245808759352407, + "loss": 0.0098, + "step": 231800 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001245733082422267, + "loss": 0.0115, + "step": 231810 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001245657405492127, + "loss": 0.0085, + "step": 231820 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012455817285619868, + "loss": 0.0106, + "step": 231830 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012455060516318466, + "loss": 0.0094, + "step": 231840 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012454303747017067, + "loss": 0.0102, + "step": 231850 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012453546977715665, + "loss": 0.0094, + "step": 231860 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012452790208414264, + "loss": 0.0113, + "step": 231870 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012452033439112864, + "loss": 0.0081, + "step": 231880 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012451276669811463, + "loss": 0.0124, + "step": 231890 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001245051990051006, + "loss": 0.0078, + "step": 231900 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012449763131208662, + "loss": 0.0112, + "step": 231910 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001244900636190726, + "loss": 0.01, + "step": 231920 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012448249592605858, + "loss": 0.0075, + "step": 231930 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012447492823304456, + "loss": 0.0094, + "step": 231940 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012446736054003057, + "loss": 0.0077, + "step": 231950 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012445979284701655, + "loss": 0.0089, + "step": 231960 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012445222515400253, + "loss": 0.0072, + "step": 231970 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012444465746098854, + "loss": 0.0095, + "step": 231980 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012443708976797452, + "loss": 0.0108, + "step": 231990 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001244295220749605, + "loss": 0.0075, + "step": 232000 + }, + { + "epoch": 1.17, + "eval_cer": 0.9144654039225352, + "eval_loss": 0.006733159068971872, + "eval_runtime": 115.9285, + "eval_samples_per_second": 17.252, + "eval_steps_per_second": 4.313, + "step": 232000 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001244219543819465, + "loss": 0.0108, + "step": 232010 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001244143866889325, + "loss": 0.0096, + "step": 232020 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012440681899591848, + "loss": 0.0086, + "step": 232030 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012439925130290448, + "loss": 0.0088, + "step": 232040 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012439168360989047, + "loss": 0.0111, + "step": 232050 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012438411591687645, + "loss": 0.0079, + "step": 232060 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012437654822386246, + "loss": 0.0072, + "step": 232070 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012436898053084844, + "loss": 0.0086, + "step": 232080 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012436141283783442, + "loss": 0.0098, + "step": 232090 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012435384514482043, + "loss": 0.0129, + "step": 232100 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001243462774518064, + "loss": 0.0102, + "step": 232110 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001243387097587924, + "loss": 0.0102, + "step": 232120 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012433114206577837, + "loss": 0.0117, + "step": 232130 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012432357437276438, + "loss": 0.0085, + "step": 232140 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012431600667975036, + "loss": 0.008, + "step": 232150 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012430843898673634, + "loss": 0.0075, + "step": 232160 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012430087129372235, + "loss": 0.0131, + "step": 232170 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012429330360070833, + "loss": 0.0105, + "step": 232180 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012428573590769431, + "loss": 0.0098, + "step": 232190 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012427816821468032, + "loss": 0.0091, + "step": 232200 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012427060052166628, + "loss": 0.01, + "step": 232210 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012426303282865229, + "loss": 0.009, + "step": 232220 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012425546513563827, + "loss": 0.0077, + "step": 232230 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012424789744262425, + "loss": 0.0123, + "step": 232240 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012424032974961026, + "loss": 0.0099, + "step": 232250 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012423276205659624, + "loss": 0.0069, + "step": 232260 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012422519436358222, + "loss": 0.0075, + "step": 232270 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012421762667056823, + "loss": 0.01, + "step": 232280 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001242100589775542, + "loss": 0.0097, + "step": 232290 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001242024912845402, + "loss": 0.0102, + "step": 232300 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012419492359152617, + "loss": 0.0093, + "step": 232310 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012418735589851218, + "loss": 0.0102, + "step": 232320 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012417978820549816, + "loss": 0.0076, + "step": 232330 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012417222051248414, + "loss": 0.0083, + "step": 232340 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012416465281947015, + "loss": 0.0071, + "step": 232350 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012415708512645613, + "loss": 0.0106, + "step": 232360 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012414951743344212, + "loss": 0.0083, + "step": 232370 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012414194974042812, + "loss": 0.0116, + "step": 232380 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241343820474141, + "loss": 0.0091, + "step": 232390 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241268143544001, + "loss": 0.0075, + "step": 232400 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241192466613861, + "loss": 0.01, + "step": 232410 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012411167896837208, + "loss": 0.0083, + "step": 232420 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012410411127535806, + "loss": 0.0091, + "step": 232430 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012409654358234407, + "loss": 0.0104, + "step": 232440 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012408897588933005, + "loss": 0.0101, + "step": 232450 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012408140819631603, + "loss": 0.0155, + "step": 232460 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124073840503302, + "loss": 0.0083, + "step": 232470 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012406627281028802, + "loss": 0.0081, + "step": 232480 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124058705117274, + "loss": 0.0088, + "step": 232490 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012405113742425998, + "loss": 0.0083, + "step": 232500 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124043569731246, + "loss": 0.0065, + "step": 232510 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012403600203823197, + "loss": 0.0081, + "step": 232520 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012402843434521795, + "loss": 0.0096, + "step": 232530 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012402086665220396, + "loss": 0.0096, + "step": 232540 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012401329895918994, + "loss": 0.0118, + "step": 232550 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012400573126617593, + "loss": 0.007, + "step": 232560 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012399816357316193, + "loss": 0.0097, + "step": 232570 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012399059588014792, + "loss": 0.0088, + "step": 232580 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239830281871339, + "loss": 0.0119, + "step": 232590 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239754604941199, + "loss": 0.0099, + "step": 232600 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239678928011059, + "loss": 0.0138, + "step": 232610 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012396032510809187, + "loss": 0.0096, + "step": 232620 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012395275741507788, + "loss": 0.0088, + "step": 232630 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012394518972206386, + "loss": 0.0091, + "step": 232640 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012393762202904984, + "loss": 0.0081, + "step": 232650 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012393005433603582, + "loss": 0.0071, + "step": 232660 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012392248664302183, + "loss": 0.0077, + "step": 232670 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239149189500078, + "loss": 0.0078, + "step": 232680 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239073512569938, + "loss": 0.0119, + "step": 232690 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238997835639798, + "loss": 0.0099, + "step": 232700 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012389221587096578, + "loss": 0.0098, + "step": 232710 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012388464817795176, + "loss": 0.0084, + "step": 232720 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012387708048493777, + "loss": 0.0117, + "step": 232730 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012386951279192375, + "loss": 0.0083, + "step": 232740 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012386194509890974, + "loss": 0.0105, + "step": 232750 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012385437740589574, + "loss": 0.0077, + "step": 232760 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012384680971288173, + "loss": 0.0089, + "step": 232770 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238392420198677, + "loss": 0.0071, + "step": 232780 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012383167432685372, + "loss": 0.0096, + "step": 232790 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238241066338397, + "loss": 0.0089, + "step": 232800 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012381653894082568, + "loss": 0.0087, + "step": 232810 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012380897124781166, + "loss": 0.0079, + "step": 232820 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012380140355479767, + "loss": 0.0089, + "step": 232830 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012379383586178362, + "loss": 0.0102, + "step": 232840 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012378626816876963, + "loss": 0.0088, + "step": 232850 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001237787004757556, + "loss": 0.0096, + "step": 232860 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001237711327827416, + "loss": 0.0117, + "step": 232870 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001237635650897276, + "loss": 0.009, + "step": 232880 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012375599739671358, + "loss": 0.01, + "step": 232890 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012374842970369957, + "loss": 0.0089, + "step": 232900 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012374086201068557, + "loss": 0.0085, + "step": 232910 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012373329431767156, + "loss": 0.0087, + "step": 232920 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012372572662465754, + "loss": 0.0088, + "step": 232930 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012371815893164355, + "loss": 0.0067, + "step": 232940 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012371059123862953, + "loss": 0.0092, + "step": 232950 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001237030235456155, + "loss": 0.0101, + "step": 232960 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012369545585260152, + "loss": 0.0097, + "step": 232970 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236878881595875, + "loss": 0.008, + "step": 232980 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012368032046657348, + "loss": 0.0083, + "step": 232990 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236727527735595, + "loss": 0.0077, + "step": 233000 + }, + { + "epoch": 1.18, + "eval_cer": 0.914438232831024, + "eval_loss": 0.006864336784929037, + "eval_runtime": 115.9429, + "eval_samples_per_second": 17.25, + "eval_steps_per_second": 4.312, + "step": 233000 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012366518508054547, + "loss": 0.0094, + "step": 233010 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012365761738753145, + "loss": 0.0101, + "step": 233020 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012365004969451743, + "loss": 0.0131, + "step": 233030 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012364248200150344, + "loss": 0.0068, + "step": 233040 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012363491430848942, + "loss": 0.0107, + "step": 233050 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236273466154754, + "loss": 0.0104, + "step": 233060 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236197789224614, + "loss": 0.0077, + "step": 233070 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236122112294474, + "loss": 0.0091, + "step": 233080 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012360464353643338, + "loss": 0.0111, + "step": 233090 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012359707584341938, + "loss": 0.0103, + "step": 233100 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012358950815040537, + "loss": 0.0088, + "step": 233110 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012358194045739135, + "loss": 0.0085, + "step": 233120 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012357437276437736, + "loss": 0.0122, + "step": 233130 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012356680507136334, + "loss": 0.0069, + "step": 233140 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012355923737834932, + "loss": 0.0143, + "step": 233150 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012355166968533533, + "loss": 0.0093, + "step": 233160 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001235441019923213, + "loss": 0.0086, + "step": 233170 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001235365342993073, + "loss": 0.0092, + "step": 233180 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012352896660629327, + "loss": 0.0102, + "step": 233190 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012352139891327928, + "loss": 0.0094, + "step": 233200 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012351383122026526, + "loss": 0.0069, + "step": 233210 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012350626352725124, + "loss": 0.0081, + "step": 233220 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012349869583423725, + "loss": 0.0083, + "step": 233230 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012349112814122323, + "loss": 0.0092, + "step": 233240 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012348356044820921, + "loss": 0.0086, + "step": 233250 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012347599275519522, + "loss": 0.0086, + "step": 233260 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001234684250621812, + "loss": 0.0103, + "step": 233270 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012346085736916719, + "loss": 0.0078, + "step": 233280 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001234532896761532, + "loss": 0.0102, + "step": 233290 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012344572198313918, + "loss": 0.0083, + "step": 233300 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012343815429012516, + "loss": 0.0099, + "step": 233310 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012343058659711117, + "loss": 0.0102, + "step": 233320 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012342301890409715, + "loss": 0.0102, + "step": 233330 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012341545121108313, + "loss": 0.0088, + "step": 233340 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001234078835180691, + "loss": 0.0065, + "step": 233350 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012340031582505512, + "loss": 0.0068, + "step": 233360 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233927481320411, + "loss": 0.0084, + "step": 233370 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012338518043902708, + "loss": 0.0079, + "step": 233380 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233776127460131, + "loss": 0.0106, + "step": 233390 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012337004505299907, + "loss": 0.0103, + "step": 233400 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012336247735998505, + "loss": 0.0073, + "step": 233410 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012335490966697106, + "loss": 0.0097, + "step": 233420 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012334734197395704, + "loss": 0.0101, + "step": 233430 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012333977428094302, + "loss": 0.0087, + "step": 233440 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012333220658792903, + "loss": 0.01, + "step": 233450 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012332463889491501, + "loss": 0.0091, + "step": 233460 + }, + { + "epoch": 1.18, + "learning_rate": 0.000123317071201901, + "loss": 0.0092, + "step": 233470 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012330950350888698, + "loss": 0.0069, + "step": 233480 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012330193581587296, + "loss": 0.0102, + "step": 233490 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012329436812285897, + "loss": 0.0082, + "step": 233500 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012328680042984495, + "loss": 0.0092, + "step": 233510 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012327923273683093, + "loss": 0.0103, + "step": 233520 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012327166504381694, + "loss": 0.0081, + "step": 233530 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012326409735080292, + "loss": 0.0075, + "step": 233540 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001232565296577889, + "loss": 0.0106, + "step": 233550 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012324896196477488, + "loss": 0.0075, + "step": 233560 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001232413942717609, + "loss": 0.0087, + "step": 233570 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012323382657874687, + "loss": 0.0078, + "step": 233580 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012322625888573285, + "loss": 0.0083, + "step": 233590 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012321869119271886, + "loss": 0.0081, + "step": 233600 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012321112349970484, + "loss": 0.0126, + "step": 233610 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012320355580669083, + "loss": 0.008, + "step": 233620 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012319598811367683, + "loss": 0.0086, + "step": 233630 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012318842042066282, + "loss": 0.0078, + "step": 233640 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231808527276488, + "loss": 0.0081, + "step": 233650 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231732850346348, + "loss": 0.0112, + "step": 233660 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231657173416208, + "loss": 0.0114, + "step": 233670 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012315814964860677, + "loss": 0.011, + "step": 233680 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012315058195559278, + "loss": 0.0083, + "step": 233690 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012314301426257876, + "loss": 0.0157, + "step": 233700 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012313544656956474, + "loss": 0.011, + "step": 233710 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012312787887655072, + "loss": 0.0084, + "step": 233720 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012312031118353673, + "loss": 0.0101, + "step": 233730 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231127434905227, + "loss": 0.0101, + "step": 233740 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231051757975087, + "loss": 0.0087, + "step": 233750 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230976081044947, + "loss": 0.0082, + "step": 233760 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012309004041148068, + "loss": 0.0092, + "step": 233770 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012308247271846666, + "loss": 0.0129, + "step": 233780 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012307490502545267, + "loss": 0.0113, + "step": 233790 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012306733733243865, + "loss": 0.0075, + "step": 233800 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012305976963942464, + "loss": 0.0084, + "step": 233810 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012305220194641064, + "loss": 0.0087, + "step": 233820 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012304463425339663, + "loss": 0.0063, + "step": 233830 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230370665603826, + "loss": 0.0061, + "step": 233840 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012302949886736862, + "loss": 0.0081, + "step": 233850 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230219311743546, + "loss": 0.0119, + "step": 233860 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012301436348134058, + "loss": 0.009, + "step": 233870 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012300679578832656, + "loss": 0.0106, + "step": 233880 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012299922809531257, + "loss": 0.0084, + "step": 233890 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012299166040229855, + "loss": 0.0093, + "step": 233900 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012298409270928453, + "loss": 0.0103, + "step": 233910 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012297652501627054, + "loss": 0.0079, + "step": 233920 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012296895732325652, + "loss": 0.0086, + "step": 233930 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229613896302425, + "loss": 0.0098, + "step": 233940 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229538219372285, + "loss": 0.0079, + "step": 233950 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229462542442145, + "loss": 0.0089, + "step": 233960 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012293868655120047, + "loss": 0.0115, + "step": 233970 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012293111885818648, + "loss": 0.0069, + "step": 233980 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012292355116517246, + "loss": 0.0086, + "step": 233990 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012291598347215845, + "loss": 0.0082, + "step": 234000 + }, + { + "epoch": 1.18, + "eval_cer": 0.9144275584736445, + "eval_loss": 0.0069518680684268475, + "eval_runtime": 115.6903, + "eval_samples_per_second": 17.288, + "eval_steps_per_second": 4.322, + "step": 234000 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012290841577914445, + "loss": 0.008, + "step": 234010 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012290084808613044, + "loss": 0.0114, + "step": 234020 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012289328039311642, + "loss": 0.0118, + "step": 234030 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012288571270010243, + "loss": 0.0087, + "step": 234040 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228781450070884, + "loss": 0.0121, + "step": 234050 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228705773140744, + "loss": 0.0133, + "step": 234060 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012286300962106037, + "loss": 0.0101, + "step": 234070 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012285544192804638, + "loss": 0.0087, + "step": 234080 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012284787423503236, + "loss": 0.0087, + "step": 234090 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012284030654201834, + "loss": 0.009, + "step": 234100 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012283273884900432, + "loss": 0.0122, + "step": 234110 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228251711559903, + "loss": 0.0091, + "step": 234120 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228176034629763, + "loss": 0.0075, + "step": 234130 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228100357699623, + "loss": 0.0132, + "step": 234140 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012280246807694828, + "loss": 0.0093, + "step": 234150 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012279490038393428, + "loss": 0.0114, + "step": 234160 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012278733269092027, + "loss": 0.0084, + "step": 234170 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012277976499790625, + "loss": 0.0076, + "step": 234180 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012277219730489226, + "loss": 0.008, + "step": 234190 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012276462961187824, + "loss": 0.0101, + "step": 234200 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012275706191886422, + "loss": 0.0094, + "step": 234210 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012274949422585023, + "loss": 0.0091, + "step": 234220 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001227419265328362, + "loss": 0.0084, + "step": 234230 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001227343588398222, + "loss": 0.009, + "step": 234240 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012272679114680817, + "loss": 0.0096, + "step": 234250 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012271922345379418, + "loss": 0.0084, + "step": 234260 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012271165576078016, + "loss": 0.0093, + "step": 234270 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012270408806776614, + "loss": 0.009, + "step": 234280 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012269652037475215, + "loss": 0.0104, + "step": 234290 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012268895268173813, + "loss": 0.012, + "step": 234300 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012268138498872411, + "loss": 0.008, + "step": 234310 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012267381729571012, + "loss": 0.0097, + "step": 234320 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001226662496026961, + "loss": 0.0094, + "step": 234330 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012265868190968209, + "loss": 0.0074, + "step": 234340 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001226511142166681, + "loss": 0.0083, + "step": 234350 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012264354652365408, + "loss": 0.0084, + "step": 234360 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012263597883064006, + "loss": 0.0073, + "step": 234370 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012262841113762607, + "loss": 0.0081, + "step": 234380 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012262084344461205, + "loss": 0.0145, + "step": 234390 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012261327575159803, + "loss": 0.008, + "step": 234400 + }, + { + "epoch": 1.18, + "learning_rate": 0.000122605708058584, + "loss": 0.0093, + "step": 234410 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012259814036557002, + "loss": 0.0098, + "step": 234420 + }, + { + "epoch": 1.18, + "learning_rate": 0.000122590572672556, + "loss": 0.0073, + "step": 234430 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012258300497954198, + "loss": 0.0078, + "step": 234440 + }, + { + "epoch": 1.18, + "learning_rate": 0.000122575437286528, + "loss": 0.0088, + "step": 234450 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012256786959351397, + "loss": 0.0077, + "step": 234460 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012256030190049995, + "loss": 0.0106, + "step": 234470 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012255273420748596, + "loss": 0.0096, + "step": 234480 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012254516651447194, + "loss": 0.0084, + "step": 234490 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012253759882145792, + "loss": 0.0068, + "step": 234500 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012253003112844393, + "loss": 0.0092, + "step": 234510 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012252246343542991, + "loss": 0.0098, + "step": 234520 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001225148957424159, + "loss": 0.009, + "step": 234530 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001225073280494019, + "loss": 0.0088, + "step": 234540 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012249976035638789, + "loss": 0.0087, + "step": 234550 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012249219266337387, + "loss": 0.0109, + "step": 234560 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012248462497035988, + "loss": 0.0095, + "step": 234570 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012247705727734586, + "loss": 0.0097, + "step": 234580 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012246948958433184, + "loss": 0.0087, + "step": 234590 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012246192189131782, + "loss": 0.0073, + "step": 234600 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012245435419830383, + "loss": 0.0079, + "step": 234610 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001224467865052898, + "loss": 0.0123, + "step": 234620 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001224392188122758, + "loss": 0.008, + "step": 234630 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001224316511192618, + "loss": 0.0096, + "step": 234640 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012242408342624778, + "loss": 0.0111, + "step": 234650 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012241651573323376, + "loss": 0.0072, + "step": 234660 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012240894804021977, + "loss": 0.0067, + "step": 234670 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012240138034720575, + "loss": 0.0083, + "step": 234680 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012239381265419173, + "loss": 0.0082, + "step": 234690 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012238624496117774, + "loss": 0.0092, + "step": 234700 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012237867726816372, + "loss": 0.0081, + "step": 234710 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223711095751497, + "loss": 0.0094, + "step": 234720 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223635418821357, + "loss": 0.0126, + "step": 234730 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012235597418912167, + "loss": 0.0092, + "step": 234740 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012234840649610768, + "loss": 0.0095, + "step": 234750 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012234083880309366, + "loss": 0.009, + "step": 234760 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012233327111007964, + "loss": 0.0077, + "step": 234770 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012232570341706562, + "loss": 0.0098, + "step": 234780 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012231813572405163, + "loss": 0.0104, + "step": 234790 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223105680310376, + "loss": 0.0077, + "step": 234800 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223030003380236, + "loss": 0.0093, + "step": 234810 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001222954326450096, + "loss": 0.009, + "step": 234820 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012228786495199558, + "loss": 0.0072, + "step": 234830 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012228029725898156, + "loss": 0.0075, + "step": 234840 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012227272956596757, + "loss": 0.0096, + "step": 234850 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012226516187295355, + "loss": 0.0091, + "step": 234860 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012225759417993954, + "loss": 0.0098, + "step": 234870 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012225002648692554, + "loss": 0.0073, + "step": 234880 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012224245879391153, + "loss": 0.009, + "step": 234890 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001222348911008975, + "loss": 0.01, + "step": 234900 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012222732340788352, + "loss": 0.0075, + "step": 234910 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001222197557148695, + "loss": 0.0084, + "step": 234920 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012221218802185548, + "loss": 0.0083, + "step": 234930 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001222046203288415, + "loss": 0.0104, + "step": 234940 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012219705263582747, + "loss": 0.011, + "step": 234950 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012218948494281345, + "loss": 0.0108, + "step": 234960 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012218191724979943, + "loss": 0.0099, + "step": 234970 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012217434955678544, + "loss": 0.0071, + "step": 234980 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012216678186377142, + "loss": 0.0084, + "step": 234990 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221592141707574, + "loss": 0.0086, + "step": 235000 + }, + { + "epoch": 1.19, + "eval_cer": 0.9144362920387732, + "eval_loss": 0.0068534985184669495, + "eval_runtime": 115.6303, + "eval_samples_per_second": 17.297, + "eval_steps_per_second": 4.324, + "step": 235000 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221516464777434, + "loss": 0.008, + "step": 235010 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221440787847294, + "loss": 0.0096, + "step": 235020 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012213651109171537, + "loss": 0.0084, + "step": 235030 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012212894339870138, + "loss": 0.0104, + "step": 235040 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012212137570568736, + "loss": 0.011, + "step": 235050 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012211380801267335, + "loss": 0.0076, + "step": 235060 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012210624031965935, + "loss": 0.0067, + "step": 235070 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012209867262664534, + "loss": 0.0076, + "step": 235080 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012209110493363132, + "loss": 0.0078, + "step": 235090 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012208353724061733, + "loss": 0.0137, + "step": 235100 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001220759695476033, + "loss": 0.01, + "step": 235110 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012206840185458929, + "loss": 0.0119, + "step": 235120 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012206083416157528, + "loss": 0.0062, + "step": 235130 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012205326646856128, + "loss": 0.007, + "step": 235140 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012204569877554726, + "loss": 0.0088, + "step": 235150 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012203813108253326, + "loss": 0.0084, + "step": 235160 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012203056338951924, + "loss": 0.0076, + "step": 235170 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012202299569650523, + "loss": 0.0117, + "step": 235180 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012201542800349123, + "loss": 0.0087, + "step": 235190 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012200786031047721, + "loss": 0.009, + "step": 235200 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001220002926174632, + "loss": 0.0074, + "step": 235210 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001219927249244492, + "loss": 0.0066, + "step": 235220 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012198515723143518, + "loss": 0.0079, + "step": 235230 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012197758953842117, + "loss": 0.0104, + "step": 235240 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012197002184540716, + "loss": 0.0083, + "step": 235250 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012196245415239315, + "loss": 0.0091, + "step": 235260 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012195488645937915, + "loss": 0.0093, + "step": 235270 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012194731876636513, + "loss": 0.0099, + "step": 235280 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012193975107335112, + "loss": 0.0095, + "step": 235290 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012193218338033712, + "loss": 0.0069, + "step": 235300 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001219246156873231, + "loss": 0.0073, + "step": 235310 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001219170479943091, + "loss": 0.0073, + "step": 235320 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012190948030129508, + "loss": 0.0078, + "step": 235330 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012190191260828107, + "loss": 0.0085, + "step": 235340 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012189434491526707, + "loss": 0.0103, + "step": 235350 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012188677722225303, + "loss": 0.008, + "step": 235360 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012187920952923903, + "loss": 0.0074, + "step": 235370 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012187164183622501, + "loss": 0.0074, + "step": 235380 + }, + { + "epoch": 1.19, + "learning_rate": 0.000121864074143211, + "loss": 0.0115, + "step": 235390 + }, + { + "epoch": 1.19, + "learning_rate": 0.000121856506450197, + "loss": 0.01, + "step": 235400 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012184893875718298, + "loss": 0.008, + "step": 235410 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012184137106416898, + "loss": 0.0076, + "step": 235420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012183380337115497, + "loss": 0.0083, + "step": 235430 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012182623567814095, + "loss": 0.0069, + "step": 235440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012181866798512695, + "loss": 0.0111, + "step": 235450 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012181110029211293, + "loss": 0.0087, + "step": 235460 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012180353259909892, + "loss": 0.0099, + "step": 235470 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012179596490608492, + "loss": 0.0103, + "step": 235480 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001217883972130709, + "loss": 0.0076, + "step": 235490 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001217808295200569, + "loss": 0.011, + "step": 235500 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012177326182704289, + "loss": 0.0087, + "step": 235510 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012176569413402887, + "loss": 0.01, + "step": 235520 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012175812644101487, + "loss": 0.0119, + "step": 235530 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012175055874800085, + "loss": 0.0106, + "step": 235540 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012174299105498684, + "loss": 0.0085, + "step": 235550 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012173542336197284, + "loss": 0.0083, + "step": 235560 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012172785566895882, + "loss": 0.0087, + "step": 235570 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012172028797594481, + "loss": 0.0065, + "step": 235580 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012171272028293081, + "loss": 0.0102, + "step": 235590 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012170515258991679, + "loss": 0.0092, + "step": 235600 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012169758489690279, + "loss": 0.0089, + "step": 235610 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012169001720388877, + "loss": 0.0097, + "step": 235620 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012168244951087476, + "loss": 0.0092, + "step": 235630 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012167488181786076, + "loss": 0.0095, + "step": 235640 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012166731412484674, + "loss": 0.0089, + "step": 235650 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012165974643183273, + "loss": 0.0076, + "step": 235660 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012165217873881873, + "loss": 0.0089, + "step": 235670 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012164461104580471, + "loss": 0.0101, + "step": 235680 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001216370433527907, + "loss": 0.0102, + "step": 235690 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012162947565977669, + "loss": 0.0073, + "step": 235700 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012162190796676268, + "loss": 0.0111, + "step": 235710 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012161434027374868, + "loss": 0.0104, + "step": 235720 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012160677258073466, + "loss": 0.0076, + "step": 235730 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012159920488772065, + "loss": 0.0099, + "step": 235740 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012159163719470665, + "loss": 0.0097, + "step": 235750 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012158406950169263, + "loss": 0.0108, + "step": 235760 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012157650180867862, + "loss": 0.0102, + "step": 235770 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001215689341156646, + "loss": 0.0076, + "step": 235780 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001215613664226506, + "loss": 0.0079, + "step": 235790 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001215537987296366, + "loss": 0.0084, + "step": 235800 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012154623103662258, + "loss": 0.0086, + "step": 235810 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012153866334360857, + "loss": 0.0099, + "step": 235820 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012153109565059457, + "loss": 0.0096, + "step": 235830 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012152352795758055, + "loss": 0.0077, + "step": 235840 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012151596026456654, + "loss": 0.0094, + "step": 235850 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012150839257155253, + "loss": 0.0099, + "step": 235860 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012150082487853852, + "loss": 0.0109, + "step": 235870 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012149325718552452, + "loss": 0.0102, + "step": 235880 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001214856894925105, + "loss": 0.0093, + "step": 235890 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012147812179949649, + "loss": 0.0101, + "step": 235900 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012147055410648249, + "loss": 0.0096, + "step": 235910 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012146298641346847, + "loss": 0.0116, + "step": 235920 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012145541872045446, + "loss": 0.008, + "step": 235930 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012144785102744046, + "loss": 0.0091, + "step": 235940 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012144028333442644, + "loss": 0.0081, + "step": 235950 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012143271564141243, + "loss": 0.0084, + "step": 235960 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012142514794839842, + "loss": 0.0083, + "step": 235970 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012141758025538441, + "loss": 0.0092, + "step": 235980 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012141001256237038, + "loss": 0.0095, + "step": 235990 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012140244486935637, + "loss": 0.0086, + "step": 236000 + }, + { + "epoch": 1.19, + "eval_cer": 0.9144469663961525, + "eval_loss": 0.0067824204452335835, + "eval_runtime": 116.0471, + "eval_samples_per_second": 17.234, + "eval_steps_per_second": 4.309, + "step": 236000 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012139487717634237, + "loss": 0.0095, + "step": 236010 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012138730948332835, + "loss": 0.0084, + "step": 236020 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012137974179031435, + "loss": 0.0092, + "step": 236030 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012137217409730034, + "loss": 0.0083, + "step": 236040 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012136460640428632, + "loss": 0.0062, + "step": 236050 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012135703871127232, + "loss": 0.0106, + "step": 236060 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001213494710182583, + "loss": 0.0077, + "step": 236070 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012134190332524429, + "loss": 0.008, + "step": 236080 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012133433563223029, + "loss": 0.0079, + "step": 236090 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012132676793921627, + "loss": 0.0077, + "step": 236100 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012131920024620226, + "loss": 0.008, + "step": 236110 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012131163255318826, + "loss": 0.0112, + "step": 236120 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012130406486017424, + "loss": 0.0098, + "step": 236130 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012129649716716024, + "loss": 0.0091, + "step": 236140 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012128892947414622, + "loss": 0.0088, + "step": 236150 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012128136178113221, + "loss": 0.0092, + "step": 236160 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012127379408811821, + "loss": 0.0089, + "step": 236170 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012126622639510419, + "loss": 0.009, + "step": 236180 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012125865870209018, + "loss": 0.0077, + "step": 236190 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012125109100907618, + "loss": 0.0105, + "step": 236200 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012124352331606216, + "loss": 0.0112, + "step": 236210 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012123595562304816, + "loss": 0.0075, + "step": 236220 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012122838793003414, + "loss": 0.0082, + "step": 236230 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012122082023702013, + "loss": 0.0091, + "step": 236240 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012121325254400613, + "loss": 0.009, + "step": 236250 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012120568485099211, + "loss": 0.0099, + "step": 236260 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001211981171579781, + "loss": 0.0083, + "step": 236270 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001211905494649641, + "loss": 0.0066, + "step": 236280 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012118298177195008, + "loss": 0.0072, + "step": 236290 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012117541407893607, + "loss": 0.0096, + "step": 236300 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012116784638592206, + "loss": 0.0085, + "step": 236310 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012116027869290805, + "loss": 0.0092, + "step": 236320 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012115271099989405, + "loss": 0.0091, + "step": 236330 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012114514330688003, + "loss": 0.0081, + "step": 236340 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012113757561386602, + "loss": 0.0088, + "step": 236350 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012113000792085202, + "loss": 0.0112, + "step": 236360 + }, + { + "epoch": 1.19, + "learning_rate": 0.000121122440227838, + "loss": 0.0093, + "step": 236370 + }, + { + "epoch": 1.19, + "learning_rate": 0.000121114872534824, + "loss": 0.0099, + "step": 236380 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012110730484180999, + "loss": 0.008, + "step": 236390 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012109973714879597, + "loss": 0.0097, + "step": 236400 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012109216945578197, + "loss": 0.01, + "step": 236410 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012108460176276795, + "loss": 0.0091, + "step": 236420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012107703406975394, + "loss": 0.0103, + "step": 236430 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012106946637673994, + "loss": 0.0086, + "step": 236440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012106189868372592, + "loss": 0.01, + "step": 236450 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012105433099071191, + "loss": 0.0099, + "step": 236460 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012104676329769791, + "loss": 0.0085, + "step": 236470 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012103919560468389, + "loss": 0.0087, + "step": 236480 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012103162791166988, + "loss": 0.0097, + "step": 236490 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012102406021865587, + "loss": 0.0094, + "step": 236500 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012101649252564186, + "loss": 0.0103, + "step": 236510 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012100892483262786, + "loss": 0.0099, + "step": 236520 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012100135713961384, + "loss": 0.0103, + "step": 236530 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012099378944659983, + "loss": 0.0081, + "step": 236540 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012098622175358583, + "loss": 0.0068, + "step": 236550 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012097865406057181, + "loss": 0.0097, + "step": 236560 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001209710863675578, + "loss": 0.0074, + "step": 236570 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012096351867454379, + "loss": 0.0062, + "step": 236580 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012095595098152978, + "loss": 0.0097, + "step": 236590 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012094838328851578, + "loss": 0.0089, + "step": 236600 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012094081559550174, + "loss": 0.0083, + "step": 236610 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012093324790248774, + "loss": 0.0087, + "step": 236620 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012092568020947372, + "loss": 0.0095, + "step": 236630 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012091811251645971, + "loss": 0.0083, + "step": 236640 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012091054482344571, + "loss": 0.0109, + "step": 236650 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012090297713043169, + "loss": 0.008, + "step": 236660 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012089540943741769, + "loss": 0.0095, + "step": 236670 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012088784174440367, + "loss": 0.0082, + "step": 236680 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012088027405138966, + "loss": 0.0108, + "step": 236690 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012087270635837566, + "loss": 0.0072, + "step": 236700 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012086513866536164, + "loss": 0.0085, + "step": 236710 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012085757097234763, + "loss": 0.0084, + "step": 236720 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012085000327933363, + "loss": 0.0116, + "step": 236730 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012084243558631961, + "loss": 0.0098, + "step": 236740 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001208348678933056, + "loss": 0.0089, + "step": 236750 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012082730020029159, + "loss": 0.0076, + "step": 236760 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012081973250727758, + "loss": 0.009, + "step": 236770 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012081216481426358, + "loss": 0.0076, + "step": 236780 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012080459712124956, + "loss": 0.0076, + "step": 236790 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012079702942823555, + "loss": 0.0078, + "step": 236800 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012078946173522155, + "loss": 0.0102, + "step": 236810 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012078189404220753, + "loss": 0.0106, + "step": 236820 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012077432634919352, + "loss": 0.0089, + "step": 236830 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012076675865617952, + "loss": 0.0093, + "step": 236840 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001207591909631655, + "loss": 0.0079, + "step": 236850 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001207516232701515, + "loss": 0.0105, + "step": 236860 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012074405557713748, + "loss": 0.0109, + "step": 236870 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012073648788412347, + "loss": 0.0144, + "step": 236880 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012072892019110947, + "loss": 0.0087, + "step": 236890 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012072135249809545, + "loss": 0.0086, + "step": 236900 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012071378480508144, + "loss": 0.0076, + "step": 236910 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012070621711206744, + "loss": 0.0099, + "step": 236920 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012069864941905342, + "loss": 0.0101, + "step": 236930 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012069108172603942, + "loss": 0.008, + "step": 236940 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001206835140330254, + "loss": 0.0107, + "step": 236950 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012067594634001139, + "loss": 0.009, + "step": 236960 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012066837864699739, + "loss": 0.0087, + "step": 236970 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012066081095398337, + "loss": 0.009, + "step": 236980 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012065324326096936, + "loss": 0.008, + "step": 236990 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012064567556795536, + "loss": 0.0089, + "step": 237000 + }, + { + "epoch": 1.2, + "eval_cer": 0.9144498775845288, + "eval_loss": 0.006527193821966648, + "eval_runtime": 116.0102, + "eval_samples_per_second": 17.24, + "eval_steps_per_second": 4.31, + "step": 237000 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012063810787494134, + "loss": 0.0077, + "step": 237010 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012063054018192733, + "loss": 0.0088, + "step": 237020 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012062297248891332, + "loss": 0.0082, + "step": 237030 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012061540479589931, + "loss": 0.0078, + "step": 237040 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001206078371028853, + "loss": 0.0085, + "step": 237050 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012060026940987129, + "loss": 0.0078, + "step": 237060 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012059270171685728, + "loss": 0.0082, + "step": 237070 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012058513402384328, + "loss": 0.009, + "step": 237080 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012057756633082926, + "loss": 0.0074, + "step": 237090 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012056999863781525, + "loss": 0.0083, + "step": 237100 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012056243094480124, + "loss": 0.0088, + "step": 237110 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012055486325178723, + "loss": 0.0087, + "step": 237120 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012054729555877323, + "loss": 0.0056, + "step": 237130 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012053972786575921, + "loss": 0.0098, + "step": 237140 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001205321601727452, + "loss": 0.0074, + "step": 237150 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001205245924797312, + "loss": 0.01, + "step": 237160 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012051702478671718, + "loss": 0.0059, + "step": 237170 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012050945709370317, + "loss": 0.0088, + "step": 237180 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012050188940068915, + "loss": 0.0105, + "step": 237190 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012049432170767515, + "loss": 0.0096, + "step": 237200 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012048675401466114, + "loss": 0.0077, + "step": 237210 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012047918632164713, + "loss": 0.0107, + "step": 237220 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012047161862863312, + "loss": 0.0078, + "step": 237230 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012046405093561909, + "loss": 0.0099, + "step": 237240 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012045648324260508, + "loss": 0.0119, + "step": 237250 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012044891554959108, + "loss": 0.0108, + "step": 237260 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012044134785657706, + "loss": 0.0089, + "step": 237270 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012043378016356306, + "loss": 0.0096, + "step": 237280 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012042621247054905, + "loss": 0.0081, + "step": 237290 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012041864477753503, + "loss": 0.0121, + "step": 237300 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012041107708452103, + "loss": 0.0133, + "step": 237310 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012040350939150701, + "loss": 0.0095, + "step": 237320 + }, + { + "epoch": 1.2, + "learning_rate": 0.000120395941698493, + "loss": 0.0087, + "step": 237330 + }, + { + "epoch": 1.2, + "learning_rate": 0.000120388374005479, + "loss": 0.0082, + "step": 237340 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012038080631246498, + "loss": 0.0112, + "step": 237350 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012037323861945097, + "loss": 0.0075, + "step": 237360 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012036567092643697, + "loss": 0.0113, + "step": 237370 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012035810323342295, + "loss": 0.0089, + "step": 237380 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012035053554040895, + "loss": 0.0094, + "step": 237390 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012034296784739493, + "loss": 0.0082, + "step": 237400 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012033540015438092, + "loss": 0.0079, + "step": 237410 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012032783246136692, + "loss": 0.0073, + "step": 237420 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001203202647683529, + "loss": 0.0091, + "step": 237430 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001203126970753389, + "loss": 0.0102, + "step": 237440 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012030512938232489, + "loss": 0.0109, + "step": 237450 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012029756168931087, + "loss": 0.0104, + "step": 237460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012028999399629687, + "loss": 0.0095, + "step": 237470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012028242630328285, + "loss": 0.0079, + "step": 237480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012027485861026884, + "loss": 0.0082, + "step": 237490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012026729091725484, + "loss": 0.0116, + "step": 237500 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012025972322424082, + "loss": 0.008, + "step": 237510 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012025215553122681, + "loss": 0.0079, + "step": 237520 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012024458783821281, + "loss": 0.0075, + "step": 237530 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012023702014519879, + "loss": 0.0077, + "step": 237540 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012022945245218478, + "loss": 0.0101, + "step": 237550 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012022188475917077, + "loss": 0.0086, + "step": 237560 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012021431706615676, + "loss": 0.0096, + "step": 237570 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012020674937314276, + "loss": 0.0081, + "step": 237580 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012019918168012874, + "loss": 0.008, + "step": 237590 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012019161398711473, + "loss": 0.0087, + "step": 237600 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012018404629410073, + "loss": 0.0089, + "step": 237610 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012017647860108671, + "loss": 0.0107, + "step": 237620 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001201689109080727, + "loss": 0.0099, + "step": 237630 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012016134321505869, + "loss": 0.0073, + "step": 237640 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012015377552204468, + "loss": 0.0076, + "step": 237650 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012014620782903068, + "loss": 0.0096, + "step": 237660 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012013864013601666, + "loss": 0.0088, + "step": 237670 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012013107244300265, + "loss": 0.0068, + "step": 237680 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012012350474998865, + "loss": 0.0092, + "step": 237690 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012011593705697463, + "loss": 0.0114, + "step": 237700 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012010836936396062, + "loss": 0.0086, + "step": 237710 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001201008016709466, + "loss": 0.0068, + "step": 237720 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200932339779326, + "loss": 0.0136, + "step": 237730 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200856662849186, + "loss": 0.0099, + "step": 237740 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012007809859190458, + "loss": 0.0104, + "step": 237750 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012007053089889057, + "loss": 0.0075, + "step": 237760 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012006296320587657, + "loss": 0.0079, + "step": 237770 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012005539551286255, + "loss": 0.01, + "step": 237780 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012004782781984854, + "loss": 0.0095, + "step": 237790 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012004026012683452, + "loss": 0.0083, + "step": 237800 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012003269243382052, + "loss": 0.0081, + "step": 237810 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012002512474080651, + "loss": 0.009, + "step": 237820 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200175570477925, + "loss": 0.0106, + "step": 237830 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012000998935477849, + "loss": 0.0073, + "step": 237840 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012000242166176449, + "loss": 0.0096, + "step": 237850 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011999485396875047, + "loss": 0.0091, + "step": 237860 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011998728627573645, + "loss": 0.0076, + "step": 237870 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011997971858272243, + "loss": 0.0106, + "step": 237880 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011997215088970843, + "loss": 0.0086, + "step": 237890 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011996458319669442, + "loss": 0.0106, + "step": 237900 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001199570155036804, + "loss": 0.0089, + "step": 237910 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001199494478106664, + "loss": 0.0094, + "step": 237920 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011994188011765238, + "loss": 0.0085, + "step": 237930 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011993431242463837, + "loss": 0.0084, + "step": 237940 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011992674473162437, + "loss": 0.0087, + "step": 237950 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011991917703861035, + "loss": 0.0086, + "step": 237960 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011991160934559634, + "loss": 0.0083, + "step": 237970 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011990404165258234, + "loss": 0.0088, + "step": 237980 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011989647395956832, + "loss": 0.0099, + "step": 237990 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011988890626655432, + "loss": 0.0077, + "step": 238000 + }, + { + "epoch": 1.2, + "eval_cer": 0.9144586111496574, + "eval_loss": 0.006760002113878727, + "eval_runtime": 116.0385, + "eval_samples_per_second": 17.236, + "eval_steps_per_second": 4.309, + "step": 238000 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001198813385735403, + "loss": 0.0085, + "step": 238010 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011987377088052629, + "loss": 0.0084, + "step": 238020 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011986620318751229, + "loss": 0.0085, + "step": 238030 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011985863549449827, + "loss": 0.0106, + "step": 238040 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011985106780148426, + "loss": 0.0088, + "step": 238050 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011984350010847026, + "loss": 0.0071, + "step": 238060 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011983593241545624, + "loss": 0.0094, + "step": 238070 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011982836472244224, + "loss": 0.0105, + "step": 238080 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011982079702942822, + "loss": 0.0102, + "step": 238090 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011981322933641421, + "loss": 0.0075, + "step": 238100 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001198056616434002, + "loss": 0.0087, + "step": 238110 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011979809395038619, + "loss": 0.009, + "step": 238120 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011979052625737218, + "loss": 0.0088, + "step": 238130 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011978295856435818, + "loss": 0.0101, + "step": 238140 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011977539087134416, + "loss": 0.0115, + "step": 238150 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011976782317833015, + "loss": 0.0093, + "step": 238160 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011976025548531614, + "loss": 0.0112, + "step": 238170 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011975268779230213, + "loss": 0.0084, + "step": 238180 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011974512009928813, + "loss": 0.0089, + "step": 238190 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011973755240627411, + "loss": 0.0079, + "step": 238200 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001197299847132601, + "loss": 0.0084, + "step": 238210 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001197224170202461, + "loss": 0.0092, + "step": 238220 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011971484932723208, + "loss": 0.0074, + "step": 238230 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011970728163421807, + "loss": 0.0086, + "step": 238240 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011969971394120406, + "loss": 0.0086, + "step": 238250 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011969214624819005, + "loss": 0.0078, + "step": 238260 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011968457855517605, + "loss": 0.0092, + "step": 238270 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011967701086216203, + "loss": 0.0085, + "step": 238280 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011966944316914802, + "loss": 0.0106, + "step": 238290 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011966187547613402, + "loss": 0.0075, + "step": 238300 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011965430778312, + "loss": 0.0098, + "step": 238310 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011964674009010599, + "loss": 0.0083, + "step": 238320 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011963917239709199, + "loss": 0.0078, + "step": 238330 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011963160470407797, + "loss": 0.0074, + "step": 238340 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011962403701106396, + "loss": 0.0089, + "step": 238350 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011961646931804995, + "loss": 0.0101, + "step": 238360 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011960890162503594, + "loss": 0.0079, + "step": 238370 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011960133393202194, + "loss": 0.0082, + "step": 238380 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011959376623900792, + "loss": 0.0094, + "step": 238390 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011958619854599391, + "loss": 0.009, + "step": 238400 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011957863085297991, + "loss": 0.01, + "step": 238410 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011957106315996589, + "loss": 0.0107, + "step": 238420 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011956349546695188, + "loss": 0.0081, + "step": 238430 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011955592777393787, + "loss": 0.0084, + "step": 238440 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011954836008092386, + "loss": 0.0084, + "step": 238450 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011954079238790986, + "loss": 0.0076, + "step": 238460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011953322469489584, + "loss": 0.0066, + "step": 238470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011952565700188183, + "loss": 0.0095, + "step": 238480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011951808930886783, + "loss": 0.0117, + "step": 238490 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001195105216158538, + "loss": 0.0088, + "step": 238500 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011950295392283979, + "loss": 0.0094, + "step": 238510 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011949538622982577, + "loss": 0.008, + "step": 238520 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011948781853681177, + "loss": 0.0072, + "step": 238530 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011948025084379775, + "loss": 0.0093, + "step": 238540 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011947268315078374, + "loss": 0.0105, + "step": 238550 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011946511545776974, + "loss": 0.0082, + "step": 238560 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011945754776475572, + "loss": 0.0087, + "step": 238570 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011944998007174171, + "loss": 0.0079, + "step": 238580 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011944241237872771, + "loss": 0.0105, + "step": 238590 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011943484468571369, + "loss": 0.0134, + "step": 238600 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011942727699269969, + "loss": 0.0087, + "step": 238610 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011941970929968567, + "loss": 0.0089, + "step": 238620 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011941214160667166, + "loss": 0.0089, + "step": 238630 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011940457391365766, + "loss": 0.008, + "step": 238640 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011939700622064364, + "loss": 0.0086, + "step": 238650 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011938943852762963, + "loss": 0.006, + "step": 238660 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011938187083461563, + "loss": 0.008, + "step": 238670 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011937430314160161, + "loss": 0.0102, + "step": 238680 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001193667354485876, + "loss": 0.0093, + "step": 238690 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011935916775557359, + "loss": 0.0068, + "step": 238700 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011935160006255958, + "loss": 0.0154, + "step": 238710 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011934403236954558, + "loss": 0.01, + "step": 238720 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011933646467653156, + "loss": 0.011, + "step": 238730 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011932889698351755, + "loss": 0.014, + "step": 238740 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011932132929050355, + "loss": 0.0096, + "step": 238750 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011931376159748953, + "loss": 0.0136, + "step": 238760 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011930619390447552, + "loss": 0.0114, + "step": 238770 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011929862621146152, + "loss": 0.0117, + "step": 238780 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001192910585184475, + "loss": 0.0094, + "step": 238790 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001192834908254335, + "loss": 0.0101, + "step": 238800 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011927592313241948, + "loss": 0.0109, + "step": 238810 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011926835543940547, + "loss": 0.008, + "step": 238820 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011926078774639147, + "loss": 0.0087, + "step": 238830 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011925322005337745, + "loss": 0.0087, + "step": 238840 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011924565236036344, + "loss": 0.0089, + "step": 238850 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011923808466734944, + "loss": 0.0085, + "step": 238860 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011923051697433542, + "loss": 0.008, + "step": 238870 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011922294928132141, + "loss": 0.0104, + "step": 238880 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001192153815883074, + "loss": 0.01, + "step": 238890 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011920781389529339, + "loss": 0.0075, + "step": 238900 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011920024620227939, + "loss": 0.0132, + "step": 238910 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011919267850926537, + "loss": 0.0115, + "step": 238920 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011918511081625136, + "loss": 0.0073, + "step": 238930 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011917754312323736, + "loss": 0.0087, + "step": 238940 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011916997543022334, + "loss": 0.0086, + "step": 238950 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011916240773720933, + "loss": 0.0075, + "step": 238960 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011915484004419532, + "loss": 0.01, + "step": 238970 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011914727235118131, + "loss": 0.0095, + "step": 238980 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001191397046581673, + "loss": 0.0074, + "step": 238990 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011913213696515329, + "loss": 0.0104, + "step": 239000 + }, + { + "epoch": 1.21, + "eval_cer": 0.914452788772905, + "eval_loss": 0.006802674382925034, + "eval_runtime": 116.1446, + "eval_samples_per_second": 17.22, + "eval_steps_per_second": 4.305, + "step": 239000 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011912456927213928, + "loss": 0.0092, + "step": 239010 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011911700157912528, + "loss": 0.0083, + "step": 239020 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011910943388611126, + "loss": 0.0094, + "step": 239030 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011910186619309725, + "loss": 0.0085, + "step": 239040 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011909429850008323, + "loss": 0.0076, + "step": 239050 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011908673080706923, + "loss": 0.0081, + "step": 239060 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011907916311405522, + "loss": 0.0099, + "step": 239070 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001190715954210412, + "loss": 0.0075, + "step": 239080 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001190640277280272, + "loss": 0.008, + "step": 239090 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001190564600350132, + "loss": 0.007, + "step": 239100 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011904889234199918, + "loss": 0.008, + "step": 239110 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011904132464898517, + "loss": 0.008, + "step": 239120 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011903375695597114, + "loss": 0.0085, + "step": 239130 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011902618926295714, + "loss": 0.0094, + "step": 239140 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011901862156994312, + "loss": 0.0086, + "step": 239150 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011901105387692911, + "loss": 0.0069, + "step": 239160 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011900348618391511, + "loss": 0.0095, + "step": 239170 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011899591849090109, + "loss": 0.0115, + "step": 239180 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011898835079788708, + "loss": 0.0105, + "step": 239190 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011898078310487308, + "loss": 0.0095, + "step": 239200 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011897321541185906, + "loss": 0.009, + "step": 239210 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011896564771884505, + "loss": 0.0087, + "step": 239220 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011895808002583105, + "loss": 0.0114, + "step": 239230 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011895051233281703, + "loss": 0.0121, + "step": 239240 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011894294463980303, + "loss": 0.0107, + "step": 239250 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011893537694678901, + "loss": 0.0095, + "step": 239260 + }, + { + "epoch": 1.21, + "learning_rate": 0.000118927809253775, + "loss": 0.01, + "step": 239270 + }, + { + "epoch": 1.21, + "learning_rate": 0.000118920241560761, + "loss": 0.0069, + "step": 239280 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011891267386774698, + "loss": 0.0089, + "step": 239290 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011890510617473297, + "loss": 0.0079, + "step": 239300 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011889753848171897, + "loss": 0.0109, + "step": 239310 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011888997078870495, + "loss": 0.0067, + "step": 239320 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011888240309569095, + "loss": 0.0119, + "step": 239330 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011887483540267693, + "loss": 0.0096, + "step": 239340 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011886726770966292, + "loss": 0.009, + "step": 239350 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011885970001664892, + "loss": 0.0089, + "step": 239360 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001188521323236349, + "loss": 0.0122, + "step": 239370 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001188445646306209, + "loss": 0.0085, + "step": 239380 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011883699693760689, + "loss": 0.0121, + "step": 239390 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011882942924459287, + "loss": 0.0157, + "step": 239400 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011882186155157886, + "loss": 0.0116, + "step": 239410 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011881429385856485, + "loss": 0.009, + "step": 239420 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011880672616555084, + "loss": 0.008, + "step": 239430 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011879915847253684, + "loss": 0.0129, + "step": 239440 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011879159077952282, + "loss": 0.0101, + "step": 239450 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011878402308650881, + "loss": 0.0082, + "step": 239460 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011877645539349481, + "loss": 0.0088, + "step": 239470 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011876888770048079, + "loss": 0.0076, + "step": 239480 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011876132000746678, + "loss": 0.0095, + "step": 239490 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011875375231445277, + "loss": 0.008, + "step": 239500 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011874618462143876, + "loss": 0.0095, + "step": 239510 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011873861692842476, + "loss": 0.0069, + "step": 239520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011873104923541074, + "loss": 0.0066, + "step": 239530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011872348154239673, + "loss": 0.0062, + "step": 239540 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011871591384938273, + "loss": 0.0083, + "step": 239550 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011870834615636871, + "loss": 0.0108, + "step": 239560 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001187007784633547, + "loss": 0.007, + "step": 239570 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011869321077034068, + "loss": 0.0102, + "step": 239580 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011868564307732668, + "loss": 0.011, + "step": 239590 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011867807538431267, + "loss": 0.0107, + "step": 239600 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011867050769129866, + "loss": 0.0106, + "step": 239610 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011866293999828465, + "loss": 0.0095, + "step": 239620 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011865537230527065, + "loss": 0.0095, + "step": 239630 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011864780461225663, + "loss": 0.0091, + "step": 239640 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011864023691924262, + "loss": 0.0085, + "step": 239650 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001186326692262286, + "loss": 0.0107, + "step": 239660 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001186251015332146, + "loss": 0.0118, + "step": 239670 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001186175338402006, + "loss": 0.009, + "step": 239680 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011860996614718658, + "loss": 0.0103, + "step": 239690 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011860239845417257, + "loss": 0.0054, + "step": 239700 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011859483076115857, + "loss": 0.0111, + "step": 239710 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011858726306814455, + "loss": 0.0119, + "step": 239720 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011857969537513054, + "loss": 0.0082, + "step": 239730 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011857212768211652, + "loss": 0.0077, + "step": 239740 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011856455998910252, + "loss": 0.0077, + "step": 239750 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001185569922960885, + "loss": 0.0089, + "step": 239760 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011854942460307448, + "loss": 0.008, + "step": 239770 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011854185691006048, + "loss": 0.0062, + "step": 239780 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011853428921704646, + "loss": 0.0078, + "step": 239790 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011852672152403245, + "loss": 0.0077, + "step": 239800 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011851915383101845, + "loss": 0.008, + "step": 239810 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011851158613800443, + "loss": 0.009, + "step": 239820 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011850401844499042, + "loss": 0.0081, + "step": 239830 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011849645075197642, + "loss": 0.0091, + "step": 239840 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001184888830589624, + "loss": 0.0097, + "step": 239850 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001184813153659484, + "loss": 0.0075, + "step": 239860 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011847374767293438, + "loss": 0.0067, + "step": 239870 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011846617997992037, + "loss": 0.0084, + "step": 239880 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011845861228690637, + "loss": 0.0079, + "step": 239890 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011845104459389235, + "loss": 0.0075, + "step": 239900 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011844347690087834, + "loss": 0.0079, + "step": 239910 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011843590920786434, + "loss": 0.0084, + "step": 239920 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011842834151485032, + "loss": 0.0077, + "step": 239930 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011842077382183631, + "loss": 0.0082, + "step": 239940 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001184132061288223, + "loss": 0.009, + "step": 239950 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011840563843580829, + "loss": 0.0076, + "step": 239960 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011839807074279429, + "loss": 0.0085, + "step": 239970 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011839050304978027, + "loss": 0.0076, + "step": 239980 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011838293535676626, + "loss": 0.0097, + "step": 239990 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011837536766375226, + "loss": 0.0094, + "step": 240000 + }, + { + "epoch": 1.21, + "eval_cer": 0.9144537591690304, + "eval_loss": 0.006650357041507959, + "eval_runtime": 116.0541, + "eval_samples_per_second": 17.233, + "eval_steps_per_second": 4.308, + "step": 240000 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011836779997073824, + "loss": 0.0113, + "step": 240010 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011836023227772423, + "loss": 0.0091, + "step": 240020 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011835266458471022, + "loss": 0.0129, + "step": 240030 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011834509689169621, + "loss": 0.0065, + "step": 240040 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001183375291986822, + "loss": 0.0102, + "step": 240050 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011832996150566819, + "loss": 0.0102, + "step": 240060 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011832239381265418, + "loss": 0.0093, + "step": 240070 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011831482611964018, + "loss": 0.0099, + "step": 240080 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011830725842662616, + "loss": 0.0091, + "step": 240090 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011829969073361215, + "loss": 0.0108, + "step": 240100 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011829212304059813, + "loss": 0.0067, + "step": 240110 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011828455534758413, + "loss": 0.0085, + "step": 240120 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011827698765457012, + "loss": 0.0086, + "step": 240130 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001182694199615561, + "loss": 0.0085, + "step": 240140 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001182618522685421, + "loss": 0.0077, + "step": 240150 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001182542845755281, + "loss": 0.0075, + "step": 240160 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011824671688251408, + "loss": 0.0091, + "step": 240170 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011823914918950007, + "loss": 0.0082, + "step": 240180 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011823158149648605, + "loss": 0.0077, + "step": 240190 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011822401380347205, + "loss": 0.009, + "step": 240200 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011821644611045804, + "loss": 0.0085, + "step": 240210 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011820887841744403, + "loss": 0.0086, + "step": 240220 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011820131072443002, + "loss": 0.0077, + "step": 240230 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011819374303141602, + "loss": 0.009, + "step": 240240 + }, + { + "epoch": 1.21, + "learning_rate": 0.000118186175338402, + "loss": 0.0079, + "step": 240250 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011817860764538799, + "loss": 0.0118, + "step": 240260 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011817103995237399, + "loss": 0.008, + "step": 240270 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011816347225935997, + "loss": 0.0072, + "step": 240280 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011815590456634596, + "loss": 0.0075, + "step": 240290 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011814833687333194, + "loss": 0.008, + "step": 240300 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011814076918031794, + "loss": 0.008, + "step": 240310 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011813320148730393, + "loss": 0.0086, + "step": 240320 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011812563379428992, + "loss": 0.0074, + "step": 240330 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011811806610127591, + "loss": 0.0094, + "step": 240340 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001181104984082619, + "loss": 0.0072, + "step": 240350 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011810293071524789, + "loss": 0.009, + "step": 240360 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011809536302223388, + "loss": 0.0111, + "step": 240370 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011808779532921985, + "loss": 0.0085, + "step": 240380 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011808022763620585, + "loss": 0.0093, + "step": 240390 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011807265994319183, + "loss": 0.0099, + "step": 240400 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011806509225017782, + "loss": 0.0093, + "step": 240410 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011805752455716382, + "loss": 0.0074, + "step": 240420 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001180499568641498, + "loss": 0.0078, + "step": 240430 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001180423891711358, + "loss": 0.0111, + "step": 240440 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011803482147812179, + "loss": 0.0108, + "step": 240450 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011802725378510777, + "loss": 0.0064, + "step": 240460 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011801968609209376, + "loss": 0.0073, + "step": 240470 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011801211839907975, + "loss": 0.0078, + "step": 240480 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011800455070606574, + "loss": 0.0115, + "step": 240490 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011799698301305174, + "loss": 0.0078, + "step": 240500 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011798941532003772, + "loss": 0.009, + "step": 240510 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011798184762702371, + "loss": 0.0067, + "step": 240520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011797427993400971, + "loss": 0.0092, + "step": 240530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011796671224099569, + "loss": 0.0081, + "step": 240540 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011795914454798168, + "loss": 0.0083, + "step": 240550 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011795157685496767, + "loss": 0.0081, + "step": 240560 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011794400916195366, + "loss": 0.0073, + "step": 240570 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011793644146893966, + "loss": 0.0076, + "step": 240580 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011792887377592564, + "loss": 0.0071, + "step": 240590 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011792130608291163, + "loss": 0.0091, + "step": 240600 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011791373838989763, + "loss": 0.0074, + "step": 240610 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011790617069688361, + "loss": 0.0104, + "step": 240620 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001178986030038696, + "loss": 0.0088, + "step": 240630 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011789103531085559, + "loss": 0.0082, + "step": 240640 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011788346761784158, + "loss": 0.0143, + "step": 240650 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011787589992482758, + "loss": 0.0065, + "step": 240660 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011786833223181356, + "loss": 0.0099, + "step": 240670 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011786076453879955, + "loss": 0.0077, + "step": 240680 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011785319684578555, + "loss": 0.0119, + "step": 240690 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011784562915277153, + "loss": 0.008, + "step": 240700 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011783806145975752, + "loss": 0.0092, + "step": 240710 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011783049376674352, + "loss": 0.0078, + "step": 240720 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001178229260737295, + "loss": 0.0086, + "step": 240730 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001178153583807155, + "loss": 0.0084, + "step": 240740 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011780779068770148, + "loss": 0.0095, + "step": 240750 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011780022299468747, + "loss": 0.0092, + "step": 240760 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011779265530167347, + "loss": 0.0088, + "step": 240770 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011778508760865945, + "loss": 0.01, + "step": 240780 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011777751991564544, + "loss": 0.0105, + "step": 240790 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011776995222263144, + "loss": 0.0083, + "step": 240800 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011776238452961742, + "loss": 0.0094, + "step": 240810 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011775481683660341, + "loss": 0.0067, + "step": 240820 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001177472491435894, + "loss": 0.0084, + "step": 240830 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011773968145057539, + "loss": 0.0106, + "step": 240840 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011773211375756139, + "loss": 0.0092, + "step": 240850 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011772454606454737, + "loss": 0.0089, + "step": 240860 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011771697837153336, + "loss": 0.0101, + "step": 240870 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011770941067851936, + "loss": 0.0092, + "step": 240880 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011770184298550534, + "loss": 0.0093, + "step": 240890 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011769427529249133, + "loss": 0.0081, + "step": 240900 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011768670759947731, + "loss": 0.0071, + "step": 240910 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011767913990646331, + "loss": 0.0068, + "step": 240920 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001176715722134493, + "loss": 0.0152, + "step": 240930 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011766400452043529, + "loss": 0.0089, + "step": 240940 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011765643682742128, + "loss": 0.01, + "step": 240950 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011764886913440728, + "loss": 0.0083, + "step": 240960 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011764130144139326, + "loss": 0.0104, + "step": 240970 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011763373374837925, + "loss": 0.01, + "step": 240980 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011762616605536523, + "loss": 0.0068, + "step": 240990 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011761859836235123, + "loss": 0.0096, + "step": 241000 + }, + { + "epoch": 1.22, + "eval_cer": 0.9144644335264098, + "eval_loss": 0.00682118721306324, + "eval_runtime": 115.8371, + "eval_samples_per_second": 17.266, + "eval_steps_per_second": 4.316, + "step": 241000 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001176110306693372, + "loss": 0.009, + "step": 241010 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011760346297632319, + "loss": 0.0076, + "step": 241020 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011759589528330919, + "loss": 0.0101, + "step": 241030 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011758832759029517, + "loss": 0.008, + "step": 241040 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011758075989728116, + "loss": 0.0074, + "step": 241050 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011757319220426716, + "loss": 0.0099, + "step": 241060 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011756562451125314, + "loss": 0.0094, + "step": 241070 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011755805681823913, + "loss": 0.0089, + "step": 241080 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011755048912522512, + "loss": 0.0091, + "step": 241090 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011754292143221111, + "loss": 0.0092, + "step": 241100 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001175353537391971, + "loss": 0.0076, + "step": 241110 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011752778604618309, + "loss": 0.0101, + "step": 241120 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011752021835316908, + "loss": 0.008, + "step": 241130 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011751265066015508, + "loss": 0.0094, + "step": 241140 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011750508296714106, + "loss": 0.0082, + "step": 241150 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011749751527412705, + "loss": 0.0109, + "step": 241160 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011748994758111305, + "loss": 0.007, + "step": 241170 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011748237988809903, + "loss": 0.0094, + "step": 241180 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011747481219508503, + "loss": 0.012, + "step": 241190 + }, + { + "epoch": 1.22, + "learning_rate": 0.000117467244502071, + "loss": 0.0086, + "step": 241200 + }, + { + "epoch": 1.22, + "learning_rate": 0.000117459676809057, + "loss": 0.0098, + "step": 241210 + }, + { + "epoch": 1.22, + "learning_rate": 0.000117452109116043, + "loss": 0.0079, + "step": 241220 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011744454142302898, + "loss": 0.0094, + "step": 241230 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011743697373001497, + "loss": 0.0072, + "step": 241240 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011742940603700097, + "loss": 0.0093, + "step": 241250 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011742183834398695, + "loss": 0.0075, + "step": 241260 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011741427065097294, + "loss": 0.0064, + "step": 241270 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011740670295795893, + "loss": 0.0112, + "step": 241280 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011739913526494492, + "loss": 0.008, + "step": 241290 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011739156757193092, + "loss": 0.0069, + "step": 241300 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001173839998789169, + "loss": 0.0092, + "step": 241310 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011737643218590289, + "loss": 0.0076, + "step": 241320 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011736886449288889, + "loss": 0.0095, + "step": 241330 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011736129679987487, + "loss": 0.0076, + "step": 241340 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011735372910686086, + "loss": 0.0086, + "step": 241350 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011734616141384685, + "loss": 0.0082, + "step": 241360 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011733859372083284, + "loss": 0.0092, + "step": 241370 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011733102602781884, + "loss": 0.0105, + "step": 241380 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011732345833480482, + "loss": 0.008, + "step": 241390 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011731589064179081, + "loss": 0.0086, + "step": 241400 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001173083229487768, + "loss": 0.0106, + "step": 241410 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011730075525576279, + "loss": 0.0089, + "step": 241420 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011729318756274878, + "loss": 0.0082, + "step": 241430 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011728561986973476, + "loss": 0.0106, + "step": 241440 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011727805217672076, + "loss": 0.0094, + "step": 241450 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011727048448370675, + "loss": 0.0086, + "step": 241460 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011726291679069274, + "loss": 0.0089, + "step": 241470 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011725534909767873, + "loss": 0.0072, + "step": 241480 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011724778140466473, + "loss": 0.0098, + "step": 241490 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011724021371165071, + "loss": 0.0069, + "step": 241500 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001172326460186367, + "loss": 0.0082, + "step": 241510 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011722507832562268, + "loss": 0.0103, + "step": 241520 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011721751063260868, + "loss": 0.0091, + "step": 241530 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011720994293959467, + "loss": 0.0061, + "step": 241540 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011720237524658066, + "loss": 0.0092, + "step": 241550 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011719480755356665, + "loss": 0.0088, + "step": 241560 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011718723986055265, + "loss": 0.0072, + "step": 241570 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011717967216753863, + "loss": 0.0063, + "step": 241580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011717210447452462, + "loss": 0.0099, + "step": 241590 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001171645367815106, + "loss": 0.0075, + "step": 241600 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001171569690884966, + "loss": 0.01, + "step": 241610 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011714940139548259, + "loss": 0.007, + "step": 241620 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011714183370246857, + "loss": 0.0139, + "step": 241630 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011713426600945456, + "loss": 0.0063, + "step": 241640 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011712669831644054, + "loss": 0.0064, + "step": 241650 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011711913062342653, + "loss": 0.0109, + "step": 241660 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011711156293041253, + "loss": 0.0095, + "step": 241670 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011710399523739851, + "loss": 0.0121, + "step": 241680 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001170964275443845, + "loss": 0.0091, + "step": 241690 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001170888598513705, + "loss": 0.0068, + "step": 241700 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011708129215835648, + "loss": 0.0092, + "step": 241710 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011707372446534248, + "loss": 0.0075, + "step": 241720 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011706615677232846, + "loss": 0.009, + "step": 241730 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011705858907931445, + "loss": 0.0067, + "step": 241740 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011705102138630045, + "loss": 0.0087, + "step": 241750 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011704345369328643, + "loss": 0.0099, + "step": 241760 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011703588600027242, + "loss": 0.0085, + "step": 241770 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011702831830725842, + "loss": 0.0084, + "step": 241780 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001170207506142444, + "loss": 0.0078, + "step": 241790 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001170131829212304, + "loss": 0.0106, + "step": 241800 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011700561522821638, + "loss": 0.0083, + "step": 241810 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011699804753520237, + "loss": 0.0099, + "step": 241820 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011699047984218837, + "loss": 0.0091, + "step": 241830 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011698291214917435, + "loss": 0.0086, + "step": 241840 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011697534445616034, + "loss": 0.0081, + "step": 241850 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011696777676314634, + "loss": 0.0075, + "step": 241860 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011696020907013232, + "loss": 0.0075, + "step": 241870 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011695264137711831, + "loss": 0.0098, + "step": 241880 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001169450736841043, + "loss": 0.0075, + "step": 241890 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011693750599109029, + "loss": 0.0063, + "step": 241900 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011692993829807629, + "loss": 0.0092, + "step": 241910 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011692237060506227, + "loss": 0.0076, + "step": 241920 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011691480291204826, + "loss": 0.0099, + "step": 241930 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011690723521903426, + "loss": 0.0111, + "step": 241940 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011689966752602024, + "loss": 0.01, + "step": 241950 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011689209983300623, + "loss": 0.0082, + "step": 241960 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011688453213999221, + "loss": 0.0092, + "step": 241970 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011687696444697821, + "loss": 0.0101, + "step": 241980 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001168693967539642, + "loss": 0.0077, + "step": 241990 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011686182906095019, + "loss": 0.0066, + "step": 242000 + }, + { + "epoch": 1.22, + "eval_cer": 0.914452788772905, + "eval_loss": 0.006828702986240387, + "eval_runtime": 115.9715, + "eval_samples_per_second": 17.246, + "eval_steps_per_second": 4.311, + "step": 242000 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011685426136793618, + "loss": 0.0095, + "step": 242010 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011684669367492218, + "loss": 0.0078, + "step": 242020 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011683912598190816, + "loss": 0.0118, + "step": 242030 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011683155828889415, + "loss": 0.0077, + "step": 242040 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011682399059588013, + "loss": 0.0069, + "step": 242050 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011681642290286613, + "loss": 0.0081, + "step": 242060 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011680885520985212, + "loss": 0.0084, + "step": 242070 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001168012875168381, + "loss": 0.0099, + "step": 242080 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001167937198238241, + "loss": 0.0099, + "step": 242090 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001167861521308101, + "loss": 0.0084, + "step": 242100 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011677858443779608, + "loss": 0.0108, + "step": 242110 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011677101674478207, + "loss": 0.0062, + "step": 242120 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011676344905176805, + "loss": 0.0079, + "step": 242130 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011675588135875405, + "loss": 0.0175, + "step": 242140 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011674831366574004, + "loss": 0.0095, + "step": 242150 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011674074597272602, + "loss": 0.007, + "step": 242160 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011673317827971202, + "loss": 0.0118, + "step": 242170 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011672561058669801, + "loss": 0.0104, + "step": 242180 + }, + { + "epoch": 1.22, + "learning_rate": 0.000116718042893684, + "loss": 0.0086, + "step": 242190 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011671047520066999, + "loss": 0.0094, + "step": 242200 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011670290750765599, + "loss": 0.0085, + "step": 242210 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011669533981464197, + "loss": 0.0105, + "step": 242220 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011668777212162796, + "loss": 0.0074, + "step": 242230 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011668020442861394, + "loss": 0.0078, + "step": 242240 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011667263673559994, + "loss": 0.0091, + "step": 242250 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011666506904258593, + "loss": 0.0106, + "step": 242260 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001166575013495719, + "loss": 0.0089, + "step": 242270 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001166499336565579, + "loss": 0.0077, + "step": 242280 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011664236596354388, + "loss": 0.0124, + "step": 242290 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011663479827052987, + "loss": 0.0078, + "step": 242300 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011662723057751587, + "loss": 0.0122, + "step": 242310 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011661966288450185, + "loss": 0.008, + "step": 242320 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011661209519148784, + "loss": 0.0117, + "step": 242330 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011660452749847383, + "loss": 0.0086, + "step": 242340 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011659695980545982, + "loss": 0.0096, + "step": 242350 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011658939211244582, + "loss": 0.0084, + "step": 242360 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001165818244194318, + "loss": 0.012, + "step": 242370 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011657425672641779, + "loss": 0.0099, + "step": 242380 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011656668903340379, + "loss": 0.0084, + "step": 242390 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011655912134038977, + "loss": 0.0101, + "step": 242400 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011655155364737576, + "loss": 0.0102, + "step": 242410 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011654398595436175, + "loss": 0.0097, + "step": 242420 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011653641826134774, + "loss": 0.0113, + "step": 242430 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011652885056833374, + "loss": 0.0103, + "step": 242440 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011652128287531972, + "loss": 0.0093, + "step": 242450 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011651371518230571, + "loss": 0.0087, + "step": 242460 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011650614748929171, + "loss": 0.0088, + "step": 242470 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011649857979627769, + "loss": 0.011, + "step": 242480 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011649101210326368, + "loss": 0.0075, + "step": 242490 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011648344441024966, + "loss": 0.0078, + "step": 242500 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011647587671723566, + "loss": 0.0076, + "step": 242510 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011646830902422165, + "loss": 0.0074, + "step": 242520 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011646074133120764, + "loss": 0.0097, + "step": 242530 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011645317363819363, + "loss": 0.0106, + "step": 242540 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011644560594517963, + "loss": 0.0096, + "step": 242550 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011643803825216561, + "loss": 0.0083, + "step": 242560 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001164304705591516, + "loss": 0.008, + "step": 242570 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011642290286613758, + "loss": 0.0097, + "step": 242580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011641533517312358, + "loss": 0.0077, + "step": 242590 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011640776748010957, + "loss": 0.0096, + "step": 242600 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011640019978709556, + "loss": 0.0104, + "step": 242610 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011639263209408155, + "loss": 0.0094, + "step": 242620 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011638506440106755, + "loss": 0.0079, + "step": 242630 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011637749670805353, + "loss": 0.0072, + "step": 242640 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011636992901503952, + "loss": 0.0078, + "step": 242650 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011636236132202552, + "loss": 0.0078, + "step": 242660 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001163547936290115, + "loss": 0.0083, + "step": 242670 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001163472259359975, + "loss": 0.007, + "step": 242680 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011633965824298347, + "loss": 0.0072, + "step": 242690 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011633209054996947, + "loss": 0.0079, + "step": 242700 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011632452285695546, + "loss": 0.0102, + "step": 242710 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011631695516394145, + "loss": 0.0082, + "step": 242720 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011630938747092744, + "loss": 0.0093, + "step": 242730 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011630181977791344, + "loss": 0.0074, + "step": 242740 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011629425208489942, + "loss": 0.0108, + "step": 242750 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011628668439188541, + "loss": 0.0086, + "step": 242760 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001162791166988714, + "loss": 0.0104, + "step": 242770 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011627154900585739, + "loss": 0.0114, + "step": 242780 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011626398131284338, + "loss": 0.0087, + "step": 242790 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011625641361982937, + "loss": 0.0087, + "step": 242800 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011624884592681536, + "loss": 0.0112, + "step": 242810 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011624127823380136, + "loss": 0.0091, + "step": 242820 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011623371054078734, + "loss": 0.0068, + "step": 242830 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011622614284777333, + "loss": 0.0089, + "step": 242840 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011621857515475931, + "loss": 0.0091, + "step": 242850 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011621100746174531, + "loss": 0.0098, + "step": 242860 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001162034397687313, + "loss": 0.008, + "step": 242870 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011619587207571728, + "loss": 0.0095, + "step": 242880 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011618830438270328, + "loss": 0.0126, + "step": 242890 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011618073668968925, + "loss": 0.0092, + "step": 242900 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011617316899667524, + "loss": 0.0085, + "step": 242910 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011616560130366124, + "loss": 0.01, + "step": 242920 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011615803361064722, + "loss": 0.0084, + "step": 242930 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011615046591763321, + "loss": 0.008, + "step": 242940 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001161428982246192, + "loss": 0.0072, + "step": 242950 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011613533053160519, + "loss": 0.0086, + "step": 242960 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011612776283859119, + "loss": 0.007, + "step": 242970 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011612019514557717, + "loss": 0.0097, + "step": 242980 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011611262745256316, + "loss": 0.0086, + "step": 242990 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011610505975954916, + "loss": 0.0072, + "step": 243000 + }, + { + "epoch": 1.23, + "eval_cer": 0.9144401736232748, + "eval_loss": 0.006801496725529432, + "eval_runtime": 115.8442, + "eval_samples_per_second": 17.265, + "eval_steps_per_second": 4.316, + "step": 243000 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011609749206653514, + "loss": 0.008, + "step": 243010 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011608992437352113, + "loss": 0.0087, + "step": 243020 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011608235668050711, + "loss": 0.008, + "step": 243030 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011607478898749311, + "loss": 0.0099, + "step": 243040 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001160672212944791, + "loss": 0.0075, + "step": 243050 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011605965360146509, + "loss": 0.0095, + "step": 243060 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011605208590845108, + "loss": 0.0066, + "step": 243070 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011604451821543708, + "loss": 0.0085, + "step": 243080 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011603695052242306, + "loss": 0.0087, + "step": 243090 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011602938282940905, + "loss": 0.0074, + "step": 243100 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011602181513639505, + "loss": 0.0061, + "step": 243110 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011601424744338103, + "loss": 0.0112, + "step": 243120 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011600667975036702, + "loss": 0.0095, + "step": 243130 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115999112057353, + "loss": 0.0083, + "step": 243140 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115991544364339, + "loss": 0.0089, + "step": 243150 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115983976671325, + "loss": 0.0105, + "step": 243160 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011597640897831098, + "loss": 0.0081, + "step": 243170 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011596884128529697, + "loss": 0.0112, + "step": 243180 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011596127359228297, + "loss": 0.0081, + "step": 243190 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011595370589926895, + "loss": 0.0083, + "step": 243200 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011594613820625494, + "loss": 0.0116, + "step": 243210 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011593857051324092, + "loss": 0.0099, + "step": 243220 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011593100282022692, + "loss": 0.0075, + "step": 243230 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011592343512721291, + "loss": 0.0065, + "step": 243240 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001159158674341989, + "loss": 0.0084, + "step": 243250 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011590829974118489, + "loss": 0.0082, + "step": 243260 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011590073204817089, + "loss": 0.0113, + "step": 243270 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011589316435515687, + "loss": 0.0084, + "step": 243280 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011588559666214286, + "loss": 0.008, + "step": 243290 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011587802896912884, + "loss": 0.009, + "step": 243300 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011587046127611484, + "loss": 0.0114, + "step": 243310 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011586289358310083, + "loss": 0.0094, + "step": 243320 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011585532589008682, + "loss": 0.0073, + "step": 243330 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011584775819707281, + "loss": 0.0095, + "step": 243340 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001158401905040588, + "loss": 0.0098, + "step": 243350 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011583262281104479, + "loss": 0.0084, + "step": 243360 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011582505511803078, + "loss": 0.0064, + "step": 243370 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011581748742501676, + "loss": 0.0093, + "step": 243380 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011580991973200276, + "loss": 0.0094, + "step": 243390 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011580235203898875, + "loss": 0.0099, + "step": 243400 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011579478434597473, + "loss": 0.0103, + "step": 243410 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011578721665296073, + "loss": 0.0087, + "step": 243420 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011577964895994672, + "loss": 0.0092, + "step": 243430 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001157720812669327, + "loss": 0.0077, + "step": 243440 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001157645135739187, + "loss": 0.0105, + "step": 243450 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011575694588090468, + "loss": 0.0064, + "step": 243460 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011574937818789068, + "loss": 0.0084, + "step": 243470 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011574181049487667, + "loss": 0.0086, + "step": 243480 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011573424280186265, + "loss": 0.0076, + "step": 243490 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011572667510884865, + "loss": 0.0082, + "step": 243500 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011571910741583464, + "loss": 0.0068, + "step": 243510 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011571153972282063, + "loss": 0.01, + "step": 243520 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011570397202980661, + "loss": 0.0089, + "step": 243530 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011569640433679259, + "loss": 0.0078, + "step": 243540 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011568883664377858, + "loss": 0.007, + "step": 243550 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011568126895076458, + "loss": 0.0085, + "step": 243560 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011567370125775056, + "loss": 0.0097, + "step": 243570 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011566613356473656, + "loss": 0.0106, + "step": 243580 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011565856587172254, + "loss": 0.0081, + "step": 243590 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011565099817870853, + "loss": 0.0091, + "step": 243600 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011564343048569453, + "loss": 0.0128, + "step": 243610 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011563586279268051, + "loss": 0.0085, + "step": 243620 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001156282950996665, + "loss": 0.0087, + "step": 243630 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001156207274066525, + "loss": 0.0089, + "step": 243640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011561315971363848, + "loss": 0.0075, + "step": 243650 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011560559202062447, + "loss": 0.0074, + "step": 243660 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011559802432761046, + "loss": 0.0089, + "step": 243670 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011559045663459645, + "loss": 0.0084, + "step": 243680 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011558288894158245, + "loss": 0.0083, + "step": 243690 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011557532124856843, + "loss": 0.008, + "step": 243700 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011556775355555442, + "loss": 0.0082, + "step": 243710 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011556018586254042, + "loss": 0.0079, + "step": 243720 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001155526181695264, + "loss": 0.0062, + "step": 243730 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001155450504765124, + "loss": 0.0079, + "step": 243740 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011553748278349838, + "loss": 0.0086, + "step": 243750 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011552991509048437, + "loss": 0.0108, + "step": 243760 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011552234739747037, + "loss": 0.0095, + "step": 243770 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011551477970445635, + "loss": 0.0083, + "step": 243780 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011550721201144234, + "loss": 0.0077, + "step": 243790 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011549964431842834, + "loss": 0.0078, + "step": 243800 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011549207662541432, + "loss": 0.0095, + "step": 243810 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011548450893240031, + "loss": 0.0108, + "step": 243820 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001154769412393863, + "loss": 0.0075, + "step": 243830 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011546937354637229, + "loss": 0.007, + "step": 243840 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011546180585335828, + "loss": 0.0094, + "step": 243850 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011545423816034427, + "loss": 0.0087, + "step": 243860 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011544667046733026, + "loss": 0.0076, + "step": 243870 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011543910277431626, + "loss": 0.0091, + "step": 243880 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011543153508130224, + "loss": 0.0088, + "step": 243890 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011542396738828823, + "loss": 0.0078, + "step": 243900 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011541639969527421, + "loss": 0.0072, + "step": 243910 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011540883200226021, + "loss": 0.0076, + "step": 243920 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001154012643092462, + "loss": 0.0079, + "step": 243930 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011539369661623219, + "loss": 0.0091, + "step": 243940 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011538612892321818, + "loss": 0.0087, + "step": 243950 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011537856123020418, + "loss": 0.008, + "step": 243960 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011537099353719016, + "loss": 0.006, + "step": 243970 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011536342584417615, + "loss": 0.0075, + "step": 243980 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011535585815116213, + "loss": 0.0075, + "step": 243990 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011534829045814813, + "loss": 0.0077, + "step": 244000 + }, + { + "epoch": 1.23, + "eval_cer": 0.9144731670915385, + "eval_loss": 0.00690747844055295, + "eval_runtime": 116.0173, + "eval_samples_per_second": 17.239, + "eval_steps_per_second": 4.31, + "step": 244000 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011534072276513412, + "loss": 0.007, + "step": 244010 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001153331550721201, + "loss": 0.0058, + "step": 244020 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001153255873791061, + "loss": 0.0058, + "step": 244030 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001153180196860921, + "loss": 0.0135, + "step": 244040 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011531045199307808, + "loss": 0.009, + "step": 244050 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011530288430006407, + "loss": 0.0083, + "step": 244060 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011529531660705005, + "loss": 0.0095, + "step": 244070 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011528774891403605, + "loss": 0.0074, + "step": 244080 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011528018122102204, + "loss": 0.0089, + "step": 244090 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011527261352800802, + "loss": 0.0083, + "step": 244100 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011526504583499402, + "loss": 0.0085, + "step": 244110 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011525747814198001, + "loss": 0.0083, + "step": 244120 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115249910448966, + "loss": 0.0076, + "step": 244130 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011524234275595199, + "loss": 0.0103, + "step": 244140 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011523477506293799, + "loss": 0.0077, + "step": 244150 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011522720736992395, + "loss": 0.0104, + "step": 244160 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011521963967690995, + "loss": 0.0092, + "step": 244170 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011521207198389593, + "loss": 0.0099, + "step": 244180 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011520450429088192, + "loss": 0.0099, + "step": 244190 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001151969365978679, + "loss": 0.0085, + "step": 244200 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001151893689048539, + "loss": 0.0087, + "step": 244210 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001151818012118399, + "loss": 0.0111, + "step": 244220 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011517423351882588, + "loss": 0.0085, + "step": 244230 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011516666582581187, + "loss": 0.0106, + "step": 244240 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011515909813279787, + "loss": 0.0089, + "step": 244250 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011515153043978385, + "loss": 0.0116, + "step": 244260 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011514396274676984, + "loss": 0.009, + "step": 244270 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011513639505375583, + "loss": 0.0083, + "step": 244280 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011512882736074182, + "loss": 0.0093, + "step": 244290 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011512125966772782, + "loss": 0.0078, + "step": 244300 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001151136919747138, + "loss": 0.0082, + "step": 244310 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011510612428169979, + "loss": 0.0081, + "step": 244320 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011509855658868579, + "loss": 0.0124, + "step": 244330 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011509098889567177, + "loss": 0.0068, + "step": 244340 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011508342120265776, + "loss": 0.01, + "step": 244350 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011507585350964374, + "loss": 0.0093, + "step": 244360 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011506828581662974, + "loss": 0.0085, + "step": 244370 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011506071812361573, + "loss": 0.0086, + "step": 244380 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011505315043060172, + "loss": 0.009, + "step": 244390 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011504558273758771, + "loss": 0.0076, + "step": 244400 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001150380150445737, + "loss": 0.0076, + "step": 244410 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011503044735155969, + "loss": 0.0121, + "step": 244420 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011502287965854568, + "loss": 0.0088, + "step": 244430 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011501531196553166, + "loss": 0.0085, + "step": 244440 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011500774427251766, + "loss": 0.0091, + "step": 244450 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011500017657950365, + "loss": 0.0089, + "step": 244460 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011499260888648964, + "loss": 0.0087, + "step": 244470 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011498504119347563, + "loss": 0.0099, + "step": 244480 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011497747350046163, + "loss": 0.0102, + "step": 244490 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001149699058074476, + "loss": 0.0073, + "step": 244500 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001149623381144336, + "loss": 0.013, + "step": 244510 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011495477042141958, + "loss": 0.0087, + "step": 244520 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011494720272840558, + "loss": 0.0093, + "step": 244530 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011493963503539157, + "loss": 0.0091, + "step": 244540 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011493206734237755, + "loss": 0.0103, + "step": 244550 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011492449964936355, + "loss": 0.0096, + "step": 244560 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011491693195634954, + "loss": 0.0086, + "step": 244570 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011490936426333553, + "loss": 0.0098, + "step": 244580 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011490179657032152, + "loss": 0.0086, + "step": 244590 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011489422887730752, + "loss": 0.0095, + "step": 244600 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001148866611842935, + "loss": 0.0092, + "step": 244610 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011487909349127949, + "loss": 0.0092, + "step": 244620 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011487152579826547, + "loss": 0.0105, + "step": 244630 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011486395810525147, + "loss": 0.009, + "step": 244640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011485639041223746, + "loss": 0.0071, + "step": 244650 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011484882271922345, + "loss": 0.0095, + "step": 244660 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011484125502620944, + "loss": 0.0117, + "step": 244670 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011483368733319544, + "loss": 0.0106, + "step": 244680 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011482611964018142, + "loss": 0.0073, + "step": 244690 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011481855194716741, + "loss": 0.0073, + "step": 244700 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011481098425415339, + "loss": 0.0147, + "step": 244710 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011480341656113939, + "loss": 0.01, + "step": 244720 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011479584886812538, + "loss": 0.0083, + "step": 244730 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011478828117511136, + "loss": 0.0085, + "step": 244740 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011478071348209736, + "loss": 0.0076, + "step": 244750 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011477314578908335, + "loss": 0.0077, + "step": 244760 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011476557809606934, + "loss": 0.0118, + "step": 244770 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011475801040305532, + "loss": 0.0099, + "step": 244780 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001147504427100413, + "loss": 0.0101, + "step": 244790 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001147428750170273, + "loss": 0.0093, + "step": 244800 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011473530732401328, + "loss": 0.0073, + "step": 244810 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011472773963099927, + "loss": 0.0087, + "step": 244820 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011472017193798527, + "loss": 0.009, + "step": 244830 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011471260424497125, + "loss": 0.0075, + "step": 244840 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011470503655195724, + "loss": 0.0085, + "step": 244850 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011469746885894324, + "loss": 0.0088, + "step": 244860 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011468990116592922, + "loss": 0.0071, + "step": 244870 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011468233347291521, + "loss": 0.0079, + "step": 244880 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001146747657799012, + "loss": 0.0101, + "step": 244890 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011466719808688719, + "loss": 0.0074, + "step": 244900 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011465963039387318, + "loss": 0.0117, + "step": 244910 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011465206270085917, + "loss": 0.0089, + "step": 244920 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011464449500784516, + "loss": 0.0079, + "step": 244930 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011463692731483116, + "loss": 0.0119, + "step": 244940 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011462935962181714, + "loss": 0.0103, + "step": 244950 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011462179192880313, + "loss": 0.0083, + "step": 244960 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011461422423578911, + "loss": 0.0081, + "step": 244970 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011460665654277511, + "loss": 0.0092, + "step": 244980 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001145990888497611, + "loss": 0.0088, + "step": 244990 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011459152115674709, + "loss": 0.0093, + "step": 245000 + }, + { + "epoch": 1.24, + "eval_cer": 0.9144741374876638, + "eval_loss": 0.006758058909326792, + "eval_runtime": 115.9822, + "eval_samples_per_second": 17.244, + "eval_steps_per_second": 4.311, + "step": 245000 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011458395346373308, + "loss": 0.0081, + "step": 245010 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011457638577071908, + "loss": 0.0073, + "step": 245020 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011456881807770506, + "loss": 0.0077, + "step": 245030 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011456125038469105, + "loss": 0.0079, + "step": 245040 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011455368269167705, + "loss": 0.007, + "step": 245050 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011454611499866303, + "loss": 0.0085, + "step": 245060 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011453854730564902, + "loss": 0.0083, + "step": 245070 + }, + { + "epoch": 1.24, + "learning_rate": 0.000114530979612635, + "loss": 0.0075, + "step": 245080 + }, + { + "epoch": 1.24, + "learning_rate": 0.000114523411919621, + "loss": 0.0091, + "step": 245090 + }, + { + "epoch": 1.24, + "learning_rate": 0.000114515844226607, + "loss": 0.011, + "step": 245100 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011450827653359298, + "loss": 0.008, + "step": 245110 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011450070884057897, + "loss": 0.0092, + "step": 245120 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011449314114756497, + "loss": 0.0094, + "step": 245130 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011448557345455095, + "loss": 0.0102, + "step": 245140 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011447800576153694, + "loss": 0.0085, + "step": 245150 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011447043806852292, + "loss": 0.0099, + "step": 245160 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011446287037550892, + "loss": 0.0073, + "step": 245170 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011445530268249491, + "loss": 0.0094, + "step": 245180 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001144477349894809, + "loss": 0.0084, + "step": 245190 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011444016729646689, + "loss": 0.0087, + "step": 245200 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011443259960345289, + "loss": 0.0093, + "step": 245210 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011442503191043887, + "loss": 0.0103, + "step": 245220 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011441746421742486, + "loss": 0.0085, + "step": 245230 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011440989652441084, + "loss": 0.0087, + "step": 245240 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011440232883139684, + "loss": 0.0089, + "step": 245250 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011439476113838283, + "loss": 0.0092, + "step": 245260 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011438719344536881, + "loss": 0.0082, + "step": 245270 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011437962575235481, + "loss": 0.0095, + "step": 245280 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001143720580593408, + "loss": 0.0092, + "step": 245290 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011436449036632679, + "loss": 0.0118, + "step": 245300 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011435692267331278, + "loss": 0.0076, + "step": 245310 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011434935498029876, + "loss": 0.0085, + "step": 245320 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011434178728728476, + "loss": 0.0175, + "step": 245330 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011433421959427075, + "loss": 0.0096, + "step": 245340 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011432665190125673, + "loss": 0.009, + "step": 245350 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011431908420824273, + "loss": 0.0069, + "step": 245360 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011431151651522872, + "loss": 0.0088, + "step": 245370 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001143039488222147, + "loss": 0.0099, + "step": 245380 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001142963811292007, + "loss": 0.0097, + "step": 245390 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011428881343618668, + "loss": 0.007, + "step": 245400 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011428124574317266, + "loss": 0.0089, + "step": 245410 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011427367805015864, + "loss": 0.0078, + "step": 245420 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011426611035714464, + "loss": 0.0098, + "step": 245430 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011425854266413063, + "loss": 0.0104, + "step": 245440 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011425097497111662, + "loss": 0.008, + "step": 245450 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011424340727810261, + "loss": 0.0094, + "step": 245460 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001142358395850886, + "loss": 0.0083, + "step": 245470 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011422827189207459, + "loss": 0.0099, + "step": 245480 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011422070419906058, + "loss": 0.0099, + "step": 245490 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011421313650604658, + "loss": 0.0114, + "step": 245500 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011420556881303256, + "loss": 0.0087, + "step": 245510 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011419800112001855, + "loss": 0.0078, + "step": 245520 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011419043342700454, + "loss": 0.0087, + "step": 245530 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011418286573399053, + "loss": 0.0088, + "step": 245540 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011417529804097653, + "loss": 0.0097, + "step": 245550 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011416773034796251, + "loss": 0.0084, + "step": 245560 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001141601626549485, + "loss": 0.009, + "step": 245570 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001141525949619345, + "loss": 0.009, + "step": 245580 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011414502726892048, + "loss": 0.0068, + "step": 245590 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011413745957590647, + "loss": 0.0081, + "step": 245600 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011412989188289245, + "loss": 0.0078, + "step": 245610 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011412232418987845, + "loss": 0.0099, + "step": 245620 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011411475649686444, + "loss": 0.0121, + "step": 245630 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011410718880385043, + "loss": 0.0116, + "step": 245640 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011409962111083642, + "loss": 0.0088, + "step": 245650 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011409205341782242, + "loss": 0.0087, + "step": 245660 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001140844857248084, + "loss": 0.0069, + "step": 245670 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011407691803179439, + "loss": 0.0077, + "step": 245680 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011406935033878037, + "loss": 0.0086, + "step": 245690 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011406178264576637, + "loss": 0.008, + "step": 245700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011405421495275236, + "loss": 0.0081, + "step": 245710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011404664725973835, + "loss": 0.0077, + "step": 245720 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011403907956672434, + "loss": 0.0108, + "step": 245730 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011403151187371034, + "loss": 0.0085, + "step": 245740 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011402394418069632, + "loss": 0.0094, + "step": 245750 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011401637648768231, + "loss": 0.0082, + "step": 245760 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001140088087946683, + "loss": 0.0068, + "step": 245770 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011400124110165429, + "loss": 0.0072, + "step": 245780 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011399367340864028, + "loss": 0.008, + "step": 245790 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011398610571562626, + "loss": 0.0109, + "step": 245800 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011397853802261226, + "loss": 0.0073, + "step": 245810 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011397097032959825, + "loss": 0.0092, + "step": 245820 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011396340263658424, + "loss": 0.0086, + "step": 245830 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011395583494357023, + "loss": 0.0068, + "step": 245840 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011394826725055621, + "loss": 0.0118, + "step": 245850 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011394069955754221, + "loss": 0.0098, + "step": 245860 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001139331318645282, + "loss": 0.0093, + "step": 245870 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011392556417151418, + "loss": 0.0087, + "step": 245880 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011391799647850018, + "loss": 0.0084, + "step": 245890 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011391042878548617, + "loss": 0.0091, + "step": 245900 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011390286109247216, + "loss": 0.0074, + "step": 245910 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011389529339945815, + "loss": 0.0078, + "step": 245920 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011388772570644413, + "loss": 0.0077, + "step": 245930 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011388015801343013, + "loss": 0.0085, + "step": 245940 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011387259032041612, + "loss": 0.0089, + "step": 245950 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001138650226274021, + "loss": 0.0082, + "step": 245960 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001138574549343881, + "loss": 0.0077, + "step": 245970 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001138498872413741, + "loss": 0.0091, + "step": 245980 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011384231954836007, + "loss": 0.0083, + "step": 245990 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011383475185534607, + "loss": 0.0084, + "step": 246000 + }, + { + "epoch": 1.24, + "eval_cer": 0.9144343512465224, + "eval_loss": 0.006622600369155407, + "eval_runtime": 115.7041, + "eval_samples_per_second": 17.285, + "eval_steps_per_second": 4.321, + "step": 246000 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011382718416233205, + "loss": 0.0117, + "step": 246010 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011381961646931805, + "loss": 0.011, + "step": 246020 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011381204877630404, + "loss": 0.009, + "step": 246030 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011380448108329001, + "loss": 0.009, + "step": 246040 + }, + { + "epoch": 1.24, + "learning_rate": 0.000113796913390276, + "loss": 0.0117, + "step": 246050 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011378934569726199, + "loss": 0.0121, + "step": 246060 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011378177800424798, + "loss": 0.0087, + "step": 246070 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011377421031123398, + "loss": 0.0069, + "step": 246080 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011376664261821996, + "loss": 0.0072, + "step": 246090 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011375907492520595, + "loss": 0.009, + "step": 246100 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011375150723219195, + "loss": 0.0082, + "step": 246110 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011374393953917793, + "loss": 0.0083, + "step": 246120 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011373637184616392, + "loss": 0.0108, + "step": 246130 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001137288041531499, + "loss": 0.0092, + "step": 246140 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001137212364601359, + "loss": 0.0074, + "step": 246150 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001137136687671219, + "loss": 0.0091, + "step": 246160 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011370610107410788, + "loss": 0.0083, + "step": 246170 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011369853338109387, + "loss": 0.0102, + "step": 246180 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011369096568807987, + "loss": 0.0095, + "step": 246190 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011368339799506585, + "loss": 0.0086, + "step": 246200 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011367583030205184, + "loss": 0.0094, + "step": 246210 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011366826260903782, + "loss": 0.0091, + "step": 246220 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011366069491602382, + "loss": 0.0078, + "step": 246230 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011365312722300981, + "loss": 0.0105, + "step": 246240 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001136455595299958, + "loss": 0.0097, + "step": 246250 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011363799183698179, + "loss": 0.0107, + "step": 246260 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011363042414396779, + "loss": 0.0089, + "step": 246270 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011362285645095377, + "loss": 0.0098, + "step": 246280 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011361528875793976, + "loss": 0.012, + "step": 246290 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011360772106492574, + "loss": 0.0097, + "step": 246300 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011360015337191174, + "loss": 0.0083, + "step": 246310 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011359258567889773, + "loss": 0.0079, + "step": 246320 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011358501798588371, + "loss": 0.0103, + "step": 246330 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011357745029286971, + "loss": 0.0075, + "step": 246340 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001135698825998557, + "loss": 0.007, + "step": 246350 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011356231490684169, + "loss": 0.0092, + "step": 246360 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011355474721382768, + "loss": 0.01, + "step": 246370 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011354717952081366, + "loss": 0.0113, + "step": 246380 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011353961182779966, + "loss": 0.0075, + "step": 246390 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011353204413478565, + "loss": 0.0083, + "step": 246400 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011352447644177163, + "loss": 0.0071, + "step": 246410 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011351690874875763, + "loss": 0.0095, + "step": 246420 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011350934105574362, + "loss": 0.0113, + "step": 246430 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001135017733627296, + "loss": 0.0079, + "step": 246440 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001134942056697156, + "loss": 0.01, + "step": 246450 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011348663797670158, + "loss": 0.0087, + "step": 246460 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011347907028368758, + "loss": 0.0081, + "step": 246470 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011347150259067357, + "loss": 0.0097, + "step": 246480 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011346393489765955, + "loss": 0.0094, + "step": 246490 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011345636720464555, + "loss": 0.0087, + "step": 246500 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011344879951163154, + "loss": 0.0078, + "step": 246510 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011344123181861753, + "loss": 0.0095, + "step": 246520 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011343366412560352, + "loss": 0.0107, + "step": 246530 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011342609643258952, + "loss": 0.0082, + "step": 246540 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001134185287395755, + "loss": 0.0086, + "step": 246550 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011341096104656149, + "loss": 0.0064, + "step": 246560 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011340339335354747, + "loss": 0.0116, + "step": 246570 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011339582566053347, + "loss": 0.0077, + "step": 246580 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011338825796751946, + "loss": 0.0114, + "step": 246590 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011338069027450544, + "loss": 0.0078, + "step": 246600 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011337312258149144, + "loss": 0.0086, + "step": 246610 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011336555488847743, + "loss": 0.0109, + "step": 246620 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011335798719546342, + "loss": 0.0097, + "step": 246630 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011335041950244941, + "loss": 0.0087, + "step": 246640 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011334285180943539, + "loss": 0.0085, + "step": 246650 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011333528411642139, + "loss": 0.0071, + "step": 246660 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011332771642340736, + "loss": 0.0083, + "step": 246670 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011332014873039335, + "loss": 0.0093, + "step": 246680 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011331258103737935, + "loss": 0.0078, + "step": 246690 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011330501334436533, + "loss": 0.0088, + "step": 246700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011329744565135132, + "loss": 0.0079, + "step": 246710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011328987795833732, + "loss": 0.0111, + "step": 246720 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001132823102653233, + "loss": 0.0111, + "step": 246730 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011327474257230929, + "loss": 0.0091, + "step": 246740 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011326717487929527, + "loss": 0.0078, + "step": 246750 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011325960718628127, + "loss": 0.0083, + "step": 246760 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011325203949326726, + "loss": 0.0069, + "step": 246770 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011324447180025325, + "loss": 0.0077, + "step": 246780 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011323690410723924, + "loss": 0.0096, + "step": 246790 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011322933641422524, + "loss": 0.0079, + "step": 246800 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011322176872121122, + "loss": 0.0104, + "step": 246810 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011321420102819721, + "loss": 0.0072, + "step": 246820 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001132066333351832, + "loss": 0.0076, + "step": 246830 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011319906564216919, + "loss": 0.0087, + "step": 246840 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011319149794915518, + "loss": 0.0078, + "step": 246850 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011318393025614117, + "loss": 0.0085, + "step": 246860 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011317636256312716, + "loss": 0.008, + "step": 246870 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011316879487011316, + "loss": 0.0088, + "step": 246880 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011316122717709914, + "loss": 0.0074, + "step": 246890 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011315365948408513, + "loss": 0.0087, + "step": 246900 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011314609179107111, + "loss": 0.0078, + "step": 246910 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011313852409805711, + "loss": 0.0114, + "step": 246920 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001131309564050431, + "loss": 0.0079, + "step": 246930 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011312338871202908, + "loss": 0.0084, + "step": 246940 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011311582101901508, + "loss": 0.0083, + "step": 246950 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011310825332600107, + "loss": 0.0092, + "step": 246960 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011310068563298706, + "loss": 0.0094, + "step": 246970 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011309311793997305, + "loss": 0.0071, + "step": 246980 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011308555024695905, + "loss": 0.0085, + "step": 246990 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011307798255394503, + "loss": 0.0074, + "step": 247000 + }, + { + "epoch": 1.25, + "eval_cer": 0.914457640753532, + "eval_loss": 0.0065944562666118145, + "eval_runtime": 115.9058, + "eval_samples_per_second": 17.255, + "eval_steps_per_second": 4.314, + "step": 247000 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011307041486093102, + "loss": 0.0071, + "step": 247010 + }, + { + "epoch": 1.25, + "learning_rate": 0.000113062847167917, + "loss": 0.0072, + "step": 247020 + }, + { + "epoch": 1.25, + "learning_rate": 0.000113055279474903, + "loss": 0.0116, + "step": 247030 + }, + { + "epoch": 1.25, + "learning_rate": 0.000113047711781889, + "loss": 0.0117, + "step": 247040 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011304014408887498, + "loss": 0.0084, + "step": 247050 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011303257639586097, + "loss": 0.0063, + "step": 247060 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011302500870284697, + "loss": 0.0082, + "step": 247070 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011301744100983295, + "loss": 0.0065, + "step": 247080 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011300987331681894, + "loss": 0.0079, + "step": 247090 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011300230562380492, + "loss": 0.0095, + "step": 247100 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011299473793079092, + "loss": 0.0101, + "step": 247110 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011298717023777691, + "loss": 0.0083, + "step": 247120 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001129796025447629, + "loss": 0.0125, + "step": 247130 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011297203485174889, + "loss": 0.0077, + "step": 247140 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011296446715873488, + "loss": 0.013, + "step": 247150 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011295689946572087, + "loss": 0.0101, + "step": 247160 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011294933177270686, + "loss": 0.0075, + "step": 247170 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011294176407969284, + "loss": 0.0093, + "step": 247180 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011293419638667884, + "loss": 0.0076, + "step": 247190 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011292662869366483, + "loss": 0.0078, + "step": 247200 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011291906100065081, + "loss": 0.0093, + "step": 247210 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011291149330763681, + "loss": 0.0114, + "step": 247220 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001129039256146228, + "loss": 0.0104, + "step": 247230 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011289635792160879, + "loss": 0.0094, + "step": 247240 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011288879022859478, + "loss": 0.0088, + "step": 247250 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011288122253558076, + "loss": 0.0096, + "step": 247260 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011287365484256676, + "loss": 0.0067, + "step": 247270 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011286608714955275, + "loss": 0.0094, + "step": 247280 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011285851945653873, + "loss": 0.0072, + "step": 247290 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011285095176352471, + "loss": 0.0096, + "step": 247300 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001128433840705107, + "loss": 0.0096, + "step": 247310 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011283581637749669, + "loss": 0.0072, + "step": 247320 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011282824868448269, + "loss": 0.0112, + "step": 247330 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011282068099146867, + "loss": 0.0096, + "step": 247340 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011281311329845466, + "loss": 0.0078, + "step": 247350 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011280554560544064, + "loss": 0.0086, + "step": 247360 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011279797791242664, + "loss": 0.007, + "step": 247370 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011279041021941263, + "loss": 0.0093, + "step": 247380 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011278284252639862, + "loss": 0.0105, + "step": 247390 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011277527483338461, + "loss": 0.0089, + "step": 247400 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001127677071403706, + "loss": 0.0075, + "step": 247410 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011276013944735659, + "loss": 0.0084, + "step": 247420 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011275257175434258, + "loss": 0.0072, + "step": 247430 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011274500406132858, + "loss": 0.0094, + "step": 247440 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011273743636831456, + "loss": 0.0073, + "step": 247450 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011272986867530055, + "loss": 0.0092, + "step": 247460 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011272230098228653, + "loss": 0.0097, + "step": 247470 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011271473328927253, + "loss": 0.0089, + "step": 247480 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011270716559625852, + "loss": 0.0069, + "step": 247490 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001126995979032445, + "loss": 0.0071, + "step": 247500 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001126920302102305, + "loss": 0.0077, + "step": 247510 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001126844625172165, + "loss": 0.0071, + "step": 247520 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011267689482420248, + "loss": 0.013, + "step": 247530 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011266932713118847, + "loss": 0.008, + "step": 247540 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011266175943817445, + "loss": 0.0083, + "step": 247550 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011265419174516045, + "loss": 0.009, + "step": 247560 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011264662405214644, + "loss": 0.007, + "step": 247570 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011263905635913243, + "loss": 0.0116, + "step": 247580 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011263148866611842, + "loss": 0.0071, + "step": 247590 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011262392097310442, + "loss": 0.0104, + "step": 247600 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001126163532800904, + "loss": 0.0109, + "step": 247610 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011260878558707639, + "loss": 0.0094, + "step": 247620 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011260121789406237, + "loss": 0.0095, + "step": 247630 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011259365020104837, + "loss": 0.0079, + "step": 247640 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011258608250803436, + "loss": 0.0097, + "step": 247650 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011257851481502034, + "loss": 0.0113, + "step": 247660 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011257094712200634, + "loss": 0.0082, + "step": 247670 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011256337942899233, + "loss": 0.0112, + "step": 247680 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011255581173597832, + "loss": 0.0082, + "step": 247690 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011254824404296431, + "loss": 0.0065, + "step": 247700 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011254067634995029, + "loss": 0.0094, + "step": 247710 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011253310865693629, + "loss": 0.0067, + "step": 247720 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011252554096392228, + "loss": 0.0091, + "step": 247730 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011251797327090826, + "loss": 0.0085, + "step": 247740 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011251040557789426, + "loss": 0.007, + "step": 247750 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011250283788488025, + "loss": 0.009, + "step": 247760 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011249527019186624, + "loss": 0.008, + "step": 247770 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011248770249885223, + "loss": 0.0084, + "step": 247780 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011248013480583821, + "loss": 0.0093, + "step": 247790 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001124725671128242, + "loss": 0.0076, + "step": 247800 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001124649994198102, + "loss": 0.009, + "step": 247810 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011245743172679618, + "loss": 0.0098, + "step": 247820 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011244986403378218, + "loss": 0.0107, + "step": 247830 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011244229634076817, + "loss": 0.009, + "step": 247840 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011243472864775415, + "loss": 0.0113, + "step": 247850 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011242716095474015, + "loss": 0.0066, + "step": 247860 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011241959326172613, + "loss": 0.0096, + "step": 247870 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011241202556871213, + "loss": 0.0104, + "step": 247880 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011240445787569812, + "loss": 0.0082, + "step": 247890 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001123968901826841, + "loss": 0.0103, + "step": 247900 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001123893224896701, + "loss": 0.0089, + "step": 247910 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011238175479665609, + "loss": 0.0091, + "step": 247920 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011237418710364206, + "loss": 0.007, + "step": 247930 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011236661941062806, + "loss": 0.0096, + "step": 247940 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011235905171761404, + "loss": 0.0075, + "step": 247950 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011235148402460003, + "loss": 0.0092, + "step": 247960 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011234391633158603, + "loss": 0.0093, + "step": 247970 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011233634863857201, + "loss": 0.0112, + "step": 247980 + }, + { + "epoch": 1.25, + "learning_rate": 0.000112328780945558, + "loss": 0.0092, + "step": 247990 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011232121325254398, + "loss": 0.0083, + "step": 248000 + }, + { + "epoch": 1.25, + "eval_cer": 0.914462492734159, + "eval_loss": 0.006537660490721464, + "eval_runtime": 115.8787, + "eval_samples_per_second": 17.259, + "eval_steps_per_second": 4.315, + "step": 248000 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011231364555952998, + "loss": 0.0089, + "step": 248010 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011230607786651597, + "loss": 0.01, + "step": 248020 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011229851017350196, + "loss": 0.01, + "step": 248030 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011229094248048795, + "loss": 0.0116, + "step": 248040 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011228337478747395, + "loss": 0.0099, + "step": 248050 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011227580709445993, + "loss": 0.0073, + "step": 248060 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011226823940144592, + "loss": 0.0092, + "step": 248070 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001122606717084319, + "loss": 0.0095, + "step": 248080 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001122531040154179, + "loss": 0.0082, + "step": 248090 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001122455363224039, + "loss": 0.0089, + "step": 248100 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011223796862938988, + "loss": 0.0087, + "step": 248110 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011223040093637587, + "loss": 0.0082, + "step": 248120 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011222283324336187, + "loss": 0.0067, + "step": 248130 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011221526555034785, + "loss": 0.0081, + "step": 248140 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011220769785733384, + "loss": 0.0053, + "step": 248150 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011220013016431982, + "loss": 0.0078, + "step": 248160 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011219256247130582, + "loss": 0.0096, + "step": 248170 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011218499477829181, + "loss": 0.0102, + "step": 248180 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001121774270852778, + "loss": 0.007, + "step": 248190 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011216985939226379, + "loss": 0.0075, + "step": 248200 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011216229169924978, + "loss": 0.0106, + "step": 248210 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011215472400623577, + "loss": 0.0094, + "step": 248220 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011214715631322176, + "loss": 0.0096, + "step": 248230 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011213958862020774, + "loss": 0.0081, + "step": 248240 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011213202092719374, + "loss": 0.0086, + "step": 248250 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011212445323417973, + "loss": 0.0088, + "step": 248260 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011211688554116571, + "loss": 0.0069, + "step": 248270 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011210931784815171, + "loss": 0.0086, + "step": 248280 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001121017501551377, + "loss": 0.0112, + "step": 248290 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011209418246212369, + "loss": 0.0103, + "step": 248300 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011208661476910968, + "loss": 0.0074, + "step": 248310 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011207904707609566, + "loss": 0.0073, + "step": 248320 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011207147938308166, + "loss": 0.0095, + "step": 248330 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011206391169006765, + "loss": 0.009, + "step": 248340 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011205634399705363, + "loss": 0.0157, + "step": 248350 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011204877630403963, + "loss": 0.0075, + "step": 248360 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011204120861102562, + "loss": 0.0073, + "step": 248370 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001120336409180116, + "loss": 0.0082, + "step": 248380 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001120260732249976, + "loss": 0.0088, + "step": 248390 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011201850553198358, + "loss": 0.0128, + "step": 248400 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011201093783896958, + "loss": 0.0089, + "step": 248410 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011200337014595557, + "loss": 0.0084, + "step": 248420 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011199580245294155, + "loss": 0.0087, + "step": 248430 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011198823475992755, + "loss": 0.0077, + "step": 248440 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011198066706691354, + "loss": 0.0079, + "step": 248450 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011197309937389952, + "loss": 0.0082, + "step": 248460 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011196553168088552, + "loss": 0.01, + "step": 248470 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011195796398787151, + "loss": 0.007, + "step": 248480 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001119503962948575, + "loss": 0.009, + "step": 248490 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011194282860184349, + "loss": 0.0088, + "step": 248500 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011193526090882947, + "loss": 0.0075, + "step": 248510 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011192769321581547, + "loss": 0.0085, + "step": 248520 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011192012552280146, + "loss": 0.0073, + "step": 248530 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011191255782978744, + "loss": 0.0085, + "step": 248540 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011190499013677342, + "loss": 0.0078, + "step": 248550 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001118974224437594, + "loss": 0.0087, + "step": 248560 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001118898547507454, + "loss": 0.0085, + "step": 248570 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001118822870577314, + "loss": 0.0071, + "step": 248580 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011187471936471738, + "loss": 0.0055, + "step": 248590 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011186715167170337, + "loss": 0.0078, + "step": 248600 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011185958397868935, + "loss": 0.0079, + "step": 248610 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011185201628567535, + "loss": 0.0065, + "step": 248620 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011184444859266134, + "loss": 0.0103, + "step": 248630 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011183688089964733, + "loss": 0.0068, + "step": 248640 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011182931320663332, + "loss": 0.0089, + "step": 248650 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011182174551361932, + "loss": 0.0082, + "step": 248660 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001118141778206053, + "loss": 0.0066, + "step": 248670 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011180661012759129, + "loss": 0.0079, + "step": 248680 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011179904243457727, + "loss": 0.0108, + "step": 248690 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011179147474156327, + "loss": 0.0074, + "step": 248700 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011178390704854926, + "loss": 0.0099, + "step": 248710 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011177633935553524, + "loss": 0.0077, + "step": 248720 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011176877166252124, + "loss": 0.0081, + "step": 248730 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011176120396950723, + "loss": 0.0074, + "step": 248740 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011175363627649322, + "loss": 0.0082, + "step": 248750 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011174606858347921, + "loss": 0.0082, + "step": 248760 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011173850089046519, + "loss": 0.0071, + "step": 248770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011173093319745119, + "loss": 0.0117, + "step": 248780 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011172336550443718, + "loss": 0.0085, + "step": 248790 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011171579781142316, + "loss": 0.0081, + "step": 248800 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011170823011840916, + "loss": 0.011, + "step": 248810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011170066242539515, + "loss": 0.0055, + "step": 248820 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011169309473238114, + "loss": 0.014, + "step": 248830 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011168552703936713, + "loss": 0.0116, + "step": 248840 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011167795934635311, + "loss": 0.0121, + "step": 248850 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011167039165333911, + "loss": 0.0106, + "step": 248860 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001116628239603251, + "loss": 0.0061, + "step": 248870 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011165525626731108, + "loss": 0.008, + "step": 248880 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011164768857429708, + "loss": 0.009, + "step": 248890 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011164012088128307, + "loss": 0.0073, + "step": 248900 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011163255318826905, + "loss": 0.0091, + "step": 248910 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011162498549525505, + "loss": 0.0079, + "step": 248920 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011161741780224104, + "loss": 0.0079, + "step": 248930 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011160985010922703, + "loss": 0.0073, + "step": 248940 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011160228241621302, + "loss": 0.0081, + "step": 248950 + }, + { + "epoch": 1.26, + "learning_rate": 0.000111594714723199, + "loss": 0.0071, + "step": 248960 + }, + { + "epoch": 1.26, + "learning_rate": 0.000111587147030185, + "loss": 0.0081, + "step": 248970 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011157957933717099, + "loss": 0.0072, + "step": 248980 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011157201164415697, + "loss": 0.0082, + "step": 248990 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011156444395114297, + "loss": 0.0098, + "step": 249000 + }, + { + "epoch": 1.26, + "eval_cer": 0.9144459960000272, + "eval_loss": 0.0065380726009607315, + "eval_runtime": 116.0227, + "eval_samples_per_second": 17.238, + "eval_steps_per_second": 4.31, + "step": 249000 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011155687625812896, + "loss": 0.0078, + "step": 249010 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011154930856511495, + "loss": 0.0102, + "step": 249020 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011154174087210094, + "loss": 0.0087, + "step": 249030 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011153417317908692, + "loss": 0.0088, + "step": 249040 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011152660548607292, + "loss": 0.0087, + "step": 249050 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011151903779305891, + "loss": 0.0083, + "step": 249060 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001115114701000449, + "loss": 0.0094, + "step": 249070 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011150390240703089, + "loss": 0.0092, + "step": 249080 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011149633471401688, + "loss": 0.0103, + "step": 249090 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011148876702100286, + "loss": 0.0098, + "step": 249100 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011148119932798886, + "loss": 0.0088, + "step": 249110 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011147363163497484, + "loss": 0.0103, + "step": 249120 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011146606394196084, + "loss": 0.0086, + "step": 249130 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011145849624894683, + "loss": 0.0074, + "step": 249140 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011145092855593281, + "loss": 0.0073, + "step": 249150 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011144336086291881, + "loss": 0.0089, + "step": 249160 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001114357931699048, + "loss": 0.0086, + "step": 249170 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011142822547689077, + "loss": 0.0079, + "step": 249180 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011142065778387677, + "loss": 0.0073, + "step": 249190 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011141309009086275, + "loss": 0.01, + "step": 249200 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011140552239784874, + "loss": 0.0088, + "step": 249210 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011139795470483472, + "loss": 0.0086, + "step": 249220 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011139038701182072, + "loss": 0.0081, + "step": 249230 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011138281931880671, + "loss": 0.0085, + "step": 249240 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001113752516257927, + "loss": 0.0093, + "step": 249250 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011136768393277869, + "loss": 0.0072, + "step": 249260 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011136011623976468, + "loss": 0.0131, + "step": 249270 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011135254854675067, + "loss": 0.0073, + "step": 249280 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011134498085373666, + "loss": 0.0081, + "step": 249290 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011133741316072264, + "loss": 0.008, + "step": 249300 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011132984546770864, + "loss": 0.0079, + "step": 249310 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011132227777469463, + "loss": 0.0091, + "step": 249320 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011131471008168061, + "loss": 0.0098, + "step": 249330 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011130714238866661, + "loss": 0.0087, + "step": 249340 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001112995746956526, + "loss": 0.0099, + "step": 249350 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011129200700263859, + "loss": 0.0089, + "step": 249360 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011128443930962458, + "loss": 0.009, + "step": 249370 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011127687161661056, + "loss": 0.0063, + "step": 249380 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011126930392359656, + "loss": 0.0089, + "step": 249390 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011126173623058255, + "loss": 0.0098, + "step": 249400 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011125416853756853, + "loss": 0.0076, + "step": 249410 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011124660084455453, + "loss": 0.01, + "step": 249420 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011123903315154052, + "loss": 0.0076, + "step": 249430 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001112314654585265, + "loss": 0.0069, + "step": 249440 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001112238977655125, + "loss": 0.0082, + "step": 249450 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001112163300724985, + "loss": 0.0091, + "step": 249460 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011120876237948448, + "loss": 0.0102, + "step": 249470 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011120119468647047, + "loss": 0.0084, + "step": 249480 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011119362699345645, + "loss": 0.0075, + "step": 249490 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011118605930044245, + "loss": 0.0081, + "step": 249500 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011117849160742844, + "loss": 0.0085, + "step": 249510 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011117092391441442, + "loss": 0.0091, + "step": 249520 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011116335622140042, + "loss": 0.0071, + "step": 249530 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011115578852838641, + "loss": 0.0082, + "step": 249540 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001111482208353724, + "loss": 0.0078, + "step": 249550 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011114065314235839, + "loss": 0.011, + "step": 249560 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011113308544934437, + "loss": 0.0076, + "step": 249570 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011112551775633037, + "loss": 0.0072, + "step": 249580 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011111795006331636, + "loss": 0.0099, + "step": 249590 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011111038237030234, + "loss": 0.0096, + "step": 249600 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011110281467728834, + "loss": 0.0088, + "step": 249610 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011109524698427433, + "loss": 0.0079, + "step": 249620 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011108767929126032, + "loss": 0.0093, + "step": 249630 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011108011159824631, + "loss": 0.0095, + "step": 249640 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011107254390523229, + "loss": 0.0076, + "step": 249650 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011106497621221829, + "loss": 0.0132, + "step": 249660 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011105740851920428, + "loss": 0.011, + "step": 249670 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011104984082619026, + "loss": 0.0128, + "step": 249680 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011104227313317626, + "loss": 0.0088, + "step": 249690 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011103470544016225, + "loss": 0.0089, + "step": 249700 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011102713774714823, + "loss": 0.0087, + "step": 249710 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011101957005413423, + "loss": 0.0105, + "step": 249720 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011101200236112021, + "loss": 0.0078, + "step": 249730 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001110044346681062, + "loss": 0.01, + "step": 249740 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001109968669750922, + "loss": 0.0086, + "step": 249750 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011098929928207818, + "loss": 0.0102, + "step": 249760 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011098173158906418, + "loss": 0.0095, + "step": 249770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011097416389605017, + "loss": 0.0066, + "step": 249780 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011096659620303615, + "loss": 0.0099, + "step": 249790 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011095902851002215, + "loss": 0.0086, + "step": 249800 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011095146081700812, + "loss": 0.0089, + "step": 249810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011094389312399411, + "loss": 0.0072, + "step": 249820 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011093632543098009, + "loss": 0.0065, + "step": 249830 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011092875773796609, + "loss": 0.0085, + "step": 249840 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011092119004495208, + "loss": 0.0074, + "step": 249850 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011091362235193806, + "loss": 0.0085, + "step": 249860 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011090605465892406, + "loss": 0.0113, + "step": 249870 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011089848696591005, + "loss": 0.0093, + "step": 249880 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011089091927289604, + "loss": 0.0078, + "step": 249890 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011088335157988203, + "loss": 0.0072, + "step": 249900 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011087578388686803, + "loss": 0.0131, + "step": 249910 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011086821619385401, + "loss": 0.0095, + "step": 249920 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011086064850084, + "loss": 0.009, + "step": 249930 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011085308080782598, + "loss": 0.008, + "step": 249940 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011084551311481198, + "loss": 0.0107, + "step": 249950 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011083794542179797, + "loss": 0.0086, + "step": 249960 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011083037772878396, + "loss": 0.0092, + "step": 249970 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011082281003576995, + "loss": 0.0072, + "step": 249980 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011081524234275595, + "loss": 0.0098, + "step": 249990 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011080767464974193, + "loss": 0.0082, + "step": 250000 + }, + { + "epoch": 1.26, + "eval_cer": 0.9144537591690304, + "eval_loss": 0.0067350054159760475, + "eval_runtime": 115.9925, + "eval_samples_per_second": 17.243, + "eval_steps_per_second": 4.311, + "step": 250000 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011080010695672792, + "loss": 0.0085, + "step": 250010 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001107925392637139, + "loss": 0.0154, + "step": 250020 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001107849715706999, + "loss": 0.0071, + "step": 250030 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011077740387768589, + "loss": 0.0072, + "step": 250040 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011076983618467187, + "loss": 0.0067, + "step": 250050 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011076226849165787, + "loss": 0.0066, + "step": 250060 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011075470079864386, + "loss": 0.0121, + "step": 250070 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011074713310562985, + "loss": 0.0063, + "step": 250080 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011073956541261584, + "loss": 0.0088, + "step": 250090 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011073199771960182, + "loss": 0.0071, + "step": 250100 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011072443002658782, + "loss": 0.0084, + "step": 250110 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011071686233357381, + "loss": 0.0107, + "step": 250120 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001107092946405598, + "loss": 0.0104, + "step": 250130 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011070172694754579, + "loss": 0.008, + "step": 250140 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011069415925453178, + "loss": 0.0079, + "step": 250150 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011068659156151777, + "loss": 0.0079, + "step": 250160 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011067902386850376, + "loss": 0.007, + "step": 250170 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011067145617548974, + "loss": 0.0088, + "step": 250180 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011066388848247574, + "loss": 0.0085, + "step": 250190 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011065632078946173, + "loss": 0.0106, + "step": 250200 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011064875309644771, + "loss": 0.0085, + "step": 250210 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011064118540343371, + "loss": 0.0104, + "step": 250220 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001106336177104197, + "loss": 0.007, + "step": 250230 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011062605001740568, + "loss": 0.0087, + "step": 250240 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011061848232439168, + "loss": 0.0104, + "step": 250250 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011061091463137766, + "loss": 0.0107, + "step": 250260 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011060334693836366, + "loss": 0.0108, + "step": 250270 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011059577924534965, + "loss": 0.0069, + "step": 250280 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011058821155233563, + "loss": 0.0086, + "step": 250290 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011058064385932163, + "loss": 0.0125, + "step": 250300 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011057307616630762, + "loss": 0.006, + "step": 250310 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001105655084732936, + "loss": 0.0094, + "step": 250320 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001105579407802796, + "loss": 0.0072, + "step": 250330 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011055037308726558, + "loss": 0.0094, + "step": 250340 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011054280539425158, + "loss": 0.0074, + "step": 250350 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011053523770123757, + "loss": 0.0099, + "step": 250360 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011052767000822355, + "loss": 0.0101, + "step": 250370 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011052010231520955, + "loss": 0.0101, + "step": 250380 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011051253462219554, + "loss": 0.0078, + "step": 250390 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011050496692918152, + "loss": 0.013, + "step": 250400 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011049739923616752, + "loss": 0.0104, + "step": 250410 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011048983154315351, + "loss": 0.0068, + "step": 250420 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001104822638501395, + "loss": 0.0083, + "step": 250430 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011047469615712548, + "loss": 0.009, + "step": 250440 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011046712846411146, + "loss": 0.0075, + "step": 250450 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011045956077109745, + "loss": 0.0087, + "step": 250460 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011045199307808343, + "loss": 0.0065, + "step": 250470 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011044442538506943, + "loss": 0.0091, + "step": 250480 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011043685769205542, + "loss": 0.0077, + "step": 250490 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001104292899990414, + "loss": 0.0068, + "step": 250500 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001104217223060274, + "loss": 0.0067, + "step": 250510 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001104141546130134, + "loss": 0.0116, + "step": 250520 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011040658691999938, + "loss": 0.0096, + "step": 250530 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011039901922698537, + "loss": 0.0068, + "step": 250540 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011039145153397135, + "loss": 0.0066, + "step": 250550 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011038388384095735, + "loss": 0.0085, + "step": 250560 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011037631614794334, + "loss": 0.0078, + "step": 250570 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011036874845492932, + "loss": 0.0086, + "step": 250580 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011036118076191532, + "loss": 0.0092, + "step": 250590 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011035361306890131, + "loss": 0.0072, + "step": 250600 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001103460453758873, + "loss": 0.0147, + "step": 250610 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011033847768287329, + "loss": 0.0101, + "step": 250620 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011033090998985927, + "loss": 0.0103, + "step": 250630 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011032334229684527, + "loss": 0.0112, + "step": 250640 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011031577460383126, + "loss": 0.007, + "step": 250650 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011030820691081724, + "loss": 0.009, + "step": 250660 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011030063921780324, + "loss": 0.0072, + "step": 250670 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011029307152478923, + "loss": 0.0099, + "step": 250680 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011028550383177522, + "loss": 0.0082, + "step": 250690 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011027793613876121, + "loss": 0.0091, + "step": 250700 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011027036844574719, + "loss": 0.0071, + "step": 250710 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011026280075273319, + "loss": 0.0089, + "step": 250720 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011025523305971918, + "loss": 0.0071, + "step": 250730 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011024766536670516, + "loss": 0.0068, + "step": 250740 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011024009767369116, + "loss": 0.0087, + "step": 250750 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011023252998067715, + "loss": 0.0115, + "step": 250760 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011022496228766313, + "loss": 0.0079, + "step": 250770 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011021739459464913, + "loss": 0.013, + "step": 250780 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011020982690163511, + "loss": 0.0095, + "step": 250790 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001102022592086211, + "loss": 0.0059, + "step": 250800 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001101946915156071, + "loss": 0.0074, + "step": 250810 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011018712382259308, + "loss": 0.0091, + "step": 250820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011017955612957908, + "loss": 0.0113, + "step": 250830 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011017198843656507, + "loss": 0.0089, + "step": 250840 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011016442074355105, + "loss": 0.0103, + "step": 250850 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011015685305053705, + "loss": 0.0079, + "step": 250860 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011014928535752304, + "loss": 0.0082, + "step": 250870 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011014171766450903, + "loss": 0.0073, + "step": 250880 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011013414997149502, + "loss": 0.0103, + "step": 250890 + }, + { + "epoch": 1.27, + "learning_rate": 0.000110126582278481, + "loss": 0.0083, + "step": 250900 + }, + { + "epoch": 1.27, + "learning_rate": 0.000110119014585467, + "loss": 0.009, + "step": 250910 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011011144689245299, + "loss": 0.0092, + "step": 250920 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011010387919943897, + "loss": 0.0134, + "step": 250930 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011009631150642497, + "loss": 0.008, + "step": 250940 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011008874381341096, + "loss": 0.0071, + "step": 250950 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011008117612039694, + "loss": 0.0106, + "step": 250960 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011007360842738294, + "loss": 0.0072, + "step": 250970 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011006604073436892, + "loss": 0.0057, + "step": 250980 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011005847304135492, + "loss": 0.0099, + "step": 250990 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011005090534834091, + "loss": 0.01, + "step": 251000 + }, + { + "epoch": 1.27, + "eval_cer": 0.9144605519419082, + "eval_loss": 0.0065511371940374374, + "eval_runtime": 116.1225, + "eval_samples_per_second": 17.223, + "eval_steps_per_second": 4.306, + "step": 251000 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011004333765532689, + "loss": 0.008, + "step": 251010 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011003576996231289, + "loss": 0.0103, + "step": 251020 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011002820226929888, + "loss": 0.0099, + "step": 251030 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011002063457628486, + "loss": 0.0089, + "step": 251040 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011001306688327086, + "loss": 0.0064, + "step": 251050 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011000549919025684, + "loss": 0.0073, + "step": 251060 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010999793149724282, + "loss": 0.0122, + "step": 251070 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001099903638042288, + "loss": 0.0112, + "step": 251080 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001099827961112148, + "loss": 0.0081, + "step": 251090 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001099752284182008, + "loss": 0.0078, + "step": 251100 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010996766072518677, + "loss": 0.0107, + "step": 251110 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010996009303217277, + "loss": 0.0084, + "step": 251120 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010995252533915876, + "loss": 0.0076, + "step": 251130 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010994495764614475, + "loss": 0.009, + "step": 251140 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010993738995313074, + "loss": 0.0084, + "step": 251150 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010992982226011672, + "loss": 0.0088, + "step": 251160 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010992225456710272, + "loss": 0.0078, + "step": 251170 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010991468687408871, + "loss": 0.0075, + "step": 251180 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001099071191810747, + "loss": 0.0084, + "step": 251190 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010989955148806069, + "loss": 0.007, + "step": 251200 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010989198379504668, + "loss": 0.0082, + "step": 251210 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010988441610203267, + "loss": 0.0088, + "step": 251220 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010987684840901866, + "loss": 0.008, + "step": 251230 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010986928071600464, + "loss": 0.0102, + "step": 251240 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010986171302299064, + "loss": 0.0115, + "step": 251250 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010985414532997663, + "loss": 0.009, + "step": 251260 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010984657763696261, + "loss": 0.0064, + "step": 251270 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010983900994394861, + "loss": 0.0101, + "step": 251280 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001098314422509346, + "loss": 0.0092, + "step": 251290 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010982387455792058, + "loss": 0.008, + "step": 251300 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010981630686490658, + "loss": 0.0094, + "step": 251310 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010980873917189256, + "loss": 0.0088, + "step": 251320 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010980117147887856, + "loss": 0.0083, + "step": 251330 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010979360378586455, + "loss": 0.0069, + "step": 251340 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010978603609285053, + "loss": 0.0097, + "step": 251350 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010977846839983653, + "loss": 0.0093, + "step": 251360 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010977090070682252, + "loss": 0.0067, + "step": 251370 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001097633330138085, + "loss": 0.0083, + "step": 251380 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001097557653207945, + "loss": 0.0096, + "step": 251390 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001097481976277805, + "loss": 0.0085, + "step": 251400 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010974062993476648, + "loss": 0.0088, + "step": 251410 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010973306224175247, + "loss": 0.0075, + "step": 251420 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010972549454873845, + "loss": 0.0082, + "step": 251430 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010971792685572445, + "loss": 0.01, + "step": 251440 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010971035916271044, + "loss": 0.0093, + "step": 251450 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010970279146969642, + "loss": 0.0108, + "step": 251460 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010969522377668242, + "loss": 0.0089, + "step": 251470 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010968765608366841, + "loss": 0.0074, + "step": 251480 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001096800883906544, + "loss": 0.0113, + "step": 251490 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010967252069764039, + "loss": 0.0082, + "step": 251500 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010966495300462637, + "loss": 0.0085, + "step": 251510 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010965738531161237, + "loss": 0.0115, + "step": 251520 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010964981761859836, + "loss": 0.0091, + "step": 251530 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010964224992558434, + "loss": 0.0076, + "step": 251540 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010963468223257034, + "loss": 0.0101, + "step": 251550 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010962711453955633, + "loss": 0.0086, + "step": 251560 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010961954684654231, + "loss": 0.0072, + "step": 251570 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010961197915352831, + "loss": 0.0104, + "step": 251580 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010960441146051429, + "loss": 0.0085, + "step": 251590 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010959684376750029, + "loss": 0.0097, + "step": 251600 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010958927607448628, + "loss": 0.0101, + "step": 251610 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010958170838147226, + "loss": 0.0098, + "step": 251620 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010957414068845826, + "loss": 0.0068, + "step": 251630 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010956657299544425, + "loss": 0.0095, + "step": 251640 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010955900530243023, + "loss": 0.009, + "step": 251650 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010955143760941623, + "loss": 0.0099, + "step": 251660 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010954386991640221, + "loss": 0.0068, + "step": 251670 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001095363022233882, + "loss": 0.008, + "step": 251680 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001095287345303742, + "loss": 0.0092, + "step": 251690 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010952116683736017, + "loss": 0.0072, + "step": 251700 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010951359914434616, + "loss": 0.0091, + "step": 251710 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010950603145133214, + "loss": 0.0075, + "step": 251720 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010949846375831814, + "loss": 0.0081, + "step": 251730 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010949089606530413, + "loss": 0.009, + "step": 251740 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010948332837229012, + "loss": 0.0122, + "step": 251750 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010947576067927611, + "loss": 0.0083, + "step": 251760 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010946819298626209, + "loss": 0.0077, + "step": 251770 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010946062529324809, + "loss": 0.0097, + "step": 251780 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010945305760023408, + "loss": 0.0082, + "step": 251790 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010944548990722006, + "loss": 0.0094, + "step": 251800 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010943792221420606, + "loss": 0.0111, + "step": 251810 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010943035452119205, + "loss": 0.0094, + "step": 251820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010942278682817803, + "loss": 0.0086, + "step": 251830 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010941521913516403, + "loss": 0.0095, + "step": 251840 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010940765144215002, + "loss": 0.0117, + "step": 251850 + }, + { + "epoch": 1.27, + "learning_rate": 0.000109400083749136, + "loss": 0.011, + "step": 251860 + }, + { + "epoch": 1.27, + "learning_rate": 0.000109392516056122, + "loss": 0.0084, + "step": 251870 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010938494836310798, + "loss": 0.0079, + "step": 251880 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010937738067009398, + "loss": 0.0087, + "step": 251890 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010936981297707997, + "loss": 0.0064, + "step": 251900 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010936224528406595, + "loss": 0.0084, + "step": 251910 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010935467759105195, + "loss": 0.0076, + "step": 251920 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010934710989803794, + "loss": 0.0084, + "step": 251930 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010933954220502393, + "loss": 0.0093, + "step": 251940 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010933197451200992, + "loss": 0.0097, + "step": 251950 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001093244068189959, + "loss": 0.0075, + "step": 251960 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001093168391259819, + "loss": 0.0095, + "step": 251970 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010930927143296789, + "loss": 0.0093, + "step": 251980 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010930170373995387, + "loss": 0.0078, + "step": 251990 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010929413604693987, + "loss": 0.0073, + "step": 252000 + }, + { + "epoch": 1.27, + "eval_cer": 0.9144789894682909, + "eval_loss": 0.006821473129093647, + "eval_runtime": 116.1992, + "eval_samples_per_second": 17.212, + "eval_steps_per_second": 4.303, + "step": 252000 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010928656835392586, + "loss": 0.0073, + "step": 252010 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010927900066091184, + "loss": 0.008, + "step": 252020 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010927143296789784, + "loss": 0.008, + "step": 252030 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010926386527488382, + "loss": 0.0102, + "step": 252040 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010925629758186982, + "loss": 0.0111, + "step": 252050 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010924872988885581, + "loss": 0.0092, + "step": 252060 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010924116219584179, + "loss": 0.0105, + "step": 252070 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010923359450282779, + "loss": 0.0085, + "step": 252080 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010922602680981378, + "loss": 0.0093, + "step": 252090 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010921845911679976, + "loss": 0.0074, + "step": 252100 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010921089142378576, + "loss": 0.008, + "step": 252110 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010920332373077174, + "loss": 0.0098, + "step": 252120 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010919575603775774, + "loss": 0.0109, + "step": 252130 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010918818834474373, + "loss": 0.0083, + "step": 252140 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010918062065172971, + "loss": 0.0078, + "step": 252150 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010917305295871571, + "loss": 0.0095, + "step": 252160 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001091654852657017, + "loss": 0.0081, + "step": 252170 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010915791757268768, + "loss": 0.0083, + "step": 252180 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010915034987967368, + "loss": 0.0097, + "step": 252190 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010914278218665966, + "loss": 0.0115, + "step": 252200 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010913521449364565, + "loss": 0.0086, + "step": 252210 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010912764680063165, + "loss": 0.0091, + "step": 252220 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010912007910761763, + "loss": 0.0093, + "step": 252230 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010911251141460363, + "loss": 0.0101, + "step": 252240 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010910494372158962, + "loss": 0.0114, + "step": 252250 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001090973760285756, + "loss": 0.0113, + "step": 252260 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001090898083355616, + "loss": 0.0083, + "step": 252270 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010908224064254758, + "loss": 0.0098, + "step": 252280 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010907467294953357, + "loss": 0.0095, + "step": 252290 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010906710525651957, + "loss": 0.0058, + "step": 252300 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010905953756350555, + "loss": 0.0095, + "step": 252310 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010905196987049153, + "loss": 0.0078, + "step": 252320 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010904440217747751, + "loss": 0.0087, + "step": 252330 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010903683448446351, + "loss": 0.0099, + "step": 252340 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001090292667914495, + "loss": 0.013, + "step": 252350 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010902169909843549, + "loss": 0.0082, + "step": 252360 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010901413140542148, + "loss": 0.0077, + "step": 252370 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010900656371240748, + "loss": 0.0088, + "step": 252380 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010899899601939346, + "loss": 0.0075, + "step": 252390 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010899142832637945, + "loss": 0.0079, + "step": 252400 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010898386063336543, + "loss": 0.0111, + "step": 252410 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010897629294035143, + "loss": 0.009, + "step": 252420 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010896872524733742, + "loss": 0.0089, + "step": 252430 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001089611575543234, + "loss": 0.0071, + "step": 252440 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001089535898613094, + "loss": 0.01, + "step": 252450 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001089460221682954, + "loss": 0.007, + "step": 252460 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010893845447528138, + "loss": 0.0075, + "step": 252470 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010893088678226737, + "loss": 0.0082, + "step": 252480 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010892331908925335, + "loss": 0.0066, + "step": 252490 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010891575139623935, + "loss": 0.0091, + "step": 252500 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010890818370322534, + "loss": 0.0088, + "step": 252510 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010890061601021132, + "loss": 0.0069, + "step": 252520 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010889304831719732, + "loss": 0.0084, + "step": 252530 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010888548062418331, + "loss": 0.0076, + "step": 252540 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001088779129311693, + "loss": 0.0093, + "step": 252550 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010887034523815529, + "loss": 0.01, + "step": 252560 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010886277754514127, + "loss": 0.0071, + "step": 252570 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010885520985212727, + "loss": 0.0075, + "step": 252580 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010884764215911326, + "loss": 0.0073, + "step": 252590 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010884007446609924, + "loss": 0.0089, + "step": 252600 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010883250677308524, + "loss": 0.0086, + "step": 252610 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010882493908007123, + "loss": 0.0087, + "step": 252620 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010881737138705721, + "loss": 0.0078, + "step": 252630 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010880980369404321, + "loss": 0.0086, + "step": 252640 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010880223600102919, + "loss": 0.0088, + "step": 252650 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010879466830801519, + "loss": 0.01, + "step": 252660 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010878710061500118, + "loss": 0.0066, + "step": 252670 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010877953292198716, + "loss": 0.0095, + "step": 252680 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010877196522897316, + "loss": 0.0091, + "step": 252690 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010876439753595915, + "loss": 0.0073, + "step": 252700 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010875682984294513, + "loss": 0.007, + "step": 252710 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010874926214993113, + "loss": 0.0081, + "step": 252720 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010874169445691711, + "loss": 0.0079, + "step": 252730 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001087341267639031, + "loss": 0.0083, + "step": 252740 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001087265590708891, + "loss": 0.0078, + "step": 252750 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010871899137787508, + "loss": 0.008, + "step": 252760 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010871142368486108, + "loss": 0.0079, + "step": 252770 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010870385599184707, + "loss": 0.0082, + "step": 252780 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010869628829883305, + "loss": 0.0076, + "step": 252790 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010868872060581905, + "loss": 0.007, + "step": 252800 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010868115291280504, + "loss": 0.0071, + "step": 252810 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010867358521979102, + "loss": 0.0149, + "step": 252820 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010866601752677702, + "loss": 0.0081, + "step": 252830 + }, + { + "epoch": 1.28, + "learning_rate": 0.000108658449833763, + "loss": 0.0081, + "step": 252840 + }, + { + "epoch": 1.28, + "learning_rate": 0.000108650882140749, + "loss": 0.0087, + "step": 252850 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010864331444773499, + "loss": 0.0088, + "step": 252860 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010863574675472097, + "loss": 0.0068, + "step": 252870 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010862817906170697, + "loss": 0.0077, + "step": 252880 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010862061136869296, + "loss": 0.0066, + "step": 252890 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010861304367567894, + "loss": 0.0096, + "step": 252900 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010860547598266494, + "loss": 0.006, + "step": 252910 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010859790828965092, + "loss": 0.0083, + "step": 252920 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010859034059663692, + "loss": 0.0099, + "step": 252930 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010858277290362291, + "loss": 0.0076, + "step": 252940 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010857520521060888, + "loss": 0.0091, + "step": 252950 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010856763751759487, + "loss": 0.0137, + "step": 252960 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010856006982458085, + "loss": 0.008, + "step": 252970 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010855250213156685, + "loss": 0.0133, + "step": 252980 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010854493443855284, + "loss": 0.009, + "step": 252990 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010853736674553883, + "loss": 0.0104, + "step": 253000 + }, + { + "epoch": 1.28, + "eval_cer": 0.914462492734159, + "eval_loss": 0.006441994570195675, + "eval_runtime": 116.0386, + "eval_samples_per_second": 17.236, + "eval_steps_per_second": 4.309, + "step": 253000 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010852979905252482, + "loss": 0.0092, + "step": 253010 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001085222313595108, + "loss": 0.0089, + "step": 253020 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001085146636664968, + "loss": 0.0102, + "step": 253030 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010850709597348279, + "loss": 0.0077, + "step": 253040 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010849952828046877, + "loss": 0.0061, + "step": 253050 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010849196058745477, + "loss": 0.0063, + "step": 253060 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010848439289444076, + "loss": 0.0087, + "step": 253070 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010847682520142675, + "loss": 0.0101, + "step": 253080 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010846925750841274, + "loss": 0.0072, + "step": 253090 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010846168981539872, + "loss": 0.0116, + "step": 253100 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010845412212238472, + "loss": 0.0094, + "step": 253110 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010844655442937071, + "loss": 0.0119, + "step": 253120 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010843898673635669, + "loss": 0.0078, + "step": 253130 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010843141904334269, + "loss": 0.0098, + "step": 253140 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010842385135032868, + "loss": 0.0076, + "step": 253150 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010841628365731466, + "loss": 0.0073, + "step": 253160 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010840871596430066, + "loss": 0.0101, + "step": 253170 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010840114827128664, + "loss": 0.0056, + "step": 253180 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010839358057827264, + "loss": 0.0105, + "step": 253190 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010838601288525863, + "loss": 0.0076, + "step": 253200 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010837844519224461, + "loss": 0.0093, + "step": 253210 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010837087749923061, + "loss": 0.0098, + "step": 253220 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001083633098062166, + "loss": 0.0087, + "step": 253230 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010835574211320258, + "loss": 0.0076, + "step": 253240 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010834817442018858, + "loss": 0.0082, + "step": 253250 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010834060672717456, + "loss": 0.0101, + "step": 253260 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010833303903416056, + "loss": 0.0087, + "step": 253270 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010832547134114655, + "loss": 0.0085, + "step": 253280 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010831790364813253, + "loss": 0.0092, + "step": 253290 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010831033595511853, + "loss": 0.0082, + "step": 253300 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010830276826210452, + "loss": 0.0058, + "step": 253310 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001082952005690905, + "loss": 0.0075, + "step": 253320 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001082876328760765, + "loss": 0.008, + "step": 253330 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010828006518306249, + "loss": 0.008, + "step": 253340 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010827249749004847, + "loss": 0.0085, + "step": 253350 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010826492979703447, + "loss": 0.0099, + "step": 253360 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010825736210402045, + "loss": 0.0093, + "step": 253370 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010824979441100645, + "loss": 0.0081, + "step": 253380 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010824222671799244, + "loss": 0.0081, + "step": 253390 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010823465902497842, + "loss": 0.0096, + "step": 253400 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010822709133196442, + "loss": 0.0087, + "step": 253410 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010821952363895041, + "loss": 0.0083, + "step": 253420 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001082119559459364, + "loss": 0.0083, + "step": 253430 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010820438825292239, + "loss": 0.008, + "step": 253440 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010819682055990837, + "loss": 0.0079, + "step": 253450 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010818925286689437, + "loss": 0.0076, + "step": 253460 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010818168517388036, + "loss": 0.0065, + "step": 253470 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010817411748086634, + "loss": 0.0085, + "step": 253480 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010816654978785234, + "loss": 0.0091, + "step": 253490 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010815898209483833, + "loss": 0.0084, + "step": 253500 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010815141440182431, + "loss": 0.0096, + "step": 253510 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010814384670881031, + "loss": 0.0078, + "step": 253520 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010813627901579629, + "loss": 0.0063, + "step": 253530 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010812871132278228, + "loss": 0.0098, + "step": 253540 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010812114362976828, + "loss": 0.0076, + "step": 253550 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010811357593675426, + "loss": 0.0078, + "step": 253560 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010810600824374026, + "loss": 0.0088, + "step": 253570 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010809844055072622, + "loss": 0.0088, + "step": 253580 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010809087285771222, + "loss": 0.0081, + "step": 253590 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010808330516469821, + "loss": 0.0106, + "step": 253600 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001080757374716842, + "loss": 0.0098, + "step": 253610 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010806816977867019, + "loss": 0.0077, + "step": 253620 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010806060208565617, + "loss": 0.0113, + "step": 253630 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010805303439264217, + "loss": 0.0108, + "step": 253640 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010804546669962816, + "loss": 0.0066, + "step": 253650 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010803789900661414, + "loss": 0.0083, + "step": 253660 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010803033131360014, + "loss": 0.0077, + "step": 253670 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010802276362058613, + "loss": 0.0091, + "step": 253680 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010801519592757211, + "loss": 0.0111, + "step": 253690 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010800762823455811, + "loss": 0.0066, + "step": 253700 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010800006054154409, + "loss": 0.0086, + "step": 253710 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010799249284853009, + "loss": 0.0077, + "step": 253720 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010798492515551608, + "loss": 0.0101, + "step": 253730 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010797735746250206, + "loss": 0.0064, + "step": 253740 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010796978976948806, + "loss": 0.0095, + "step": 253750 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010796222207647405, + "loss": 0.0089, + "step": 253760 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010795465438346003, + "loss": 0.0085, + "step": 253770 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010794708669044603, + "loss": 0.0114, + "step": 253780 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010793951899743202, + "loss": 0.0083, + "step": 253790 + }, + { + "epoch": 1.28, + "learning_rate": 0.000107931951304418, + "loss": 0.0082, + "step": 253800 + }, + { + "epoch": 1.28, + "learning_rate": 0.000107924383611404, + "loss": 0.0098, + "step": 253810 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010791681591838998, + "loss": 0.0109, + "step": 253820 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010790924822537598, + "loss": 0.0069, + "step": 253830 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010790168053236197, + "loss": 0.0092, + "step": 253840 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010789411283934795, + "loss": 0.0066, + "step": 253850 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010788654514633395, + "loss": 0.0077, + "step": 253860 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010787897745331994, + "loss": 0.0086, + "step": 253870 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010787140976030592, + "loss": 0.008, + "step": 253880 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010786384206729192, + "loss": 0.0077, + "step": 253890 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001078562743742779, + "loss": 0.0068, + "step": 253900 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001078487066812639, + "loss": 0.0079, + "step": 253910 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010784113898824989, + "loss": 0.0103, + "step": 253920 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010783357129523587, + "loss": 0.0084, + "step": 253930 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010782600360222187, + "loss": 0.0103, + "step": 253940 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010781843590920786, + "loss": 0.0072, + "step": 253950 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010781086821619384, + "loss": 0.0081, + "step": 253960 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010780330052317984, + "loss": 0.0073, + "step": 253970 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010779573283016582, + "loss": 0.0068, + "step": 253980 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010778816513715182, + "loss": 0.0079, + "step": 253990 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010778059744413781, + "loss": 0.0083, + "step": 254000 + }, + { + "epoch": 1.28, + "eval_cer": 0.9144450256039017, + "eval_loss": 0.00646965904161334, + "eval_runtime": 116.1648, + "eval_samples_per_second": 17.217, + "eval_steps_per_second": 4.304, + "step": 254000 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010777302975112379, + "loss": 0.0087, + "step": 254010 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010776546205810979, + "loss": 0.0091, + "step": 254020 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010775789436509578, + "loss": 0.0086, + "step": 254030 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010775032667208176, + "loss": 0.007, + "step": 254040 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010774275897906776, + "loss": 0.0056, + "step": 254050 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010773519128605374, + "loss": 0.0102, + "step": 254060 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010772762359303973, + "loss": 0.0067, + "step": 254070 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010772005590002573, + "loss": 0.0117, + "step": 254080 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010771248820701171, + "loss": 0.0115, + "step": 254090 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001077049205139977, + "loss": 0.0086, + "step": 254100 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001076973528209837, + "loss": 0.0099, + "step": 254110 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010768978512796968, + "loss": 0.0091, + "step": 254120 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010768221743495568, + "loss": 0.0071, + "step": 254130 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010767464974194166, + "loss": 0.0087, + "step": 254140 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010766708204892765, + "loss": 0.0093, + "step": 254150 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010765951435591365, + "loss": 0.0119, + "step": 254160 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010765194666289963, + "loss": 0.0076, + "step": 254170 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010764437896988563, + "loss": 0.0086, + "step": 254180 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010763681127687162, + "loss": 0.007, + "step": 254190 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001076292435838576, + "loss": 0.0095, + "step": 254200 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010762167589084358, + "loss": 0.0099, + "step": 254210 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010761410819782956, + "loss": 0.0076, + "step": 254220 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010760654050481556, + "loss": 0.0084, + "step": 254230 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010759897281180155, + "loss": 0.0107, + "step": 254240 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010759140511878754, + "loss": 0.0091, + "step": 254250 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010758383742577353, + "loss": 0.0097, + "step": 254260 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010757626973275951, + "loss": 0.0082, + "step": 254270 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010756870203974551, + "loss": 0.0086, + "step": 254280 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001075611343467315, + "loss": 0.0054, + "step": 254290 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010755356665371748, + "loss": 0.0101, + "step": 254300 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010754599896070348, + "loss": 0.0087, + "step": 254310 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010753843126768947, + "loss": 0.008, + "step": 254320 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010753086357467546, + "loss": 0.0066, + "step": 254330 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010752329588166145, + "loss": 0.0086, + "step": 254340 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010751572818864743, + "loss": 0.0067, + "step": 254350 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010750816049563343, + "loss": 0.0075, + "step": 254360 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010750059280261942, + "loss": 0.0091, + "step": 254370 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001074930251096054, + "loss": 0.0079, + "step": 254380 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001074854574165914, + "loss": 0.0082, + "step": 254390 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001074778897235774, + "loss": 0.0079, + "step": 254400 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010747032203056337, + "loss": 0.0081, + "step": 254410 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010746275433754937, + "loss": 0.0174, + "step": 254420 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010745518664453535, + "loss": 0.0067, + "step": 254430 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010744761895152135, + "loss": 0.0102, + "step": 254440 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010744005125850734, + "loss": 0.0054, + "step": 254450 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010743248356549332, + "loss": 0.0075, + "step": 254460 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010742491587247932, + "loss": 0.0085, + "step": 254470 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010741734817946531, + "loss": 0.0096, + "step": 254480 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001074097804864513, + "loss": 0.0095, + "step": 254490 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010740221279343729, + "loss": 0.0095, + "step": 254500 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010739464510042327, + "loss": 0.0093, + "step": 254510 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010738707740740927, + "loss": 0.011, + "step": 254520 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010737950971439526, + "loss": 0.0073, + "step": 254530 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010737194202138124, + "loss": 0.0104, + "step": 254540 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010736437432836724, + "loss": 0.0081, + "step": 254550 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010735680663535323, + "loss": 0.0097, + "step": 254560 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010734923894233921, + "loss": 0.0077, + "step": 254570 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010734167124932521, + "loss": 0.0076, + "step": 254580 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010733410355631119, + "loss": 0.0079, + "step": 254590 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010732653586329718, + "loss": 0.0133, + "step": 254600 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010731896817028318, + "loss": 0.0108, + "step": 254610 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010731140047726916, + "loss": 0.0079, + "step": 254620 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010730383278425516, + "loss": 0.0094, + "step": 254630 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010729626509124115, + "loss": 0.0073, + "step": 254640 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010728869739822713, + "loss": 0.0094, + "step": 254650 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010728112970521313, + "loss": 0.0096, + "step": 254660 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010727356201219911, + "loss": 0.0085, + "step": 254670 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001072659943191851, + "loss": 0.0091, + "step": 254680 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001072584266261711, + "loss": 0.0088, + "step": 254690 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010725085893315708, + "loss": 0.0103, + "step": 254700 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010724329124014308, + "loss": 0.0095, + "step": 254710 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010723572354712907, + "loss": 0.0085, + "step": 254720 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010722815585411505, + "loss": 0.0077, + "step": 254730 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010722058816110105, + "loss": 0.0079, + "step": 254740 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010721302046808704, + "loss": 0.0082, + "step": 254750 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010720545277507302, + "loss": 0.0093, + "step": 254760 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010719788508205902, + "loss": 0.0098, + "step": 254770 + }, + { + "epoch": 1.29, + "learning_rate": 0.000107190317389045, + "loss": 0.0109, + "step": 254780 + }, + { + "epoch": 1.29, + "learning_rate": 0.000107182749696031, + "loss": 0.0098, + "step": 254790 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010717518200301699, + "loss": 0.0088, + "step": 254800 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010716761431000297, + "loss": 0.0068, + "step": 254810 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010716004661698897, + "loss": 0.0066, + "step": 254820 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010715247892397496, + "loss": 0.0084, + "step": 254830 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010714491123096093, + "loss": 0.0066, + "step": 254840 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010713734353794692, + "loss": 0.0097, + "step": 254850 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001071297758449329, + "loss": 0.0091, + "step": 254860 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001071222081519189, + "loss": 0.0077, + "step": 254870 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010711464045890488, + "loss": 0.0077, + "step": 254880 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010710707276589088, + "loss": 0.0065, + "step": 254890 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010709950507287687, + "loss": 0.0063, + "step": 254900 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010709193737986285, + "loss": 0.0095, + "step": 254910 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010708436968684885, + "loss": 0.0085, + "step": 254920 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010707680199383484, + "loss": 0.0083, + "step": 254930 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010706923430082082, + "loss": 0.0083, + "step": 254940 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010706166660780682, + "loss": 0.0091, + "step": 254950 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001070540989147928, + "loss": 0.0081, + "step": 254960 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001070465312217788, + "loss": 0.0079, + "step": 254970 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010703896352876479, + "loss": 0.0076, + "step": 254980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010703139583575077, + "loss": 0.0068, + "step": 254990 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010702382814273677, + "loss": 0.0085, + "step": 255000 + }, + { + "epoch": 1.29, + "eval_cer": 0.9144411440194001, + "eval_loss": 0.006503617390990257, + "eval_runtime": 116.441, + "eval_samples_per_second": 17.176, + "eval_steps_per_second": 4.294, + "step": 255000 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010701626044972276, + "loss": 0.0077, + "step": 255010 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010700869275670874, + "loss": 0.0102, + "step": 255020 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010700112506369474, + "loss": 0.01, + "step": 255030 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010699355737068072, + "loss": 0.0079, + "step": 255040 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010698598967766672, + "loss": 0.0077, + "step": 255050 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010697842198465271, + "loss": 0.0095, + "step": 255060 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010697085429163869, + "loss": 0.0066, + "step": 255070 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010696328659862469, + "loss": 0.0077, + "step": 255080 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010695571890561068, + "loss": 0.0085, + "step": 255090 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010694815121259666, + "loss": 0.0082, + "step": 255100 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010694058351958266, + "loss": 0.0094, + "step": 255110 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010693301582656864, + "loss": 0.0108, + "step": 255120 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010692544813355463, + "loss": 0.0079, + "step": 255130 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010691788044054063, + "loss": 0.0101, + "step": 255140 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010691031274752661, + "loss": 0.0099, + "step": 255150 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001069027450545126, + "loss": 0.0064, + "step": 255160 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001068951773614986, + "loss": 0.0099, + "step": 255170 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010688760966848458, + "loss": 0.0072, + "step": 255180 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010688004197547058, + "loss": 0.0076, + "step": 255190 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010687247428245656, + "loss": 0.0069, + "step": 255200 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010686490658944255, + "loss": 0.0071, + "step": 255210 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010685733889642855, + "loss": 0.0081, + "step": 255220 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010684977120341453, + "loss": 0.0077, + "step": 255230 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010684220351040053, + "loss": 0.0082, + "step": 255240 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010683463581738652, + "loss": 0.0086, + "step": 255250 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001068270681243725, + "loss": 0.0077, + "step": 255260 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001068195004313585, + "loss": 0.0067, + "step": 255270 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010681193273834449, + "loss": 0.0075, + "step": 255280 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010680436504533047, + "loss": 0.0084, + "step": 255290 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010679679735231647, + "loss": 0.009, + "step": 255300 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010678922965930245, + "loss": 0.0091, + "step": 255310 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010678166196628845, + "loss": 0.0089, + "step": 255320 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010677409427327444, + "loss": 0.0099, + "step": 255330 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010676652658026042, + "loss": 0.0086, + "step": 255340 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010675895888724642, + "loss": 0.0082, + "step": 255350 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010675139119423241, + "loss": 0.0066, + "step": 255360 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010674382350121839, + "loss": 0.0111, + "step": 255370 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010673625580820439, + "loss": 0.0081, + "step": 255380 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010672868811519037, + "loss": 0.0074, + "step": 255390 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010672112042217636, + "loss": 0.0077, + "step": 255400 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010671355272916236, + "loss": 0.0106, + "step": 255410 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010670598503614834, + "loss": 0.0102, + "step": 255420 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010669841734313434, + "loss": 0.0095, + "step": 255430 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010669084965012033, + "loss": 0.0085, + "step": 255440 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010668328195710631, + "loss": 0.0077, + "step": 255450 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010667571426409231, + "loss": 0.007, + "step": 255460 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010666814657107828, + "loss": 0.0067, + "step": 255470 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010666057887806427, + "loss": 0.0087, + "step": 255480 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010665301118505025, + "loss": 0.0079, + "step": 255490 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010664544349203625, + "loss": 0.0123, + "step": 255500 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010663787579902224, + "loss": 0.0079, + "step": 255510 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010663030810600822, + "loss": 0.0073, + "step": 255520 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010662274041299422, + "loss": 0.0078, + "step": 255530 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010661517271998021, + "loss": 0.0081, + "step": 255540 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001066076050269662, + "loss": 0.0059, + "step": 255550 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010660003733395219, + "loss": 0.0078, + "step": 255560 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010659246964093817, + "loss": 0.0106, + "step": 255570 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010658490194792417, + "loss": 0.0103, + "step": 255580 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010657733425491016, + "loss": 0.0072, + "step": 255590 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010656976656189614, + "loss": 0.0102, + "step": 255600 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010656219886888214, + "loss": 0.0095, + "step": 255610 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010655463117586813, + "loss": 0.01, + "step": 255620 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010654706348285411, + "loss": 0.0071, + "step": 255630 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010653949578984011, + "loss": 0.0072, + "step": 255640 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010653192809682609, + "loss": 0.0082, + "step": 255650 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010652436040381209, + "loss": 0.0116, + "step": 255660 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010651679271079808, + "loss": 0.0079, + "step": 255670 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010650922501778406, + "loss": 0.0082, + "step": 255680 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010650165732477006, + "loss": 0.0076, + "step": 255690 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010649408963175605, + "loss": 0.0062, + "step": 255700 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010648652193874203, + "loss": 0.0081, + "step": 255710 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010647895424572803, + "loss": 0.006, + "step": 255720 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010647138655271402, + "loss": 0.0097, + "step": 255730 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001064638188597, + "loss": 0.009, + "step": 255740 + }, + { + "epoch": 1.29, + "learning_rate": 0.000106456251166686, + "loss": 0.007, + "step": 255750 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010644868347367198, + "loss": 0.0082, + "step": 255760 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010644111578065798, + "loss": 0.0082, + "step": 255770 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010643354808764397, + "loss": 0.0096, + "step": 255780 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010642598039462995, + "loss": 0.0097, + "step": 255790 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010641841270161595, + "loss": 0.0076, + "step": 255800 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010641084500860194, + "loss": 0.0061, + "step": 255810 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010640327731558792, + "loss": 0.0092, + "step": 255820 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010639570962257392, + "loss": 0.0111, + "step": 255830 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001063881419295599, + "loss": 0.0082, + "step": 255840 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001063805742365459, + "loss": 0.0073, + "step": 255850 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010637300654353189, + "loss": 0.01, + "step": 255860 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010636543885051787, + "loss": 0.0084, + "step": 255870 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010635787115750387, + "loss": 0.0084, + "step": 255880 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010635030346448986, + "loss": 0.0101, + "step": 255890 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010634273577147584, + "loss": 0.0082, + "step": 255900 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010633516807846184, + "loss": 0.0078, + "step": 255910 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010632760038544782, + "loss": 0.008, + "step": 255920 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010632003269243381, + "loss": 0.0119, + "step": 255930 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010631246499941981, + "loss": 0.0065, + "step": 255940 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010630489730640579, + "loss": 0.0079, + "step": 255950 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010629732961339179, + "loss": 0.0069, + "step": 255960 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010628976192037778, + "loss": 0.0073, + "step": 255970 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010628219422736376, + "loss": 0.01, + "step": 255980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010627462653434976, + "loss": 0.0083, + "step": 255990 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010626705884133574, + "loss": 0.0072, + "step": 256000 + }, + { + "epoch": 1.29, + "eval_cer": 0.9144615223380336, + "eval_loss": 0.00655102264136076, + "eval_runtime": 116.4546, + "eval_samples_per_second": 17.174, + "eval_steps_per_second": 4.294, + "step": 256000 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010625949114832173, + "loss": 0.0075, + "step": 256010 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010625192345530773, + "loss": 0.007, + "step": 256020 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010624435576229371, + "loss": 0.01, + "step": 256030 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001062367880692797, + "loss": 0.0083, + "step": 256040 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001062292203762657, + "loss": 0.0073, + "step": 256050 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010622165268325168, + "loss": 0.0081, + "step": 256060 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010621408499023768, + "loss": 0.0099, + "step": 256070 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010620651729722366, + "loss": 0.0083, + "step": 256080 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010619894960420965, + "loss": 0.0073, + "step": 256090 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010619138191119562, + "loss": 0.0084, + "step": 256100 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010618381421818162, + "loss": 0.0085, + "step": 256110 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010617624652516761, + "loss": 0.008, + "step": 256120 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010616867883215359, + "loss": 0.0109, + "step": 256130 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010616111113913959, + "loss": 0.0098, + "step": 256140 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010615354344612558, + "loss": 0.0094, + "step": 256150 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010614597575311156, + "loss": 0.0076, + "step": 256160 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010613840806009756, + "loss": 0.0082, + "step": 256170 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010613084036708355, + "loss": 0.0084, + "step": 256180 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010612327267406954, + "loss": 0.0103, + "step": 256190 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010611570498105553, + "loss": 0.0092, + "step": 256200 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010610813728804151, + "loss": 0.0091, + "step": 256210 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001061005695950275, + "loss": 0.0086, + "step": 256220 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001060930019020135, + "loss": 0.0085, + "step": 256230 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010608543420899948, + "loss": 0.0095, + "step": 256240 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010607786651598548, + "loss": 0.0098, + "step": 256250 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010607029882297147, + "loss": 0.0072, + "step": 256260 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010606273112995745, + "loss": 0.0059, + "step": 256270 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010605516343694345, + "loss": 0.0112, + "step": 256280 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010604759574392943, + "loss": 0.0104, + "step": 256290 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010604002805091543, + "loss": 0.0111, + "step": 256300 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010603246035790142, + "loss": 0.0069, + "step": 256310 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001060248926648874, + "loss": 0.0092, + "step": 256320 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001060173249718734, + "loss": 0.0073, + "step": 256330 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010600975727885939, + "loss": 0.0066, + "step": 256340 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010600218958584537, + "loss": 0.0065, + "step": 256350 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010599462189283137, + "loss": 0.0083, + "step": 256360 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010598705419981735, + "loss": 0.0079, + "step": 256370 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010597948650680335, + "loss": 0.0065, + "step": 256380 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010597191881378934, + "loss": 0.0103, + "step": 256390 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010596435112077532, + "loss": 0.0078, + "step": 256400 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010595678342776132, + "loss": 0.0073, + "step": 256410 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010594921573474731, + "loss": 0.0068, + "step": 256420 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010594164804173329, + "loss": 0.0089, + "step": 256430 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010593408034871929, + "loss": 0.0068, + "step": 256440 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010592651265570527, + "loss": 0.0098, + "step": 256450 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010591894496269126, + "loss": 0.0068, + "step": 256460 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010591137726967726, + "loss": 0.0096, + "step": 256470 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010590380957666324, + "loss": 0.0087, + "step": 256480 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010589624188364924, + "loss": 0.0102, + "step": 256490 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010588867419063523, + "loss": 0.0071, + "step": 256500 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010588110649762121, + "loss": 0.0083, + "step": 256510 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010587353880460721, + "loss": 0.0073, + "step": 256520 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010586597111159319, + "loss": 0.0082, + "step": 256530 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010585840341857918, + "loss": 0.0058, + "step": 256540 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010585083572556518, + "loss": 0.0082, + "step": 256550 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010584326803255116, + "loss": 0.0075, + "step": 256560 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010583570033953716, + "loss": 0.0111, + "step": 256570 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010582813264652315, + "loss": 0.0122, + "step": 256580 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010582056495350913, + "loss": 0.0064, + "step": 256590 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010581299726049513, + "loss": 0.007, + "step": 256600 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010580542956748111, + "loss": 0.0099, + "step": 256610 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001057978618744671, + "loss": 0.0096, + "step": 256620 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001057902941814531, + "loss": 0.0086, + "step": 256630 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010578272648843908, + "loss": 0.0067, + "step": 256640 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010577515879542507, + "loss": 0.0092, + "step": 256650 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010576759110241107, + "loss": 0.0104, + "step": 256660 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010576002340939705, + "loss": 0.0091, + "step": 256670 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010575245571638305, + "loss": 0.0085, + "step": 256680 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010574488802336904, + "loss": 0.0091, + "step": 256690 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010573732033035502, + "loss": 0.0096, + "step": 256700 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010572975263734102, + "loss": 0.0076, + "step": 256710 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010572218494432699, + "loss": 0.0088, + "step": 256720 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010571461725131298, + "loss": 0.0076, + "step": 256730 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010570704955829896, + "loss": 0.0076, + "step": 256740 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010569948186528496, + "loss": 0.007, + "step": 256750 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010569191417227095, + "loss": 0.0103, + "step": 256760 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010568434647925693, + "loss": 0.0113, + "step": 256770 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010567677878624293, + "loss": 0.0086, + "step": 256780 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010566921109322892, + "loss": 0.0086, + "step": 256790 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001056616434002149, + "loss": 0.0076, + "step": 256800 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001056540757072009, + "loss": 0.0071, + "step": 256810 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010564650801418688, + "loss": 0.0076, + "step": 256820 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010563894032117288, + "loss": 0.0079, + "step": 256830 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010563137262815887, + "loss": 0.0084, + "step": 256840 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010562380493514485, + "loss": 0.0096, + "step": 256850 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010561623724213085, + "loss": 0.0077, + "step": 256860 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010560866954911684, + "loss": 0.0073, + "step": 256870 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010560110185610282, + "loss": 0.0058, + "step": 256880 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010559353416308882, + "loss": 0.0077, + "step": 256890 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001055859664700748, + "loss": 0.009, + "step": 256900 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001055783987770608, + "loss": 0.0109, + "step": 256910 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010557083108404679, + "loss": 0.0076, + "step": 256920 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010556326339103277, + "loss": 0.0121, + "step": 256930 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010555569569801877, + "loss": 0.0067, + "step": 256940 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010554812800500476, + "loss": 0.0082, + "step": 256950 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010554056031199074, + "loss": 0.0062, + "step": 256960 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010553299261897674, + "loss": 0.0082, + "step": 256970 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010552542492596272, + "loss": 0.007, + "step": 256980 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010551785723294871, + "loss": 0.0085, + "step": 256990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010551028953993471, + "loss": 0.0071, + "step": 257000 + }, + { + "epoch": 1.3, + "eval_cer": 0.914467344714786, + "eval_loss": 0.006512925960123539, + "eval_runtime": 116.5432, + "eval_samples_per_second": 17.161, + "eval_steps_per_second": 4.29, + "step": 257000 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010550272184692069, + "loss": 0.0082, + "step": 257010 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010549515415390669, + "loss": 0.0078, + "step": 257020 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010548758646089268, + "loss": 0.0088, + "step": 257030 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010548001876787866, + "loss": 0.0096, + "step": 257040 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010547245107486466, + "loss": 0.0073, + "step": 257050 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010546488338185064, + "loss": 0.0076, + "step": 257060 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010545731568883663, + "loss": 0.0102, + "step": 257070 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010544974799582263, + "loss": 0.009, + "step": 257080 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010544218030280861, + "loss": 0.0085, + "step": 257090 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001054346126097946, + "loss": 0.011, + "step": 257100 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001054270449167806, + "loss": 0.0064, + "step": 257110 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010541947722376658, + "loss": 0.0097, + "step": 257120 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010541190953075258, + "loss": 0.0094, + "step": 257130 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010540434183773856, + "loss": 0.0082, + "step": 257140 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010539677414472455, + "loss": 0.0079, + "step": 257150 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010538920645171055, + "loss": 0.0079, + "step": 257160 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010538163875869653, + "loss": 0.0105, + "step": 257170 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010537407106568252, + "loss": 0.0108, + "step": 257180 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010536650337266852, + "loss": 0.0124, + "step": 257190 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001053589356796545, + "loss": 0.0101, + "step": 257200 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001053513679866405, + "loss": 0.0067, + "step": 257210 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010534380029362649, + "loss": 0.0089, + "step": 257220 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010533623260061247, + "loss": 0.0073, + "step": 257230 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010532866490759847, + "loss": 0.01, + "step": 257240 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010532109721458445, + "loss": 0.0087, + "step": 257250 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010531352952157044, + "loss": 0.0102, + "step": 257260 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010530596182855644, + "loss": 0.0081, + "step": 257270 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010529839413554242, + "loss": 0.0079, + "step": 257280 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010529082644252842, + "loss": 0.0071, + "step": 257290 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010528325874951441, + "loss": 0.0066, + "step": 257300 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010527569105650039, + "loss": 0.0088, + "step": 257310 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010526812336348639, + "loss": 0.0085, + "step": 257320 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010526055567047237, + "loss": 0.0074, + "step": 257330 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010525298797745836, + "loss": 0.0088, + "step": 257340 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010524542028444433, + "loss": 0.0078, + "step": 257350 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010523785259143033, + "loss": 0.0096, + "step": 257360 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010523028489841632, + "loss": 0.0087, + "step": 257370 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001052227172054023, + "loss": 0.0079, + "step": 257380 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001052151495123883, + "loss": 0.0085, + "step": 257390 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010520758181937429, + "loss": 0.0082, + "step": 257400 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010520001412636027, + "loss": 0.0067, + "step": 257410 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010519244643334627, + "loss": 0.0085, + "step": 257420 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010518487874033225, + "loss": 0.0092, + "step": 257430 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010517731104731825, + "loss": 0.0061, + "step": 257440 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010516974335430424, + "loss": 0.0104, + "step": 257450 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010516217566129022, + "loss": 0.0088, + "step": 257460 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010515460796827622, + "loss": 0.0077, + "step": 257470 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010514704027526221, + "loss": 0.007, + "step": 257480 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001051394725822482, + "loss": 0.008, + "step": 257490 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010513190488923419, + "loss": 0.0072, + "step": 257500 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010512433719622017, + "loss": 0.0091, + "step": 257510 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010511676950320616, + "loss": 0.0077, + "step": 257520 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010510920181019216, + "loss": 0.007, + "step": 257530 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010510163411717814, + "loss": 0.0059, + "step": 257540 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010509406642416414, + "loss": 0.009, + "step": 257550 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010508649873115013, + "loss": 0.0077, + "step": 257560 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010507893103813611, + "loss": 0.009, + "step": 257570 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010507136334512211, + "loss": 0.0083, + "step": 257580 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010506379565210809, + "loss": 0.008, + "step": 257590 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010505622795909408, + "loss": 0.008, + "step": 257600 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010504866026608008, + "loss": 0.0073, + "step": 257610 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010504109257306606, + "loss": 0.0072, + "step": 257620 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010503352488005206, + "loss": 0.008, + "step": 257630 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010502595718703805, + "loss": 0.009, + "step": 257640 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010501838949402403, + "loss": 0.0075, + "step": 257650 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010501082180101003, + "loss": 0.0096, + "step": 257660 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010500325410799602, + "loss": 0.0074, + "step": 257670 + }, + { + "epoch": 1.3, + "learning_rate": 0.000104995686414982, + "loss": 0.0097, + "step": 257680 + }, + { + "epoch": 1.3, + "learning_rate": 0.000104988118721968, + "loss": 0.0064, + "step": 257690 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010498055102895398, + "loss": 0.0084, + "step": 257700 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010497298333593997, + "loss": 0.0089, + "step": 257710 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010496541564292597, + "loss": 0.0076, + "step": 257720 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010495784794991195, + "loss": 0.0089, + "step": 257730 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010495028025689795, + "loss": 0.0091, + "step": 257740 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010494271256388394, + "loss": 0.0084, + "step": 257750 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010493514487086992, + "loss": 0.0105, + "step": 257760 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010492757717785592, + "loss": 0.0098, + "step": 257770 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001049200094848419, + "loss": 0.0094, + "step": 257780 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001049124417918279, + "loss": 0.0105, + "step": 257790 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010490487409881389, + "loss": 0.0093, + "step": 257800 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010489730640579987, + "loss": 0.0108, + "step": 257810 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010488973871278587, + "loss": 0.008, + "step": 257820 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010488217101977186, + "loss": 0.0075, + "step": 257830 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010487460332675784, + "loss": 0.0106, + "step": 257840 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010486703563374384, + "loss": 0.0066, + "step": 257850 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010485946794072982, + "loss": 0.0099, + "step": 257860 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010485190024771581, + "loss": 0.0085, + "step": 257870 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010484433255470181, + "loss": 0.0074, + "step": 257880 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010483676486168779, + "loss": 0.0097, + "step": 257890 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010482919716867378, + "loss": 0.0063, + "step": 257900 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010482162947565978, + "loss": 0.0108, + "step": 257910 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010481406178264576, + "loss": 0.0082, + "step": 257920 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010480649408963176, + "loss": 0.011, + "step": 257930 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010479892639661774, + "loss": 0.0069, + "step": 257940 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010479135870360373, + "loss": 0.0096, + "step": 257950 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010478379101058973, + "loss": 0.0081, + "step": 257960 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010477622331757571, + "loss": 0.0073, + "step": 257970 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010476865562456169, + "loss": 0.0075, + "step": 257980 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010476108793154767, + "loss": 0.0078, + "step": 257990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010475352023853367, + "loss": 0.007, + "step": 258000 + }, + { + "epoch": 1.3, + "eval_cer": 0.9144421144155256, + "eval_loss": 0.006312798708677292, + "eval_runtime": 116.232, + "eval_samples_per_second": 17.207, + "eval_steps_per_second": 4.302, + "step": 258000 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010474595254551966, + "loss": 0.0089, + "step": 258010 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010473838485250564, + "loss": 0.0082, + "step": 258020 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010473081715949164, + "loss": 0.0086, + "step": 258030 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010472324946647762, + "loss": 0.0103, + "step": 258040 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010471568177346362, + "loss": 0.0107, + "step": 258050 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010470811408044961, + "loss": 0.0083, + "step": 258060 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010470054638743559, + "loss": 0.0068, + "step": 258070 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010469297869442159, + "loss": 0.0113, + "step": 258080 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010468541100140758, + "loss": 0.0092, + "step": 258090 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010467784330839356, + "loss": 0.0082, + "step": 258100 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010467027561537956, + "loss": 0.0086, + "step": 258110 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010466270792236555, + "loss": 0.007, + "step": 258120 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010465514022935153, + "loss": 0.0097, + "step": 258130 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010464757253633753, + "loss": 0.0092, + "step": 258140 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010464000484332351, + "loss": 0.0081, + "step": 258150 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001046324371503095, + "loss": 0.0077, + "step": 258160 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001046248694572955, + "loss": 0.0097, + "step": 258170 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010461730176428148, + "loss": 0.0071, + "step": 258180 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010460973407126748, + "loss": 0.009, + "step": 258190 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010460216637825347, + "loss": 0.0083, + "step": 258200 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010459459868523945, + "loss": 0.0077, + "step": 258210 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010458703099222545, + "loss": 0.0066, + "step": 258220 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010457946329921143, + "loss": 0.0066, + "step": 258230 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010457189560619743, + "loss": 0.011, + "step": 258240 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010456432791318342, + "loss": 0.0082, + "step": 258250 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001045567602201694, + "loss": 0.0067, + "step": 258260 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001045491925271554, + "loss": 0.0081, + "step": 258270 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010454162483414139, + "loss": 0.0085, + "step": 258280 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010453405714112737, + "loss": 0.007, + "step": 258290 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010452648944811337, + "loss": 0.0118, + "step": 258300 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010451892175509935, + "loss": 0.0094, + "step": 258310 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010451135406208534, + "loss": 0.008, + "step": 258320 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010450378636907134, + "loss": 0.0089, + "step": 258330 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010449621867605732, + "loss": 0.006, + "step": 258340 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010448865098304332, + "loss": 0.0077, + "step": 258350 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010448108329002931, + "loss": 0.0082, + "step": 258360 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010447351559701529, + "loss": 0.0083, + "step": 258370 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010446594790400129, + "loss": 0.0097, + "step": 258380 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010445838021098727, + "loss": 0.0065, + "step": 258390 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010445081251797326, + "loss": 0.0105, + "step": 258400 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010444324482495926, + "loss": 0.0073, + "step": 258410 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010443567713194524, + "loss": 0.0108, + "step": 258420 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010442810943893124, + "loss": 0.0085, + "step": 258430 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010442054174591723, + "loss": 0.0084, + "step": 258440 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010441297405290321, + "loss": 0.0084, + "step": 258450 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001044054063598892, + "loss": 0.0079, + "step": 258460 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010439783866687519, + "loss": 0.0085, + "step": 258470 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010439027097386118, + "loss": 0.0098, + "step": 258480 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010438270328084718, + "loss": 0.008, + "step": 258490 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010437513558783316, + "loss": 0.0082, + "step": 258500 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010436756789481915, + "loss": 0.0082, + "step": 258510 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010436000020180515, + "loss": 0.0095, + "step": 258520 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010435243250879113, + "loss": 0.0095, + "step": 258530 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010434486481577713, + "loss": 0.0096, + "step": 258540 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010433729712276311, + "loss": 0.007, + "step": 258550 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001043297294297491, + "loss": 0.0083, + "step": 258560 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001043221617367351, + "loss": 0.0082, + "step": 258570 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010431459404372108, + "loss": 0.01, + "step": 258580 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010430702635070707, + "loss": 0.0061, + "step": 258590 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010429945865769307, + "loss": 0.0076, + "step": 258600 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010429189096467904, + "loss": 0.0081, + "step": 258610 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010428432327166503, + "loss": 0.0086, + "step": 258620 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010427675557865101, + "loss": 0.0075, + "step": 258630 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010426918788563701, + "loss": 0.0092, + "step": 258640 + }, + { + "epoch": 1.3, + "learning_rate": 0.000104261620192623, + "loss": 0.0064, + "step": 258650 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010425405249960898, + "loss": 0.0091, + "step": 258660 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010424648480659498, + "loss": 0.007, + "step": 258670 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010423891711358096, + "loss": 0.0089, + "step": 258680 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010423134942056696, + "loss": 0.0069, + "step": 258690 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010422378172755295, + "loss": 0.0081, + "step": 258700 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010421621403453893, + "loss": 0.0078, + "step": 258710 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010420864634152493, + "loss": 0.0069, + "step": 258720 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010420107864851092, + "loss": 0.0089, + "step": 258730 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001041935109554969, + "loss": 0.0078, + "step": 258740 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001041859432624829, + "loss": 0.0086, + "step": 258750 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010417837556946888, + "loss": 0.0085, + "step": 258760 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010417080787645488, + "loss": 0.0093, + "step": 258770 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010416324018344087, + "loss": 0.0079, + "step": 258780 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010415567249042685, + "loss": 0.0091, + "step": 258790 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010414810479741285, + "loss": 0.0072, + "step": 258800 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010414053710439884, + "loss": 0.0086, + "step": 258810 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010413296941138482, + "loss": 0.011, + "step": 258820 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010412540171837082, + "loss": 0.0079, + "step": 258830 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001041178340253568, + "loss": 0.0096, + "step": 258840 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001041102663323428, + "loss": 0.0082, + "step": 258850 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010410269863932879, + "loss": 0.0087, + "step": 258860 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010409513094631477, + "loss": 0.0074, + "step": 258870 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010408756325330077, + "loss": 0.0072, + "step": 258880 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010407999556028676, + "loss": 0.01, + "step": 258890 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010407242786727274, + "loss": 0.0152, + "step": 258900 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010406486017425874, + "loss": 0.0074, + "step": 258910 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010405729248124472, + "loss": 0.0074, + "step": 258920 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010404972478823071, + "loss": 0.0082, + "step": 258930 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010404215709521671, + "loss": 0.0058, + "step": 258940 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010403458940220269, + "loss": 0.007, + "step": 258950 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010402702170918869, + "loss": 0.0074, + "step": 258960 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010401945401617468, + "loss": 0.0096, + "step": 258970 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010401188632316066, + "loss": 0.0112, + "step": 258980 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010400431863014666, + "loss": 0.0079, + "step": 258990 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010399675093713264, + "loss": 0.0105, + "step": 259000 + }, + { + "epoch": 1.31, + "eval_cer": 0.914452788772905, + "eval_loss": 0.006329988595098257, + "eval_runtime": 116.6658, + "eval_samples_per_second": 17.143, + "eval_steps_per_second": 4.286, + "step": 259000 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010398918324411863, + "loss": 0.0085, + "step": 259010 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010398161555110463, + "loss": 0.0072, + "step": 259020 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010397404785809061, + "loss": 0.0092, + "step": 259030 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001039664801650766, + "loss": 0.0097, + "step": 259040 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001039589124720626, + "loss": 0.0078, + "step": 259050 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010395134477904858, + "loss": 0.0083, + "step": 259060 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010394377708603458, + "loss": 0.0086, + "step": 259070 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010393620939302056, + "loss": 0.009, + "step": 259080 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010392864170000655, + "loss": 0.0076, + "step": 259090 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010392107400699255, + "loss": 0.0084, + "step": 259100 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010391350631397853, + "loss": 0.0069, + "step": 259110 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010390593862096452, + "loss": 0.0081, + "step": 259120 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010389837092795052, + "loss": 0.0088, + "step": 259130 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001038908032349365, + "loss": 0.0083, + "step": 259140 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001038832355419225, + "loss": 0.0065, + "step": 259150 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010387566784890849, + "loss": 0.007, + "step": 259160 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010386810015589447, + "loss": 0.0096, + "step": 259170 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010386053246288047, + "loss": 0.0081, + "step": 259180 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010385296476986645, + "loss": 0.0085, + "step": 259190 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010384539707685244, + "loss": 0.0118, + "step": 259200 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010383782938383844, + "loss": 0.0087, + "step": 259210 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010383026169082442, + "loss": 0.0084, + "step": 259220 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010382269399781041, + "loss": 0.0109, + "step": 259230 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010381512630479638, + "loss": 0.0094, + "step": 259240 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010380755861178238, + "loss": 0.007, + "step": 259250 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010379999091876837, + "loss": 0.007, + "step": 259260 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010379242322575435, + "loss": 0.0124, + "step": 259270 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010378485553274035, + "loss": 0.0077, + "step": 259280 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010377728783972633, + "loss": 0.0089, + "step": 259290 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010376972014671233, + "loss": 0.0106, + "step": 259300 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010376215245369832, + "loss": 0.0071, + "step": 259310 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001037545847606843, + "loss": 0.0108, + "step": 259320 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001037470170676703, + "loss": 0.0091, + "step": 259330 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010373944937465629, + "loss": 0.0085, + "step": 259340 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010373188168164227, + "loss": 0.0084, + "step": 259350 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010372431398862827, + "loss": 0.0087, + "step": 259360 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010371674629561425, + "loss": 0.0107, + "step": 259370 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010370917860260024, + "loss": 0.0077, + "step": 259380 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010370161090958624, + "loss": 0.0072, + "step": 259390 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010369404321657222, + "loss": 0.009, + "step": 259400 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010368647552355822, + "loss": 0.0103, + "step": 259410 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010367890783054421, + "loss": 0.0078, + "step": 259420 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010367134013753019, + "loss": 0.0077, + "step": 259430 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010366377244451619, + "loss": 0.0069, + "step": 259440 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010365620475150217, + "loss": 0.0096, + "step": 259450 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010364863705848816, + "loss": 0.0117, + "step": 259460 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010364106936547416, + "loss": 0.0069, + "step": 259470 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010363350167246014, + "loss": 0.0068, + "step": 259480 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010362593397944614, + "loss": 0.008, + "step": 259490 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010361836628643213, + "loss": 0.0072, + "step": 259500 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010361079859341811, + "loss": 0.0092, + "step": 259510 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010360323090040411, + "loss": 0.0104, + "step": 259520 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010359566320739009, + "loss": 0.0086, + "step": 259530 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010358809551437608, + "loss": 0.0081, + "step": 259540 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010358052782136208, + "loss": 0.0067, + "step": 259550 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010357296012834806, + "loss": 0.0122, + "step": 259560 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010356539243533405, + "loss": 0.0065, + "step": 259570 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010355782474232005, + "loss": 0.0083, + "step": 259580 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010355025704930603, + "loss": 0.012, + "step": 259590 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010354268935629203, + "loss": 0.0089, + "step": 259600 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010353512166327802, + "loss": 0.0074, + "step": 259610 + }, + { + "epoch": 1.31, + "learning_rate": 0.000103527553970264, + "loss": 0.0066, + "step": 259620 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010351998627725, + "loss": 0.0082, + "step": 259630 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010351241858423598, + "loss": 0.0114, + "step": 259640 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010350485089122197, + "loss": 0.0073, + "step": 259650 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010349728319820797, + "loss": 0.0078, + "step": 259660 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010348971550519395, + "loss": 0.01, + "step": 259670 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010348214781217995, + "loss": 0.0067, + "step": 259680 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010347458011916594, + "loss": 0.0074, + "step": 259690 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010346701242615192, + "loss": 0.0085, + "step": 259700 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010345944473313792, + "loss": 0.0106, + "step": 259710 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001034518770401239, + "loss": 0.0067, + "step": 259720 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001034443093471099, + "loss": 0.0073, + "step": 259730 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010343674165409589, + "loss": 0.0093, + "step": 259740 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010342917396108187, + "loss": 0.0085, + "step": 259750 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010342160626806786, + "loss": 0.0067, + "step": 259760 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010341403857505386, + "loss": 0.0078, + "step": 259770 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010340647088203984, + "loss": 0.0062, + "step": 259780 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010339890318902584, + "loss": 0.0058, + "step": 259790 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010339133549601182, + "loss": 0.0069, + "step": 259800 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010338376780299781, + "loss": 0.0057, + "step": 259810 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010337620010998381, + "loss": 0.0074, + "step": 259820 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010336863241696979, + "loss": 0.0066, + "step": 259830 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010336106472395578, + "loss": 0.0107, + "step": 259840 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010335349703094178, + "loss": 0.0097, + "step": 259850 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010334592933792776, + "loss": 0.0076, + "step": 259860 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010333836164491374, + "loss": 0.0074, + "step": 259870 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010333079395189972, + "loss": 0.008, + "step": 259880 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010332322625888572, + "loss": 0.0097, + "step": 259890 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001033156585658717, + "loss": 0.0079, + "step": 259900 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001033080908728577, + "loss": 0.01, + "step": 259910 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010330052317984369, + "loss": 0.0061, + "step": 259920 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010329295548682967, + "loss": 0.0081, + "step": 259930 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010328538779381567, + "loss": 0.0092, + "step": 259940 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010327782010080166, + "loss": 0.0076, + "step": 259950 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010327025240778764, + "loss": 0.0087, + "step": 259960 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010326268471477364, + "loss": 0.0088, + "step": 259970 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010325511702175962, + "loss": 0.008, + "step": 259980 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010324754932874561, + "loss": 0.0084, + "step": 259990 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010323998163573161, + "loss": 0.0089, + "step": 260000 + }, + { + "epoch": 1.31, + "eval_cer": 0.9144333808503969, + "eval_loss": 0.006425743922591209, + "eval_runtime": 116.2948, + "eval_samples_per_second": 17.198, + "eval_steps_per_second": 4.299, + "step": 260000 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010323241394271759, + "loss": 0.0065, + "step": 260010 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010322484624970359, + "loss": 0.0073, + "step": 260020 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010321727855668958, + "loss": 0.0094, + "step": 260030 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010320971086367556, + "loss": 0.0076, + "step": 260040 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010320214317066156, + "loss": 0.0106, + "step": 260050 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010319457547764755, + "loss": 0.0063, + "step": 260060 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010318700778463353, + "loss": 0.0092, + "step": 260070 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010317944009161953, + "loss": 0.0087, + "step": 260080 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010317187239860551, + "loss": 0.0069, + "step": 260090 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001031643047055915, + "loss": 0.0072, + "step": 260100 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001031567370125775, + "loss": 0.0109, + "step": 260110 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010314916931956348, + "loss": 0.0062, + "step": 260120 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010314160162654948, + "loss": 0.0117, + "step": 260130 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010313403393353547, + "loss": 0.0076, + "step": 260140 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010312646624052145, + "loss": 0.0078, + "step": 260150 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010311889854750745, + "loss": 0.0064, + "step": 260160 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010311133085449343, + "loss": 0.0069, + "step": 260170 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010310376316147942, + "loss": 0.0074, + "step": 260180 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010309619546846542, + "loss": 0.006, + "step": 260190 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001030886277754514, + "loss": 0.0077, + "step": 260200 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001030810600824374, + "loss": 0.0125, + "step": 260210 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010307349238942339, + "loss": 0.0064, + "step": 260220 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010306592469640937, + "loss": 0.0095, + "step": 260230 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010305835700339537, + "loss": 0.0073, + "step": 260240 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010305078931038135, + "loss": 0.009, + "step": 260250 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010304322161736734, + "loss": 0.0082, + "step": 260260 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010303565392435334, + "loss": 0.0101, + "step": 260270 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010302808623133932, + "loss": 0.0089, + "step": 260280 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010302051853832531, + "loss": 0.0112, + "step": 260290 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010301295084531131, + "loss": 0.01, + "step": 260300 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010300538315229729, + "loss": 0.0062, + "step": 260310 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010299781545928329, + "loss": 0.0077, + "step": 260320 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010299024776626927, + "loss": 0.0075, + "step": 260330 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010298268007325526, + "loss": 0.0063, + "step": 260340 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010297511238024126, + "loss": 0.0087, + "step": 260350 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010296754468722724, + "loss": 0.0087, + "step": 260360 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010295997699421323, + "loss": 0.0085, + "step": 260370 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010295240930119923, + "loss": 0.0076, + "step": 260380 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010294484160818521, + "loss": 0.0075, + "step": 260390 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001029372739151712, + "loss": 0.0074, + "step": 260400 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010292970622215719, + "loss": 0.0087, + "step": 260410 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010292213852914318, + "loss": 0.0075, + "step": 260420 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010291457083612918, + "loss": 0.0067, + "step": 260430 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010290700314311516, + "loss": 0.0107, + "step": 260440 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010289943545010115, + "loss": 0.0068, + "step": 260450 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010289186775708715, + "loss": 0.0061, + "step": 260460 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010288430006407313, + "loss": 0.0101, + "step": 260470 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010287673237105912, + "loss": 0.0093, + "step": 260480 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010286916467804509, + "loss": 0.0081, + "step": 260490 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010286159698503109, + "loss": 0.011, + "step": 260500 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010285402929201708, + "loss": 0.0083, + "step": 260510 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010284646159900306, + "loss": 0.0073, + "step": 260520 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010283889390598906, + "loss": 0.0084, + "step": 260530 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010283132621297504, + "loss": 0.0086, + "step": 260540 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010282375851996104, + "loss": 0.0084, + "step": 260550 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010281619082694703, + "loss": 0.0097, + "step": 260560 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010280862313393301, + "loss": 0.0073, + "step": 260570 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010280105544091901, + "loss": 0.0073, + "step": 260580 + }, + { + "epoch": 1.31, + "learning_rate": 0.000102793487747905, + "loss": 0.0073, + "step": 260590 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010278592005489098, + "loss": 0.0068, + "step": 260600 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010277835236187698, + "loss": 0.0064, + "step": 260610 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010277078466886296, + "loss": 0.0071, + "step": 260620 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010276321697584895, + "loss": 0.0072, + "step": 260630 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010275564928283495, + "loss": 0.0082, + "step": 260640 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010274808158982093, + "loss": 0.0089, + "step": 260650 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010274051389680693, + "loss": 0.0098, + "step": 260660 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010273294620379292, + "loss": 0.0093, + "step": 260670 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001027253785107789, + "loss": 0.0083, + "step": 260680 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001027178108177649, + "loss": 0.0086, + "step": 260690 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010271024312475088, + "loss": 0.0069, + "step": 260700 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010270267543173687, + "loss": 0.0085, + "step": 260710 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010269510773872287, + "loss": 0.0072, + "step": 260720 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010268754004570885, + "loss": 0.008, + "step": 260730 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010267997235269485, + "loss": 0.0065, + "step": 260740 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010267240465968084, + "loss": 0.0075, + "step": 260750 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010266483696666682, + "loss": 0.0094, + "step": 260760 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010265726927365282, + "loss": 0.007, + "step": 260770 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001026497015806388, + "loss": 0.0085, + "step": 260780 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001026421338876248, + "loss": 0.0086, + "step": 260790 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010263456619461079, + "loss": 0.0075, + "step": 260800 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010262699850159677, + "loss": 0.0073, + "step": 260810 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010261943080858276, + "loss": 0.0094, + "step": 260820 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010261186311556876, + "loss": 0.0094, + "step": 260830 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010260429542255474, + "loss": 0.0098, + "step": 260840 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010259672772954074, + "loss": 0.0075, + "step": 260850 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010258916003652672, + "loss": 0.0079, + "step": 260860 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010258159234351271, + "loss": 0.0075, + "step": 260870 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010257402465049871, + "loss": 0.0052, + "step": 260880 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010256645695748469, + "loss": 0.007, + "step": 260890 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010255888926447068, + "loss": 0.007, + "step": 260900 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010255132157145668, + "loss": 0.0083, + "step": 260910 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010254375387844266, + "loss": 0.0072, + "step": 260920 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010253618618542866, + "loss": 0.0082, + "step": 260930 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010252861849241464, + "loss": 0.0076, + "step": 260940 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010252105079940063, + "loss": 0.0086, + "step": 260950 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010251348310638663, + "loss": 0.0079, + "step": 260960 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010250591541337261, + "loss": 0.0087, + "step": 260970 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001024983477203586, + "loss": 0.0076, + "step": 260980 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001024907800273446, + "loss": 0.0073, + "step": 260990 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010248321233433058, + "loss": 0.008, + "step": 261000 + }, + { + "epoch": 1.32, + "eval_cer": 0.9144343512465224, + "eval_loss": 0.006257697008550167, + "eval_runtime": 116.3265, + "eval_samples_per_second": 17.193, + "eval_steps_per_second": 4.298, + "step": 261000 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010247564464131657, + "loss": 0.0073, + "step": 261010 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010246807694830256, + "loss": 0.006, + "step": 261020 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010246050925528855, + "loss": 0.0093, + "step": 261030 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010245294156227455, + "loss": 0.0065, + "step": 261040 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010244537386926053, + "loss": 0.007, + "step": 261050 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010243780617624652, + "loss": 0.0078, + "step": 261060 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010243023848323252, + "loss": 0.0096, + "step": 261070 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001024226707902185, + "loss": 0.0081, + "step": 261080 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001024151030972045, + "loss": 0.0085, + "step": 261090 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010240753540419049, + "loss": 0.007, + "step": 261100 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010239996771117647, + "loss": 0.0109, + "step": 261110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010239240001816245, + "loss": 0.008, + "step": 261120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010238483232514843, + "loss": 0.0087, + "step": 261130 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010237726463213443, + "loss": 0.0107, + "step": 261140 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010236969693912041, + "loss": 0.0088, + "step": 261150 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001023621292461064, + "loss": 0.0075, + "step": 261160 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001023545615530924, + "loss": 0.0109, + "step": 261170 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010234699386007838, + "loss": 0.0081, + "step": 261180 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010233942616706438, + "loss": 0.0108, + "step": 261190 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010233185847405037, + "loss": 0.0106, + "step": 261200 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010232429078103635, + "loss": 0.0068, + "step": 261210 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010231672308802235, + "loss": 0.0084, + "step": 261220 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010230915539500833, + "loss": 0.0085, + "step": 261230 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010230158770199432, + "loss": 0.0077, + "step": 261240 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010229402000898032, + "loss": 0.0085, + "step": 261250 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001022864523159663, + "loss": 0.0076, + "step": 261260 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001022788846229523, + "loss": 0.0069, + "step": 261270 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010227131692993829, + "loss": 0.0076, + "step": 261280 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010226374923692427, + "loss": 0.0106, + "step": 261290 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010225618154391027, + "loss": 0.0093, + "step": 261300 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010224861385089625, + "loss": 0.0078, + "step": 261310 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010224104615788224, + "loss": 0.0058, + "step": 261320 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010223347846486824, + "loss": 0.0078, + "step": 261330 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010222591077185422, + "loss": 0.007, + "step": 261340 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010221834307884022, + "loss": 0.0082, + "step": 261350 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010221077538582621, + "loss": 0.0074, + "step": 261360 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010220320769281219, + "loss": 0.0105, + "step": 261370 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010219563999979819, + "loss": 0.0078, + "step": 261380 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010218807230678417, + "loss": 0.0058, + "step": 261390 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010218050461377016, + "loss": 0.0082, + "step": 261400 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010217293692075616, + "loss": 0.0111, + "step": 261410 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010216536922774214, + "loss": 0.0074, + "step": 261420 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010215780153472813, + "loss": 0.0102, + "step": 261430 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010215023384171413, + "loss": 0.0093, + "step": 261440 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010214266614870011, + "loss": 0.0101, + "step": 261450 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001021350984556861, + "loss": 0.0093, + "step": 261460 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010212753076267209, + "loss": 0.0077, + "step": 261470 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010211996306965808, + "loss": 0.0071, + "step": 261480 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010211239537664408, + "loss": 0.0101, + "step": 261490 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010210482768363006, + "loss": 0.0124, + "step": 261500 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010209725999061605, + "loss": 0.0068, + "step": 261510 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010208969229760205, + "loss": 0.0075, + "step": 261520 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010208212460458803, + "loss": 0.0102, + "step": 261530 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010207455691157403, + "loss": 0.0073, + "step": 261540 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010206698921856002, + "loss": 0.0083, + "step": 261550 + }, + { + "epoch": 1.32, + "learning_rate": 0.000102059421525546, + "loss": 0.0071, + "step": 261560 + }, + { + "epoch": 1.32, + "learning_rate": 0.000102051853832532, + "loss": 0.0079, + "step": 261570 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010204428613951798, + "loss": 0.0086, + "step": 261580 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010203671844650397, + "loss": 0.0088, + "step": 261590 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010202915075348997, + "loss": 0.0087, + "step": 261600 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010202158306047595, + "loss": 0.0099, + "step": 261610 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010201401536746194, + "loss": 0.0086, + "step": 261620 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010200644767444794, + "loss": 0.0104, + "step": 261630 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010199887998143392, + "loss": 0.0064, + "step": 261640 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010199131228841992, + "loss": 0.0099, + "step": 261650 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001019837445954059, + "loss": 0.0097, + "step": 261660 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010197617690239189, + "loss": 0.0084, + "step": 261670 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010196860920937789, + "loss": 0.0091, + "step": 261680 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010196104151636387, + "loss": 0.0067, + "step": 261690 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010195347382334986, + "loss": 0.0099, + "step": 261700 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010194590613033586, + "loss": 0.0085, + "step": 261710 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010193833843732184, + "loss": 0.008, + "step": 261720 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010193077074430784, + "loss": 0.0105, + "step": 261730 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010192320305129382, + "loss": 0.0121, + "step": 261740 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001019156353582798, + "loss": 0.0082, + "step": 261750 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010190806766526578, + "loss": 0.0068, + "step": 261760 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010190049997225177, + "loss": 0.0068, + "step": 261770 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010189293227923777, + "loss": 0.0095, + "step": 261780 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010188536458622375, + "loss": 0.0082, + "step": 261790 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010187779689320975, + "loss": 0.008, + "step": 261800 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010187022920019574, + "loss": 0.008, + "step": 261810 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010186266150718172, + "loss": 0.0063, + "step": 261820 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010185509381416772, + "loss": 0.0083, + "step": 261830 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001018475261211537, + "loss": 0.0105, + "step": 261840 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001018399584281397, + "loss": 0.0063, + "step": 261850 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010183239073512569, + "loss": 0.0074, + "step": 261860 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010182482304211167, + "loss": 0.0089, + "step": 261870 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010181725534909767, + "loss": 0.0067, + "step": 261880 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010180968765608366, + "loss": 0.0063, + "step": 261890 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010180211996306964, + "loss": 0.0063, + "step": 261900 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010179455227005564, + "loss": 0.0086, + "step": 261910 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010178698457704162, + "loss": 0.0092, + "step": 261920 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010177941688402761, + "loss": 0.0069, + "step": 261930 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010177184919101361, + "loss": 0.0105, + "step": 261940 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010176428149799959, + "loss": 0.0083, + "step": 261950 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010175671380498558, + "loss": 0.008, + "step": 261960 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010174914611197158, + "loss": 0.0071, + "step": 261970 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010174157841895756, + "loss": 0.0069, + "step": 261980 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010173401072594356, + "loss": 0.0081, + "step": 261990 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010172644303292955, + "loss": 0.0084, + "step": 262000 + }, + { + "epoch": 1.32, + "eval_cer": 0.9144411440194001, + "eval_loss": 0.006132941693067551, + "eval_runtime": 116.3656, + "eval_samples_per_second": 17.187, + "eval_steps_per_second": 4.297, + "step": 262000 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010171887533991553, + "loss": 0.0079, + "step": 262010 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010171130764690153, + "loss": 0.0081, + "step": 262020 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010170373995388751, + "loss": 0.0077, + "step": 262030 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001016961722608735, + "loss": 0.0089, + "step": 262040 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001016886045678595, + "loss": 0.0096, + "step": 262050 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010168103687484548, + "loss": 0.0128, + "step": 262060 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010167346918183148, + "loss": 0.0066, + "step": 262070 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010166590148881747, + "loss": 0.0071, + "step": 262080 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010165833379580345, + "loss": 0.01, + "step": 262090 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010165076610278945, + "loss": 0.0071, + "step": 262100 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010164319840977543, + "loss": 0.0079, + "step": 262110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010163563071676142, + "loss": 0.0097, + "step": 262120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010162806302374742, + "loss": 0.01, + "step": 262130 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001016204953307334, + "loss": 0.0076, + "step": 262140 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001016129276377194, + "loss": 0.0073, + "step": 262150 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010160535994470539, + "loss": 0.009, + "step": 262160 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010159779225169137, + "loss": 0.0074, + "step": 262170 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010159022455867737, + "loss": 0.0076, + "step": 262180 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010158265686566335, + "loss": 0.0091, + "step": 262190 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010157508917264934, + "loss": 0.0066, + "step": 262200 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010156752147963534, + "loss": 0.0078, + "step": 262210 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010155995378662132, + "loss": 0.0066, + "step": 262220 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010155238609360731, + "loss": 0.0121, + "step": 262230 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010154481840059331, + "loss": 0.0083, + "step": 262240 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010153725070757929, + "loss": 0.0082, + "step": 262250 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010152968301456529, + "loss": 0.0083, + "step": 262260 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010152211532155127, + "loss": 0.0092, + "step": 262270 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010151454762853726, + "loss": 0.0067, + "step": 262280 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010150697993552326, + "loss": 0.0079, + "step": 262290 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010149941224250924, + "loss": 0.0078, + "step": 262300 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010149184454949523, + "loss": 0.0076, + "step": 262310 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010148427685648123, + "loss": 0.0077, + "step": 262320 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010147670916346721, + "loss": 0.0078, + "step": 262330 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001014691414704532, + "loss": 0.0097, + "step": 262340 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010146157377743919, + "loss": 0.008, + "step": 262350 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010145400608442518, + "loss": 0.0074, + "step": 262360 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010144643839141118, + "loss": 0.0095, + "step": 262370 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010143887069839714, + "loss": 0.0099, + "step": 262380 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010143130300538314, + "loss": 0.0085, + "step": 262390 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010142373531236912, + "loss": 0.0069, + "step": 262400 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010141616761935512, + "loss": 0.0079, + "step": 262410 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010140859992634111, + "loss": 0.0086, + "step": 262420 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010140103223332709, + "loss": 0.0066, + "step": 262430 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010139346454031309, + "loss": 0.007, + "step": 262440 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010138589684729908, + "loss": 0.0093, + "step": 262450 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010137832915428506, + "loss": 0.0085, + "step": 262460 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010137076146127106, + "loss": 0.0086, + "step": 262470 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010136319376825704, + "loss": 0.0096, + "step": 262480 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010135562607524303, + "loss": 0.0076, + "step": 262490 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010134805838222903, + "loss": 0.0096, + "step": 262500 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010134049068921501, + "loss": 0.0069, + "step": 262510 + }, + { + "epoch": 1.32, + "learning_rate": 0.000101332922996201, + "loss": 0.0089, + "step": 262520 + }, + { + "epoch": 1.32, + "learning_rate": 0.000101325355303187, + "loss": 0.0072, + "step": 262530 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010131778761017298, + "loss": 0.0078, + "step": 262540 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010131021991715898, + "loss": 0.0075, + "step": 262550 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010130265222414496, + "loss": 0.0106, + "step": 262560 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010129508453113095, + "loss": 0.008, + "step": 262570 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010128751683811695, + "loss": 0.0078, + "step": 262580 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010127994914510293, + "loss": 0.0094, + "step": 262590 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010127238145208893, + "loss": 0.0101, + "step": 262600 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010126481375907492, + "loss": 0.0104, + "step": 262610 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001012572460660609, + "loss": 0.0079, + "step": 262620 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001012496783730469, + "loss": 0.0074, + "step": 262630 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010124211068003288, + "loss": 0.0084, + "step": 262640 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010123454298701887, + "loss": 0.0073, + "step": 262650 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010122697529400487, + "loss": 0.0097, + "step": 262660 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010121940760099085, + "loss": 0.0094, + "step": 262670 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010121183990797684, + "loss": 0.0095, + "step": 262680 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010120427221496284, + "loss": 0.0072, + "step": 262690 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010119670452194882, + "loss": 0.01, + "step": 262700 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010118913682893482, + "loss": 0.0063, + "step": 262710 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001011815691359208, + "loss": 0.0075, + "step": 262720 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010117400144290679, + "loss": 0.007, + "step": 262730 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010116643374989279, + "loss": 0.0105, + "step": 262740 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010115886605687877, + "loss": 0.0103, + "step": 262750 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010115129836386476, + "loss": 0.0081, + "step": 262760 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010114373067085076, + "loss": 0.0076, + "step": 262770 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010113616297783674, + "loss": 0.0075, + "step": 262780 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010112859528482274, + "loss": 0.0089, + "step": 262790 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010112102759180872, + "loss": 0.0095, + "step": 262800 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010111345989879471, + "loss": 0.008, + "step": 262810 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010110589220578071, + "loss": 0.0057, + "step": 262820 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010109832451276669, + "loss": 0.009, + "step": 262830 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010109075681975268, + "loss": 0.0088, + "step": 262840 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010108318912673868, + "loss": 0.0086, + "step": 262850 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010107562143372466, + "loss": 0.0075, + "step": 262860 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010106805374071065, + "loss": 0.0088, + "step": 262870 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010106048604769664, + "loss": 0.0084, + "step": 262880 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010105291835468263, + "loss": 0.0074, + "step": 262890 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010104535066166863, + "loss": 0.0074, + "step": 262900 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010103778296865461, + "loss": 0.0073, + "step": 262910 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001010302152756406, + "loss": 0.0067, + "step": 262920 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001010226475826266, + "loss": 0.0069, + "step": 262930 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010101507988961258, + "loss": 0.0076, + "step": 262940 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010100751219659857, + "loss": 0.0084, + "step": 262950 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010099994450358456, + "loss": 0.0066, + "step": 262960 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010099237681057055, + "loss": 0.0092, + "step": 262970 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010098480911755655, + "loss": 0.0081, + "step": 262980 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010097724142454253, + "loss": 0.0097, + "step": 262990 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010096967373152852, + "loss": 0.0079, + "step": 263000 + }, + { + "epoch": 1.33, + "eval_cer": 0.9144459960000272, + "eval_loss": 0.005995141342282295, + "eval_runtime": 116.2956, + "eval_samples_per_second": 17.198, + "eval_steps_per_second": 4.299, + "step": 263000 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010096210603851449, + "loss": 0.0107, + "step": 263010 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010095453834550048, + "loss": 0.0082, + "step": 263020 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010094697065248648, + "loss": 0.0079, + "step": 263030 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010093940295947246, + "loss": 0.0063, + "step": 263040 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010093183526645846, + "loss": 0.0076, + "step": 263050 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010092426757344445, + "loss": 0.0089, + "step": 263060 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010091669988043043, + "loss": 0.007, + "step": 263070 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010090913218741643, + "loss": 0.0068, + "step": 263080 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010090156449440241, + "loss": 0.0105, + "step": 263090 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001008939968013884, + "loss": 0.0061, + "step": 263100 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001008864291083744, + "loss": 0.0082, + "step": 263110 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010087886141536038, + "loss": 0.0059, + "step": 263120 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010087129372234638, + "loss": 0.0111, + "step": 263130 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010086372602933237, + "loss": 0.008, + "step": 263140 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010085615833631835, + "loss": 0.0089, + "step": 263150 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010084859064330435, + "loss": 0.0064, + "step": 263160 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010084102295029033, + "loss": 0.0078, + "step": 263170 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010083345525727632, + "loss": 0.0066, + "step": 263180 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010082588756426232, + "loss": 0.0072, + "step": 263190 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001008183198712483, + "loss": 0.0086, + "step": 263200 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001008107521782343, + "loss": 0.0093, + "step": 263210 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010080318448522029, + "loss": 0.0078, + "step": 263220 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010079561679220627, + "loss": 0.0067, + "step": 263230 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010078804909919227, + "loss": 0.0096, + "step": 263240 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010078048140617825, + "loss": 0.0106, + "step": 263250 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010077291371316424, + "loss": 0.008, + "step": 263260 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010076534602015024, + "loss": 0.0092, + "step": 263270 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010075777832713622, + "loss": 0.0079, + "step": 263280 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010075021063412221, + "loss": 0.0121, + "step": 263290 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010074264294110821, + "loss": 0.0085, + "step": 263300 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010073507524809419, + "loss": 0.0082, + "step": 263310 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010072750755508019, + "loss": 0.0094, + "step": 263320 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010071993986206617, + "loss": 0.0073, + "step": 263330 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010071237216905216, + "loss": 0.0075, + "step": 263340 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010070480447603816, + "loss": 0.0092, + "step": 263350 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010069723678302414, + "loss": 0.0085, + "step": 263360 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010068966909001013, + "loss": 0.0088, + "step": 263370 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010068210139699613, + "loss": 0.0075, + "step": 263380 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010067453370398211, + "loss": 0.0077, + "step": 263390 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001006669660109681, + "loss": 0.0087, + "step": 263400 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010065939831795409, + "loss": 0.0103, + "step": 263410 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010065183062494008, + "loss": 0.0081, + "step": 263420 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010064426293192608, + "loss": 0.0106, + "step": 263430 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010063669523891206, + "loss": 0.0127, + "step": 263440 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010062912754589805, + "loss": 0.009, + "step": 263450 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010062155985288405, + "loss": 0.0086, + "step": 263460 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010061399215987003, + "loss": 0.009, + "step": 263470 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010060642446685602, + "loss": 0.0115, + "step": 263480 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010059885677384202, + "loss": 0.0085, + "step": 263490 + }, + { + "epoch": 1.33, + "learning_rate": 0.000100591289080828, + "loss": 0.0074, + "step": 263500 + }, + { + "epoch": 1.33, + "learning_rate": 0.000100583721387814, + "loss": 0.009, + "step": 263510 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010057615369479998, + "loss": 0.0085, + "step": 263520 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010056858600178597, + "loss": 0.0081, + "step": 263530 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010056101830877197, + "loss": 0.011, + "step": 263540 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010055345061575795, + "loss": 0.0088, + "step": 263550 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010054588292274394, + "loss": 0.0076, + "step": 263560 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010053831522972994, + "loss": 0.0069, + "step": 263570 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010053074753671592, + "loss": 0.009, + "step": 263580 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010052317984370191, + "loss": 0.0082, + "step": 263590 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001005156121506879, + "loss": 0.007, + "step": 263600 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010050804445767389, + "loss": 0.0092, + "step": 263610 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010050047676465989, + "loss": 0.0074, + "step": 263620 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010049290907164587, + "loss": 0.0065, + "step": 263630 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010048534137863185, + "loss": 0.0078, + "step": 263640 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010047777368561783, + "loss": 0.0085, + "step": 263650 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010047020599260383, + "loss": 0.0087, + "step": 263660 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010046263829958982, + "loss": 0.0087, + "step": 263670 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001004550706065758, + "loss": 0.0082, + "step": 263680 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001004475029135618, + "loss": 0.0078, + "step": 263690 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010043993522054778, + "loss": 0.0103, + "step": 263700 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010043236752753377, + "loss": 0.0103, + "step": 263710 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010042479983451977, + "loss": 0.0072, + "step": 263720 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010041723214150575, + "loss": 0.0084, + "step": 263730 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010040966444849174, + "loss": 0.0122, + "step": 263740 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010040209675547774, + "loss": 0.0067, + "step": 263750 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010039452906246372, + "loss": 0.0081, + "step": 263760 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010038696136944972, + "loss": 0.0093, + "step": 263770 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001003793936764357, + "loss": 0.0117, + "step": 263780 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010037182598342169, + "loss": 0.0089, + "step": 263790 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010036425829040769, + "loss": 0.0079, + "step": 263800 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010035669059739367, + "loss": 0.0093, + "step": 263810 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010034912290437966, + "loss": 0.0076, + "step": 263820 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010034155521136566, + "loss": 0.0092, + "step": 263830 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010033398751835164, + "loss": 0.0089, + "step": 263840 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010032641982533764, + "loss": 0.0073, + "step": 263850 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010031885213232362, + "loss": 0.0075, + "step": 263860 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010031128443930961, + "loss": 0.0099, + "step": 263870 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010030371674629561, + "loss": 0.0102, + "step": 263880 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010029614905328159, + "loss": 0.0074, + "step": 263890 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010028858136026758, + "loss": 0.0074, + "step": 263900 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010028101366725358, + "loss": 0.0062, + "step": 263910 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010027344597423956, + "loss": 0.0081, + "step": 263920 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010026587828122556, + "loss": 0.009, + "step": 263930 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010025831058821155, + "loss": 0.0059, + "step": 263940 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010025074289519753, + "loss": 0.01, + "step": 263950 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010024317520218353, + "loss": 0.0073, + "step": 263960 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010023560750916951, + "loss": 0.0072, + "step": 263970 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001002280398161555, + "loss": 0.0095, + "step": 263980 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001002204721231415, + "loss": 0.0097, + "step": 263990 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010021290443012748, + "loss": 0.0096, + "step": 264000 + }, + { + "epoch": 1.33, + "eval_cer": 0.9144285288697699, + "eval_loss": 0.006162929814308882, + "eval_runtime": 116.2184, + "eval_samples_per_second": 17.209, + "eval_steps_per_second": 4.302, + "step": 264000 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010020533673711347, + "loss": 0.0106, + "step": 264010 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010019776904409947, + "loss": 0.0084, + "step": 264020 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010019020135108545, + "loss": 0.0065, + "step": 264030 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010018263365807145, + "loss": 0.0059, + "step": 264040 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010017506596505743, + "loss": 0.0088, + "step": 264050 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010016749827204342, + "loss": 0.0093, + "step": 264060 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010015993057902942, + "loss": 0.0067, + "step": 264070 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001001523628860154, + "loss": 0.0083, + "step": 264080 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001001447951930014, + "loss": 0.0107, + "step": 264090 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010013722749998739, + "loss": 0.0081, + "step": 264100 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010012965980697337, + "loss": 0.0105, + "step": 264110 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010012209211395937, + "loss": 0.0081, + "step": 264120 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010011452442094535, + "loss": 0.0091, + "step": 264130 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010010695672793134, + "loss": 0.0072, + "step": 264140 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010009938903491734, + "loss": 0.0092, + "step": 264150 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010009182134190332, + "loss": 0.0082, + "step": 264160 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010008425364888931, + "loss": 0.0091, + "step": 264170 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010007668595587531, + "loss": 0.0088, + "step": 264180 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010006911826286129, + "loss": 0.0094, + "step": 264190 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010006155056984728, + "loss": 0.0067, + "step": 264200 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010005398287683327, + "loss": 0.0077, + "step": 264210 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010004641518381926, + "loss": 0.0087, + "step": 264220 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010003884749080526, + "loss": 0.009, + "step": 264230 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010003127979779124, + "loss": 0.011, + "step": 264240 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010002371210477723, + "loss": 0.008, + "step": 264250 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010001614441176323, + "loss": 0.0059, + "step": 264260 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001000085767187492, + "loss": 0.0082, + "step": 264270 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010000100902573519, + "loss": 0.0078, + "step": 264280 + }, + { + "epoch": 1.33, + "learning_rate": 9.999344133272117e-05, + "loss": 0.0097, + "step": 264290 + }, + { + "epoch": 1.33, + "learning_rate": 9.998587363970717e-05, + "loss": 0.0074, + "step": 264300 + }, + { + "epoch": 1.33, + "learning_rate": 9.997830594669315e-05, + "loss": 0.0096, + "step": 264310 + }, + { + "epoch": 1.33, + "learning_rate": 9.997073825367914e-05, + "loss": 0.0086, + "step": 264320 + }, + { + "epoch": 1.33, + "learning_rate": 9.996317056066514e-05, + "loss": 0.0069, + "step": 264330 + }, + { + "epoch": 1.33, + "learning_rate": 9.995560286765112e-05, + "loss": 0.0069, + "step": 264340 + }, + { + "epoch": 1.33, + "learning_rate": 9.994803517463711e-05, + "loss": 0.0063, + "step": 264350 + }, + { + "epoch": 1.33, + "learning_rate": 9.994046748162311e-05, + "loss": 0.0081, + "step": 264360 + }, + { + "epoch": 1.33, + "learning_rate": 9.993289978860909e-05, + "loss": 0.0105, + "step": 264370 + }, + { + "epoch": 1.33, + "learning_rate": 9.992533209559509e-05, + "loss": 0.0073, + "step": 264380 + }, + { + "epoch": 1.33, + "learning_rate": 9.991776440258108e-05, + "loss": 0.0131, + "step": 264390 + }, + { + "epoch": 1.33, + "learning_rate": 9.991019670956706e-05, + "loss": 0.0094, + "step": 264400 + }, + { + "epoch": 1.33, + "learning_rate": 9.990262901655306e-05, + "loss": 0.0091, + "step": 264410 + }, + { + "epoch": 1.33, + "learning_rate": 9.989506132353904e-05, + "loss": 0.0088, + "step": 264420 + }, + { + "epoch": 1.33, + "learning_rate": 9.988749363052503e-05, + "loss": 0.0077, + "step": 264430 + }, + { + "epoch": 1.33, + "learning_rate": 9.987992593751103e-05, + "loss": 0.0069, + "step": 264440 + }, + { + "epoch": 1.33, + "learning_rate": 9.987235824449701e-05, + "loss": 0.0083, + "step": 264450 + }, + { + "epoch": 1.33, + "learning_rate": 9.9864790551483e-05, + "loss": 0.0086, + "step": 264460 + }, + { + "epoch": 1.33, + "learning_rate": 9.9857222858469e-05, + "loss": 0.008, + "step": 264470 + }, + { + "epoch": 1.33, + "learning_rate": 9.984965516545498e-05, + "loss": 0.0065, + "step": 264480 + }, + { + "epoch": 1.33, + "learning_rate": 9.984208747244098e-05, + "loss": 0.008, + "step": 264490 + }, + { + "epoch": 1.33, + "learning_rate": 9.983451977942696e-05, + "loss": 0.0077, + "step": 264500 + }, + { + "epoch": 1.33, + "learning_rate": 9.982695208641295e-05, + "loss": 0.0082, + "step": 264510 + }, + { + "epoch": 1.33, + "learning_rate": 9.981938439339895e-05, + "loss": 0.0118, + "step": 264520 + }, + { + "epoch": 1.33, + "learning_rate": 9.981181670038493e-05, + "loss": 0.0074, + "step": 264530 + }, + { + "epoch": 1.33, + "learning_rate": 9.980424900737092e-05, + "loss": 0.0071, + "step": 264540 + }, + { + "epoch": 1.33, + "learning_rate": 9.979668131435692e-05, + "loss": 0.0089, + "step": 264550 + }, + { + "epoch": 1.33, + "learning_rate": 9.97891136213429e-05, + "loss": 0.0074, + "step": 264560 + }, + { + "epoch": 1.33, + "learning_rate": 9.97815459283289e-05, + "loss": 0.0085, + "step": 264570 + }, + { + "epoch": 1.33, + "learning_rate": 9.977397823531488e-05, + "loss": 0.0082, + "step": 264580 + }, + { + "epoch": 1.33, + "learning_rate": 9.976641054230087e-05, + "loss": 0.0061, + "step": 264590 + }, + { + "epoch": 1.33, + "learning_rate": 9.975884284928687e-05, + "loss": 0.0083, + "step": 264600 + }, + { + "epoch": 1.33, + "learning_rate": 9.975127515627285e-05, + "loss": 0.0083, + "step": 264610 + }, + { + "epoch": 1.34, + "learning_rate": 9.974370746325884e-05, + "loss": 0.0076, + "step": 264620 + }, + { + "epoch": 1.34, + "learning_rate": 9.973613977024484e-05, + "loss": 0.0074, + "step": 264630 + }, + { + "epoch": 1.34, + "learning_rate": 9.972857207723082e-05, + "loss": 0.0087, + "step": 264640 + }, + { + "epoch": 1.34, + "learning_rate": 9.972100438421682e-05, + "loss": 0.0094, + "step": 264650 + }, + { + "epoch": 1.34, + "learning_rate": 9.97134366912028e-05, + "loss": 0.0108, + "step": 264660 + }, + { + "epoch": 1.34, + "learning_rate": 9.970586899818879e-05, + "loss": 0.007, + "step": 264670 + }, + { + "epoch": 1.34, + "learning_rate": 9.969830130517479e-05, + "loss": 0.0077, + "step": 264680 + }, + { + "epoch": 1.34, + "learning_rate": 9.969073361216077e-05, + "loss": 0.0071, + "step": 264690 + }, + { + "epoch": 1.34, + "learning_rate": 9.968316591914676e-05, + "loss": 0.0087, + "step": 264700 + }, + { + "epoch": 1.34, + "learning_rate": 9.967559822613276e-05, + "loss": 0.0091, + "step": 264710 + }, + { + "epoch": 1.34, + "learning_rate": 9.966803053311874e-05, + "loss": 0.0084, + "step": 264720 + }, + { + "epoch": 1.34, + "learning_rate": 9.966046284010473e-05, + "loss": 0.0077, + "step": 264730 + }, + { + "epoch": 1.34, + "learning_rate": 9.965289514709072e-05, + "loss": 0.0085, + "step": 264740 + }, + { + "epoch": 1.34, + "learning_rate": 9.964532745407671e-05, + "loss": 0.0071, + "step": 264750 + }, + { + "epoch": 1.34, + "learning_rate": 9.96377597610627e-05, + "loss": 0.0077, + "step": 264760 + }, + { + "epoch": 1.34, + "learning_rate": 9.963019206804869e-05, + "loss": 0.0073, + "step": 264770 + }, + { + "epoch": 1.34, + "learning_rate": 9.962262437503468e-05, + "loss": 0.0074, + "step": 264780 + }, + { + "epoch": 1.34, + "learning_rate": 9.961505668202068e-05, + "loss": 0.0085, + "step": 264790 + }, + { + "epoch": 1.34, + "learning_rate": 9.960748898900666e-05, + "loss": 0.0112, + "step": 264800 + }, + { + "epoch": 1.34, + "learning_rate": 9.959992129599265e-05, + "loss": 0.0086, + "step": 264810 + }, + { + "epoch": 1.34, + "learning_rate": 9.959235360297864e-05, + "loss": 0.007, + "step": 264820 + }, + { + "epoch": 1.34, + "learning_rate": 9.958478590996463e-05, + "loss": 0.0079, + "step": 264830 + }, + { + "epoch": 1.34, + "learning_rate": 9.957721821695063e-05, + "loss": 0.0064, + "step": 264840 + }, + { + "epoch": 1.34, + "learning_rate": 9.95696505239366e-05, + "loss": 0.0075, + "step": 264850 + }, + { + "epoch": 1.34, + "learning_rate": 9.95620828309226e-05, + "loss": 0.0078, + "step": 264860 + }, + { + "epoch": 1.34, + "learning_rate": 9.95545151379086e-05, + "loss": 0.0091, + "step": 264870 + }, + { + "epoch": 1.34, + "learning_rate": 9.954694744489458e-05, + "loss": 0.0095, + "step": 264880 + }, + { + "epoch": 1.34, + "learning_rate": 9.953937975188056e-05, + "loss": 0.0084, + "step": 264890 + }, + { + "epoch": 1.34, + "learning_rate": 9.953181205886654e-05, + "loss": 0.0089, + "step": 264900 + }, + { + "epoch": 1.34, + "learning_rate": 9.952424436585254e-05, + "loss": 0.0081, + "step": 264910 + }, + { + "epoch": 1.34, + "learning_rate": 9.951667667283853e-05, + "loss": 0.0067, + "step": 264920 + }, + { + "epoch": 1.34, + "learning_rate": 9.950910897982451e-05, + "loss": 0.0083, + "step": 264930 + }, + { + "epoch": 1.34, + "learning_rate": 9.950154128681051e-05, + "loss": 0.0112, + "step": 264940 + }, + { + "epoch": 1.34, + "learning_rate": 9.949397359379649e-05, + "loss": 0.0071, + "step": 264950 + }, + { + "epoch": 1.34, + "learning_rate": 9.948640590078248e-05, + "loss": 0.0082, + "step": 264960 + }, + { + "epoch": 1.34, + "learning_rate": 9.947883820776848e-05, + "loss": 0.0069, + "step": 264970 + }, + { + "epoch": 1.34, + "learning_rate": 9.947127051475446e-05, + "loss": 0.0074, + "step": 264980 + }, + { + "epoch": 1.34, + "learning_rate": 9.946370282174046e-05, + "loss": 0.0087, + "step": 264990 + }, + { + "epoch": 1.34, + "learning_rate": 9.945613512872645e-05, + "loss": 0.0052, + "step": 265000 + }, + { + "epoch": 1.34, + "eval_cer": 0.9144372624348985, + "eval_loss": 0.006056656129658222, + "eval_runtime": 116.3287, + "eval_samples_per_second": 17.193, + "eval_steps_per_second": 4.298, + "step": 265000 + }, + { + "epoch": 1.34, + "learning_rate": 9.944856743571243e-05, + "loss": 0.0073, + "step": 265010 + }, + { + "epoch": 1.34, + "learning_rate": 9.944099974269843e-05, + "loss": 0.0094, + "step": 265020 + }, + { + "epoch": 1.34, + "learning_rate": 9.943343204968441e-05, + "loss": 0.0105, + "step": 265030 + }, + { + "epoch": 1.34, + "learning_rate": 9.94258643566704e-05, + "loss": 0.007, + "step": 265040 + }, + { + "epoch": 1.34, + "learning_rate": 9.94182966636564e-05, + "loss": 0.0087, + "step": 265050 + }, + { + "epoch": 1.34, + "learning_rate": 9.941072897064238e-05, + "loss": 0.0078, + "step": 265060 + }, + { + "epoch": 1.34, + "learning_rate": 9.940316127762837e-05, + "loss": 0.007, + "step": 265070 + }, + { + "epoch": 1.34, + "learning_rate": 9.939559358461437e-05, + "loss": 0.0071, + "step": 265080 + }, + { + "epoch": 1.34, + "learning_rate": 9.938802589160035e-05, + "loss": 0.0092, + "step": 265090 + }, + { + "epoch": 1.34, + "learning_rate": 9.938045819858635e-05, + "loss": 0.0069, + "step": 265100 + }, + { + "epoch": 1.34, + "learning_rate": 9.937289050557233e-05, + "loss": 0.0077, + "step": 265110 + }, + { + "epoch": 1.34, + "learning_rate": 9.936532281255832e-05, + "loss": 0.0051, + "step": 265120 + }, + { + "epoch": 1.34, + "learning_rate": 9.935775511954432e-05, + "loss": 0.0083, + "step": 265130 + }, + { + "epoch": 1.34, + "learning_rate": 9.93501874265303e-05, + "loss": 0.0099, + "step": 265140 + }, + { + "epoch": 1.34, + "learning_rate": 9.93426197335163e-05, + "loss": 0.007, + "step": 265150 + }, + { + "epoch": 1.34, + "learning_rate": 9.933505204050229e-05, + "loss": 0.0064, + "step": 265160 + }, + { + "epoch": 1.34, + "learning_rate": 9.932748434748827e-05, + "loss": 0.0075, + "step": 265170 + }, + { + "epoch": 1.34, + "learning_rate": 9.931991665447427e-05, + "loss": 0.0079, + "step": 265180 + }, + { + "epoch": 1.34, + "learning_rate": 9.931234896146025e-05, + "loss": 0.0083, + "step": 265190 + }, + { + "epoch": 1.34, + "learning_rate": 9.930478126844624e-05, + "loss": 0.0106, + "step": 265200 + }, + { + "epoch": 1.34, + "learning_rate": 9.929721357543224e-05, + "loss": 0.0072, + "step": 265210 + }, + { + "epoch": 1.34, + "learning_rate": 9.928964588241822e-05, + "loss": 0.0075, + "step": 265220 + }, + { + "epoch": 1.34, + "learning_rate": 9.928207818940421e-05, + "loss": 0.0092, + "step": 265230 + }, + { + "epoch": 1.34, + "learning_rate": 9.927451049639021e-05, + "loss": 0.0089, + "step": 265240 + }, + { + "epoch": 1.34, + "learning_rate": 9.926694280337619e-05, + "loss": 0.0072, + "step": 265250 + }, + { + "epoch": 1.34, + "learning_rate": 9.925937511036218e-05, + "loss": 0.0057, + "step": 265260 + }, + { + "epoch": 1.34, + "learning_rate": 9.925180741734817e-05, + "loss": 0.0066, + "step": 265270 + }, + { + "epoch": 1.34, + "learning_rate": 9.924423972433416e-05, + "loss": 0.0104, + "step": 265280 + }, + { + "epoch": 1.34, + "learning_rate": 9.923667203132016e-05, + "loss": 0.0071, + "step": 265290 + }, + { + "epoch": 1.34, + "learning_rate": 9.922910433830614e-05, + "loss": 0.0096, + "step": 265300 + }, + { + "epoch": 1.34, + "learning_rate": 9.922153664529213e-05, + "loss": 0.0097, + "step": 265310 + }, + { + "epoch": 1.34, + "learning_rate": 9.921396895227813e-05, + "loss": 0.0077, + "step": 265320 + }, + { + "epoch": 1.34, + "learning_rate": 9.920640125926411e-05, + "loss": 0.0084, + "step": 265330 + }, + { + "epoch": 1.34, + "learning_rate": 9.91988335662501e-05, + "loss": 0.0076, + "step": 265340 + }, + { + "epoch": 1.34, + "learning_rate": 9.919126587323609e-05, + "loss": 0.0081, + "step": 265350 + }, + { + "epoch": 1.34, + "learning_rate": 9.918369818022208e-05, + "loss": 0.0087, + "step": 265360 + }, + { + "epoch": 1.34, + "learning_rate": 9.917613048720808e-05, + "loss": 0.0095, + "step": 265370 + }, + { + "epoch": 1.34, + "learning_rate": 9.916856279419406e-05, + "loss": 0.007, + "step": 265380 + }, + { + "epoch": 1.34, + "learning_rate": 9.916099510118005e-05, + "loss": 0.0076, + "step": 265390 + }, + { + "epoch": 1.34, + "learning_rate": 9.915342740816605e-05, + "loss": 0.0075, + "step": 265400 + }, + { + "epoch": 1.34, + "learning_rate": 9.914585971515203e-05, + "loss": 0.0089, + "step": 265410 + }, + { + "epoch": 1.34, + "learning_rate": 9.913829202213802e-05, + "loss": 0.0094, + "step": 265420 + }, + { + "epoch": 1.34, + "learning_rate": 9.913072432912402e-05, + "loss": 0.0081, + "step": 265430 + }, + { + "epoch": 1.34, + "learning_rate": 9.912315663611e-05, + "loss": 0.0077, + "step": 265440 + }, + { + "epoch": 1.34, + "learning_rate": 9.9115588943096e-05, + "loss": 0.0087, + "step": 265450 + }, + { + "epoch": 1.34, + "learning_rate": 9.910802125008198e-05, + "loss": 0.0096, + "step": 265460 + }, + { + "epoch": 1.34, + "learning_rate": 9.910045355706797e-05, + "loss": 0.0096, + "step": 265470 + }, + { + "epoch": 1.34, + "learning_rate": 9.909288586405397e-05, + "loss": 0.0078, + "step": 265480 + }, + { + "epoch": 1.34, + "learning_rate": 9.908531817103995e-05, + "loss": 0.0092, + "step": 265490 + }, + { + "epoch": 1.34, + "learning_rate": 9.907775047802594e-05, + "loss": 0.0088, + "step": 265500 + }, + { + "epoch": 1.34, + "learning_rate": 9.907018278501194e-05, + "loss": 0.0063, + "step": 265510 + }, + { + "epoch": 1.34, + "learning_rate": 9.90626150919979e-05, + "loss": 0.0074, + "step": 265520 + }, + { + "epoch": 1.34, + "learning_rate": 9.90550473989839e-05, + "loss": 0.0072, + "step": 265530 + }, + { + "epoch": 1.34, + "learning_rate": 9.904747970596988e-05, + "loss": 0.0077, + "step": 265540 + }, + { + "epoch": 1.34, + "learning_rate": 9.903991201295588e-05, + "loss": 0.0075, + "step": 265550 + }, + { + "epoch": 1.34, + "learning_rate": 9.903234431994186e-05, + "loss": 0.0068, + "step": 265560 + }, + { + "epoch": 1.34, + "learning_rate": 9.902477662692785e-05, + "loss": 0.0077, + "step": 265570 + }, + { + "epoch": 1.34, + "learning_rate": 9.901720893391385e-05, + "loss": 0.0083, + "step": 265580 + }, + { + "epoch": 1.34, + "learning_rate": 9.900964124089983e-05, + "loss": 0.0065, + "step": 265590 + }, + { + "epoch": 1.34, + "learning_rate": 9.900207354788582e-05, + "loss": 0.0084, + "step": 265600 + }, + { + "epoch": 1.34, + "learning_rate": 9.899450585487182e-05, + "loss": 0.0069, + "step": 265610 + }, + { + "epoch": 1.34, + "learning_rate": 9.89869381618578e-05, + "loss": 0.0091, + "step": 265620 + }, + { + "epoch": 1.34, + "learning_rate": 9.89793704688438e-05, + "loss": 0.0109, + "step": 265630 + }, + { + "epoch": 1.34, + "learning_rate": 9.897180277582978e-05, + "loss": 0.007, + "step": 265640 + }, + { + "epoch": 1.34, + "learning_rate": 9.896423508281577e-05, + "loss": 0.0075, + "step": 265650 + }, + { + "epoch": 1.34, + "learning_rate": 9.895666738980177e-05, + "loss": 0.008, + "step": 265660 + }, + { + "epoch": 1.34, + "learning_rate": 9.894909969678775e-05, + "loss": 0.0115, + "step": 265670 + }, + { + "epoch": 1.34, + "learning_rate": 9.894153200377374e-05, + "loss": 0.0075, + "step": 265680 + }, + { + "epoch": 1.34, + "learning_rate": 9.893396431075974e-05, + "loss": 0.0077, + "step": 265690 + }, + { + "epoch": 1.34, + "learning_rate": 9.892639661774572e-05, + "loss": 0.0103, + "step": 265700 + }, + { + "epoch": 1.34, + "learning_rate": 9.891882892473172e-05, + "loss": 0.0092, + "step": 265710 + }, + { + "epoch": 1.34, + "learning_rate": 9.89112612317177e-05, + "loss": 0.0081, + "step": 265720 + }, + { + "epoch": 1.34, + "learning_rate": 9.890369353870369e-05, + "loss": 0.0108, + "step": 265730 + }, + { + "epoch": 1.34, + "learning_rate": 9.889612584568969e-05, + "loss": 0.0098, + "step": 265740 + }, + { + "epoch": 1.34, + "learning_rate": 9.888855815267567e-05, + "loss": 0.0092, + "step": 265750 + }, + { + "epoch": 1.34, + "learning_rate": 9.888099045966166e-05, + "loss": 0.0099, + "step": 265760 + }, + { + "epoch": 1.34, + "learning_rate": 9.887342276664766e-05, + "loss": 0.0094, + "step": 265770 + }, + { + "epoch": 1.34, + "learning_rate": 9.886585507363364e-05, + "loss": 0.0071, + "step": 265780 + }, + { + "epoch": 1.34, + "learning_rate": 9.885828738061963e-05, + "loss": 0.0105, + "step": 265790 + }, + { + "epoch": 1.34, + "learning_rate": 9.885071968760562e-05, + "loss": 0.0069, + "step": 265800 + }, + { + "epoch": 1.34, + "learning_rate": 9.884315199459161e-05, + "loss": 0.01, + "step": 265810 + }, + { + "epoch": 1.34, + "learning_rate": 9.88355843015776e-05, + "loss": 0.0071, + "step": 265820 + }, + { + "epoch": 1.34, + "learning_rate": 9.882801660856359e-05, + "loss": 0.0072, + "step": 265830 + }, + { + "epoch": 1.34, + "learning_rate": 9.882044891554958e-05, + "loss": 0.0092, + "step": 265840 + }, + { + "epoch": 1.34, + "learning_rate": 9.881288122253558e-05, + "loss": 0.0076, + "step": 265850 + }, + { + "epoch": 1.34, + "learning_rate": 9.880531352952156e-05, + "loss": 0.0083, + "step": 265860 + }, + { + "epoch": 1.34, + "learning_rate": 9.879774583650755e-05, + "loss": 0.0085, + "step": 265870 + }, + { + "epoch": 1.34, + "learning_rate": 9.879017814349355e-05, + "loss": 0.0094, + "step": 265880 + }, + { + "epoch": 1.34, + "learning_rate": 9.878261045047953e-05, + "loss": 0.0073, + "step": 265890 + }, + { + "epoch": 1.34, + "learning_rate": 9.877504275746553e-05, + "loss": 0.0069, + "step": 265900 + }, + { + "epoch": 1.34, + "learning_rate": 9.876747506445151e-05, + "loss": 0.0099, + "step": 265910 + }, + { + "epoch": 1.34, + "learning_rate": 9.87599073714375e-05, + "loss": 0.0094, + "step": 265920 + }, + { + "epoch": 1.34, + "learning_rate": 9.87523396784235e-05, + "loss": 0.0089, + "step": 265930 + }, + { + "epoch": 1.34, + "learning_rate": 9.874477198540948e-05, + "loss": 0.0088, + "step": 265940 + }, + { + "epoch": 1.34, + "learning_rate": 9.873720429239547e-05, + "loss": 0.0088, + "step": 265950 + }, + { + "epoch": 1.34, + "learning_rate": 9.872963659938147e-05, + "loss": 0.0059, + "step": 265960 + }, + { + "epoch": 1.34, + "learning_rate": 9.872206890636745e-05, + "loss": 0.0053, + "step": 265970 + }, + { + "epoch": 1.34, + "learning_rate": 9.871450121335344e-05, + "loss": 0.0104, + "step": 265980 + }, + { + "epoch": 1.34, + "learning_rate": 9.870693352033943e-05, + "loss": 0.0073, + "step": 265990 + }, + { + "epoch": 1.34, + "learning_rate": 9.869936582732542e-05, + "loss": 0.0097, + "step": 266000 + }, + { + "epoch": 1.34, + "eval_cer": 0.9144401736232748, + "eval_loss": 0.0059706708416342735, + "eval_runtime": 116.3669, + "eval_samples_per_second": 17.187, + "eval_steps_per_second": 4.297, + "step": 266000 + }, + { + "epoch": 1.34, + "learning_rate": 9.869179813431142e-05, + "loss": 0.0073, + "step": 266010 + }, + { + "epoch": 1.34, + "learning_rate": 9.86842304412974e-05, + "loss": 0.0072, + "step": 266020 + }, + { + "epoch": 1.34, + "learning_rate": 9.867666274828339e-05, + "loss": 0.0052, + "step": 266030 + }, + { + "epoch": 1.34, + "learning_rate": 9.866909505526939e-05, + "loss": 0.0078, + "step": 266040 + }, + { + "epoch": 1.34, + "learning_rate": 9.866152736225537e-05, + "loss": 0.0076, + "step": 266050 + }, + { + "epoch": 1.34, + "learning_rate": 9.865395966924136e-05, + "loss": 0.0073, + "step": 266060 + }, + { + "epoch": 1.34, + "learning_rate": 9.864639197622735e-05, + "loss": 0.0083, + "step": 266070 + }, + { + "epoch": 1.34, + "learning_rate": 9.863882428321334e-05, + "loss": 0.009, + "step": 266080 + }, + { + "epoch": 1.34, + "learning_rate": 9.863125659019934e-05, + "loss": 0.0075, + "step": 266090 + }, + { + "epoch": 1.34, + "learning_rate": 9.862368889718532e-05, + "loss": 0.0103, + "step": 266100 + }, + { + "epoch": 1.34, + "learning_rate": 9.861612120417131e-05, + "loss": 0.0073, + "step": 266110 + }, + { + "epoch": 1.34, + "learning_rate": 9.860855351115731e-05, + "loss": 0.0117, + "step": 266120 + }, + { + "epoch": 1.34, + "learning_rate": 9.860098581814329e-05, + "loss": 0.0078, + "step": 266130 + }, + { + "epoch": 1.34, + "learning_rate": 9.859341812512928e-05, + "loss": 0.0095, + "step": 266140 + }, + { + "epoch": 1.34, + "learning_rate": 9.858585043211525e-05, + "loss": 0.009, + "step": 266150 + }, + { + "epoch": 1.34, + "learning_rate": 9.857828273910125e-05, + "loss": 0.0063, + "step": 266160 + }, + { + "epoch": 1.34, + "learning_rate": 9.857071504608723e-05, + "loss": 0.0091, + "step": 266170 + }, + { + "epoch": 1.34, + "learning_rate": 9.856314735307322e-05, + "loss": 0.007, + "step": 266180 + }, + { + "epoch": 1.34, + "learning_rate": 9.855557966005922e-05, + "loss": 0.0086, + "step": 266190 + }, + { + "epoch": 1.34, + "learning_rate": 9.85480119670452e-05, + "loss": 0.0069, + "step": 266200 + }, + { + "epoch": 1.34, + "learning_rate": 9.85404442740312e-05, + "loss": 0.0078, + "step": 266210 + }, + { + "epoch": 1.34, + "learning_rate": 9.853287658101719e-05, + "loss": 0.0068, + "step": 266220 + }, + { + "epoch": 1.34, + "learning_rate": 9.852530888800317e-05, + "loss": 0.0091, + "step": 266230 + }, + { + "epoch": 1.34, + "learning_rate": 9.851774119498917e-05, + "loss": 0.0066, + "step": 266240 + }, + { + "epoch": 1.34, + "learning_rate": 9.851017350197515e-05, + "loss": 0.0071, + "step": 266250 + }, + { + "epoch": 1.34, + "learning_rate": 9.850260580896114e-05, + "loss": 0.0086, + "step": 266260 + }, + { + "epoch": 1.34, + "learning_rate": 9.849503811594714e-05, + "loss": 0.0057, + "step": 266270 + }, + { + "epoch": 1.34, + "learning_rate": 9.848747042293312e-05, + "loss": 0.0054, + "step": 266280 + }, + { + "epoch": 1.34, + "learning_rate": 9.847990272991911e-05, + "loss": 0.0068, + "step": 266290 + }, + { + "epoch": 1.34, + "learning_rate": 9.847233503690511e-05, + "loss": 0.0069, + "step": 266300 + }, + { + "epoch": 1.34, + "learning_rate": 9.846476734389109e-05, + "loss": 0.0081, + "step": 266310 + }, + { + "epoch": 1.34, + "learning_rate": 9.845719965087708e-05, + "loss": 0.0083, + "step": 266320 + }, + { + "epoch": 1.34, + "learning_rate": 9.844963195786308e-05, + "loss": 0.0089, + "step": 266330 + }, + { + "epoch": 1.34, + "learning_rate": 9.844206426484906e-05, + "loss": 0.008, + "step": 266340 + }, + { + "epoch": 1.34, + "learning_rate": 9.843449657183506e-05, + "loss": 0.006, + "step": 266350 + }, + { + "epoch": 1.34, + "learning_rate": 9.842692887882104e-05, + "loss": 0.0073, + "step": 266360 + }, + { + "epoch": 1.34, + "learning_rate": 9.841936118580703e-05, + "loss": 0.0086, + "step": 266370 + }, + { + "epoch": 1.34, + "learning_rate": 9.841179349279303e-05, + "loss": 0.0073, + "step": 266380 + }, + { + "epoch": 1.34, + "learning_rate": 9.840422579977901e-05, + "loss": 0.0072, + "step": 266390 + }, + { + "epoch": 1.34, + "learning_rate": 9.8396658106765e-05, + "loss": 0.0069, + "step": 266400 + }, + { + "epoch": 1.34, + "learning_rate": 9.8389090413751e-05, + "loss": 0.0091, + "step": 266410 + }, + { + "epoch": 1.34, + "learning_rate": 9.838152272073698e-05, + "loss": 0.0104, + "step": 266420 + }, + { + "epoch": 1.34, + "learning_rate": 9.837395502772298e-05, + "loss": 0.0079, + "step": 266430 + }, + { + "epoch": 1.34, + "learning_rate": 9.836638733470896e-05, + "loss": 0.0057, + "step": 266440 + }, + { + "epoch": 1.34, + "learning_rate": 9.835881964169495e-05, + "loss": 0.0086, + "step": 266450 + }, + { + "epoch": 1.34, + "learning_rate": 9.835125194868095e-05, + "loss": 0.0064, + "step": 266460 + }, + { + "epoch": 1.34, + "learning_rate": 9.834368425566693e-05, + "loss": 0.0084, + "step": 266470 + }, + { + "epoch": 1.34, + "learning_rate": 9.833611656265292e-05, + "loss": 0.0075, + "step": 266480 + }, + { + "epoch": 1.34, + "learning_rate": 9.832854886963892e-05, + "loss": 0.0102, + "step": 266490 + }, + { + "epoch": 1.34, + "learning_rate": 9.83209811766249e-05, + "loss": 0.0078, + "step": 266500 + }, + { + "epoch": 1.34, + "learning_rate": 9.83134134836109e-05, + "loss": 0.0077, + "step": 266510 + }, + { + "epoch": 1.34, + "learning_rate": 9.830584579059688e-05, + "loss": 0.0062, + "step": 266520 + }, + { + "epoch": 1.34, + "learning_rate": 9.829827809758287e-05, + "loss": 0.0086, + "step": 266530 + }, + { + "epoch": 1.34, + "learning_rate": 9.829071040456887e-05, + "loss": 0.009, + "step": 266540 + }, + { + "epoch": 1.34, + "learning_rate": 9.828314271155485e-05, + "loss": 0.0093, + "step": 266550 + }, + { + "epoch": 1.34, + "learning_rate": 9.827557501854084e-05, + "loss": 0.0072, + "step": 266560 + }, + { + "epoch": 1.34, + "learning_rate": 9.826800732552684e-05, + "loss": 0.0083, + "step": 266570 + }, + { + "epoch": 1.34, + "learning_rate": 9.826043963251282e-05, + "loss": 0.0077, + "step": 266580 + }, + { + "epoch": 1.34, + "learning_rate": 9.825287193949881e-05, + "loss": 0.0084, + "step": 266590 + }, + { + "epoch": 1.35, + "learning_rate": 9.82453042464848e-05, + "loss": 0.0082, + "step": 266600 + }, + { + "epoch": 1.35, + "learning_rate": 9.823773655347079e-05, + "loss": 0.0086, + "step": 266610 + }, + { + "epoch": 1.35, + "learning_rate": 9.823016886045679e-05, + "loss": 0.0064, + "step": 266620 + }, + { + "epoch": 1.35, + "learning_rate": 9.822260116744277e-05, + "loss": 0.0083, + "step": 266630 + }, + { + "epoch": 1.35, + "learning_rate": 9.821503347442876e-05, + "loss": 0.0085, + "step": 266640 + }, + { + "epoch": 1.35, + "learning_rate": 9.820746578141476e-05, + "loss": 0.0081, + "step": 266650 + }, + { + "epoch": 1.35, + "learning_rate": 9.819989808840074e-05, + "loss": 0.0196, + "step": 266660 + }, + { + "epoch": 1.35, + "learning_rate": 9.819233039538673e-05, + "loss": 0.0096, + "step": 266670 + }, + { + "epoch": 1.35, + "learning_rate": 9.818476270237271e-05, + "loss": 0.007, + "step": 266680 + }, + { + "epoch": 1.35, + "learning_rate": 9.817719500935871e-05, + "loss": 0.0066, + "step": 266690 + }, + { + "epoch": 1.35, + "learning_rate": 9.81696273163447e-05, + "loss": 0.0086, + "step": 266700 + }, + { + "epoch": 1.35, + "learning_rate": 9.816205962333069e-05, + "loss": 0.005, + "step": 266710 + }, + { + "epoch": 1.35, + "learning_rate": 9.815449193031668e-05, + "loss": 0.009, + "step": 266720 + }, + { + "epoch": 1.35, + "learning_rate": 9.814692423730268e-05, + "loss": 0.0079, + "step": 266730 + }, + { + "epoch": 1.35, + "learning_rate": 9.813935654428866e-05, + "loss": 0.0074, + "step": 266740 + }, + { + "epoch": 1.35, + "learning_rate": 9.813178885127465e-05, + "loss": 0.0069, + "step": 266750 + }, + { + "epoch": 1.35, + "learning_rate": 9.812422115826063e-05, + "loss": 0.0085, + "step": 266760 + }, + { + "epoch": 1.35, + "learning_rate": 9.811665346524663e-05, + "loss": 0.0131, + "step": 266770 + }, + { + "epoch": 1.35, + "learning_rate": 9.810908577223261e-05, + "loss": 0.0096, + "step": 266780 + }, + { + "epoch": 1.35, + "learning_rate": 9.810151807921859e-05, + "loss": 0.0064, + "step": 266790 + }, + { + "epoch": 1.35, + "learning_rate": 9.809395038620459e-05, + "loss": 0.0065, + "step": 266800 + }, + { + "epoch": 1.35, + "learning_rate": 9.808638269319057e-05, + "loss": 0.0081, + "step": 266810 + }, + { + "epoch": 1.35, + "learning_rate": 9.807881500017656e-05, + "loss": 0.007, + "step": 266820 + }, + { + "epoch": 1.35, + "learning_rate": 9.807124730716256e-05, + "loss": 0.0081, + "step": 266830 + }, + { + "epoch": 1.35, + "learning_rate": 9.806367961414854e-05, + "loss": 0.0087, + "step": 266840 + }, + { + "epoch": 1.35, + "learning_rate": 9.805611192113454e-05, + "loss": 0.0071, + "step": 266850 + }, + { + "epoch": 1.35, + "learning_rate": 9.804854422812053e-05, + "loss": 0.0072, + "step": 266860 + }, + { + "epoch": 1.35, + "learning_rate": 9.804097653510651e-05, + "loss": 0.0063, + "step": 266870 + }, + { + "epoch": 1.35, + "learning_rate": 9.80334088420925e-05, + "loss": 0.0085, + "step": 266880 + }, + { + "epoch": 1.35, + "learning_rate": 9.802584114907849e-05, + "loss": 0.0098, + "step": 266890 + }, + { + "epoch": 1.35, + "learning_rate": 9.801827345606448e-05, + "loss": 0.0072, + "step": 266900 + }, + { + "epoch": 1.35, + "learning_rate": 9.801070576305048e-05, + "loss": 0.0077, + "step": 266910 + }, + { + "epoch": 1.35, + "learning_rate": 9.800313807003646e-05, + "loss": 0.0079, + "step": 266920 + }, + { + "epoch": 1.35, + "learning_rate": 9.799557037702245e-05, + "loss": 0.0086, + "step": 266930 + }, + { + "epoch": 1.35, + "learning_rate": 9.798800268400845e-05, + "loss": 0.0101, + "step": 266940 + }, + { + "epoch": 1.35, + "learning_rate": 9.798043499099443e-05, + "loss": 0.0088, + "step": 266950 + }, + { + "epoch": 1.35, + "learning_rate": 9.797286729798043e-05, + "loss": 0.0081, + "step": 266960 + }, + { + "epoch": 1.35, + "learning_rate": 9.796529960496641e-05, + "loss": 0.0099, + "step": 266970 + }, + { + "epoch": 1.35, + "learning_rate": 9.79577319119524e-05, + "loss": 0.0081, + "step": 266980 + }, + { + "epoch": 1.35, + "learning_rate": 9.79501642189384e-05, + "loss": 0.0088, + "step": 266990 + }, + { + "epoch": 1.35, + "learning_rate": 9.794259652592438e-05, + "loss": 0.0085, + "step": 267000 + }, + { + "epoch": 1.35, + "eval_cer": 0.9144362920387732, + "eval_loss": 0.006072907242923975, + "eval_runtime": 116.2245, + "eval_samples_per_second": 17.208, + "eval_steps_per_second": 4.302, + "step": 267000 + }, + { + "epoch": 1.35, + "learning_rate": 9.793502883291037e-05, + "loss": 0.0077, + "step": 267010 + }, + { + "epoch": 1.35, + "learning_rate": 9.792746113989637e-05, + "loss": 0.0094, + "step": 267020 + }, + { + "epoch": 1.35, + "learning_rate": 9.791989344688235e-05, + "loss": 0.0094, + "step": 267030 + }, + { + "epoch": 1.35, + "learning_rate": 9.791232575386835e-05, + "loss": 0.0082, + "step": 267040 + }, + { + "epoch": 1.35, + "learning_rate": 9.790475806085433e-05, + "loss": 0.0073, + "step": 267050 + }, + { + "epoch": 1.35, + "learning_rate": 9.789719036784032e-05, + "loss": 0.0083, + "step": 267060 + }, + { + "epoch": 1.35, + "learning_rate": 9.788962267482632e-05, + "loss": 0.0071, + "step": 267070 + }, + { + "epoch": 1.35, + "learning_rate": 9.78820549818123e-05, + "loss": 0.0079, + "step": 267080 + }, + { + "epoch": 1.35, + "learning_rate": 9.787448728879829e-05, + "loss": 0.0073, + "step": 267090 + }, + { + "epoch": 1.35, + "learning_rate": 9.786691959578429e-05, + "loss": 0.0102, + "step": 267100 + }, + { + "epoch": 1.35, + "learning_rate": 9.785935190277027e-05, + "loss": 0.007, + "step": 267110 + }, + { + "epoch": 1.35, + "learning_rate": 9.785178420975626e-05, + "loss": 0.0063, + "step": 267120 + }, + { + "epoch": 1.35, + "learning_rate": 9.784421651674225e-05, + "loss": 0.0094, + "step": 267130 + }, + { + "epoch": 1.35, + "learning_rate": 9.783664882372824e-05, + "loss": 0.0085, + "step": 267140 + }, + { + "epoch": 1.35, + "learning_rate": 9.782908113071424e-05, + "loss": 0.0124, + "step": 267150 + }, + { + "epoch": 1.35, + "learning_rate": 9.782151343770022e-05, + "loss": 0.0082, + "step": 267160 + }, + { + "epoch": 1.35, + "learning_rate": 9.781394574468621e-05, + "loss": 0.0076, + "step": 267170 + }, + { + "epoch": 1.35, + "learning_rate": 9.780637805167221e-05, + "loss": 0.0082, + "step": 267180 + }, + { + "epoch": 1.35, + "learning_rate": 9.779881035865819e-05, + "loss": 0.0074, + "step": 267190 + }, + { + "epoch": 1.35, + "learning_rate": 9.779124266564418e-05, + "loss": 0.0057, + "step": 267200 + }, + { + "epoch": 1.35, + "learning_rate": 9.778367497263017e-05, + "loss": 0.0079, + "step": 267210 + }, + { + "epoch": 1.35, + "learning_rate": 9.777610727961616e-05, + "loss": 0.0075, + "step": 267220 + }, + { + "epoch": 1.35, + "learning_rate": 9.776853958660216e-05, + "loss": 0.0092, + "step": 267230 + }, + { + "epoch": 1.35, + "learning_rate": 9.776097189358814e-05, + "loss": 0.0084, + "step": 267240 + }, + { + "epoch": 1.35, + "learning_rate": 9.775340420057413e-05, + "loss": 0.008, + "step": 267250 + }, + { + "epoch": 1.35, + "learning_rate": 9.774583650756013e-05, + "loss": 0.0095, + "step": 267260 + }, + { + "epoch": 1.35, + "learning_rate": 9.773826881454611e-05, + "loss": 0.0112, + "step": 267270 + }, + { + "epoch": 1.35, + "learning_rate": 9.77307011215321e-05, + "loss": 0.0085, + "step": 267280 + }, + { + "epoch": 1.35, + "learning_rate": 9.772313342851808e-05, + "loss": 0.0072, + "step": 267290 + }, + { + "epoch": 1.35, + "learning_rate": 9.771556573550408e-05, + "loss": 0.0122, + "step": 267300 + }, + { + "epoch": 1.35, + "learning_rate": 9.770799804249007e-05, + "loss": 0.007, + "step": 267310 + }, + { + "epoch": 1.35, + "learning_rate": 9.770043034947606e-05, + "loss": 0.0099, + "step": 267320 + }, + { + "epoch": 1.35, + "learning_rate": 9.769286265646205e-05, + "loss": 0.0078, + "step": 267330 + }, + { + "epoch": 1.35, + "learning_rate": 9.768529496344805e-05, + "loss": 0.0059, + "step": 267340 + }, + { + "epoch": 1.35, + "learning_rate": 9.767772727043403e-05, + "loss": 0.0083, + "step": 267350 + }, + { + "epoch": 1.35, + "learning_rate": 9.767015957742002e-05, + "loss": 0.0074, + "step": 267360 + }, + { + "epoch": 1.35, + "learning_rate": 9.766259188440602e-05, + "loss": 0.0079, + "step": 267370 + }, + { + "epoch": 1.35, + "learning_rate": 9.7655024191392e-05, + "loss": 0.0111, + "step": 267380 + }, + { + "epoch": 1.35, + "learning_rate": 9.7647456498378e-05, + "loss": 0.0085, + "step": 267390 + }, + { + "epoch": 1.35, + "learning_rate": 9.763988880536398e-05, + "loss": 0.0073, + "step": 267400 + }, + { + "epoch": 1.35, + "learning_rate": 9.763232111234996e-05, + "loss": 0.0077, + "step": 267410 + }, + { + "epoch": 1.35, + "learning_rate": 9.762475341933594e-05, + "loss": 0.0072, + "step": 267420 + }, + { + "epoch": 1.35, + "learning_rate": 9.761718572632193e-05, + "loss": 0.0089, + "step": 267430 + }, + { + "epoch": 1.35, + "learning_rate": 9.760961803330793e-05, + "loss": 0.0073, + "step": 267440 + }, + { + "epoch": 1.35, + "learning_rate": 9.760205034029391e-05, + "loss": 0.0093, + "step": 267450 + }, + { + "epoch": 1.35, + "learning_rate": 9.75944826472799e-05, + "loss": 0.0102, + "step": 267460 + }, + { + "epoch": 1.35, + "learning_rate": 9.75869149542659e-05, + "loss": 0.0109, + "step": 267470 + }, + { + "epoch": 1.35, + "learning_rate": 9.757934726125188e-05, + "loss": 0.0072, + "step": 267480 + }, + { + "epoch": 1.35, + "learning_rate": 9.757177956823788e-05, + "loss": 0.0081, + "step": 267490 + }, + { + "epoch": 1.35, + "learning_rate": 9.756421187522386e-05, + "loss": 0.0072, + "step": 267500 + }, + { + "epoch": 1.35, + "learning_rate": 9.755664418220985e-05, + "loss": 0.0104, + "step": 267510 + }, + { + "epoch": 1.35, + "learning_rate": 9.754907648919585e-05, + "loss": 0.0084, + "step": 267520 + }, + { + "epoch": 1.35, + "learning_rate": 9.754150879618183e-05, + "loss": 0.0082, + "step": 267530 + }, + { + "epoch": 1.35, + "learning_rate": 9.753394110316782e-05, + "loss": 0.0063, + "step": 267540 + }, + { + "epoch": 1.35, + "learning_rate": 9.752637341015382e-05, + "loss": 0.0057, + "step": 267550 + }, + { + "epoch": 1.35, + "learning_rate": 9.75188057171398e-05, + "loss": 0.008, + "step": 267560 + }, + { + "epoch": 1.35, + "learning_rate": 9.75112380241258e-05, + "loss": 0.008, + "step": 267570 + }, + { + "epoch": 1.35, + "learning_rate": 9.750367033111178e-05, + "loss": 0.007, + "step": 267580 + }, + { + "epoch": 1.35, + "learning_rate": 9.749610263809777e-05, + "loss": 0.0084, + "step": 267590 + }, + { + "epoch": 1.35, + "learning_rate": 9.748853494508377e-05, + "loss": 0.0078, + "step": 267600 + }, + { + "epoch": 1.35, + "learning_rate": 9.748096725206975e-05, + "loss": 0.0078, + "step": 267610 + }, + { + "epoch": 1.35, + "learning_rate": 9.747339955905574e-05, + "loss": 0.0081, + "step": 267620 + }, + { + "epoch": 1.35, + "learning_rate": 9.746583186604174e-05, + "loss": 0.0074, + "step": 267630 + }, + { + "epoch": 1.35, + "learning_rate": 9.745826417302772e-05, + "loss": 0.0079, + "step": 267640 + }, + { + "epoch": 1.35, + "learning_rate": 9.745069648001371e-05, + "loss": 0.0091, + "step": 267650 + }, + { + "epoch": 1.35, + "learning_rate": 9.74431287869997e-05, + "loss": 0.0076, + "step": 267660 + }, + { + "epoch": 1.35, + "learning_rate": 9.743556109398569e-05, + "loss": 0.0065, + "step": 267670 + }, + { + "epoch": 1.35, + "learning_rate": 9.742799340097169e-05, + "loss": 0.0077, + "step": 267680 + }, + { + "epoch": 1.35, + "learning_rate": 9.742042570795767e-05, + "loss": 0.0087, + "step": 267690 + }, + { + "epoch": 1.35, + "learning_rate": 9.741285801494366e-05, + "loss": 0.0082, + "step": 267700 + }, + { + "epoch": 1.35, + "learning_rate": 9.740529032192966e-05, + "loss": 0.0082, + "step": 267710 + }, + { + "epoch": 1.35, + "learning_rate": 9.739772262891564e-05, + "loss": 0.008, + "step": 267720 + }, + { + "epoch": 1.35, + "learning_rate": 9.739015493590163e-05, + "loss": 0.0072, + "step": 267730 + }, + { + "epoch": 1.35, + "learning_rate": 9.738258724288762e-05, + "loss": 0.0094, + "step": 267740 + }, + { + "epoch": 1.35, + "learning_rate": 9.737501954987361e-05, + "loss": 0.0073, + "step": 267750 + }, + { + "epoch": 1.35, + "learning_rate": 9.73674518568596e-05, + "loss": 0.009, + "step": 267760 + }, + { + "epoch": 1.35, + "learning_rate": 9.735988416384559e-05, + "loss": 0.0092, + "step": 267770 + }, + { + "epoch": 1.35, + "learning_rate": 9.735231647083158e-05, + "loss": 0.0104, + "step": 267780 + }, + { + "epoch": 1.35, + "learning_rate": 9.734474877781758e-05, + "loss": 0.0093, + "step": 267790 + }, + { + "epoch": 1.35, + "learning_rate": 9.733718108480356e-05, + "loss": 0.0077, + "step": 267800 + }, + { + "epoch": 1.35, + "learning_rate": 9.732961339178955e-05, + "loss": 0.0078, + "step": 267810 + }, + { + "epoch": 1.35, + "learning_rate": 9.732204569877555e-05, + "loss": 0.0077, + "step": 267820 + }, + { + "epoch": 1.35, + "learning_rate": 9.731447800576153e-05, + "loss": 0.0108, + "step": 267830 + }, + { + "epoch": 1.35, + "learning_rate": 9.730691031274752e-05, + "loss": 0.0084, + "step": 267840 + }, + { + "epoch": 1.35, + "learning_rate": 9.72993426197335e-05, + "loss": 0.009, + "step": 267850 + }, + { + "epoch": 1.35, + "learning_rate": 9.72917749267195e-05, + "loss": 0.0091, + "step": 267860 + }, + { + "epoch": 1.35, + "learning_rate": 9.72842072337055e-05, + "loss": 0.0086, + "step": 267870 + }, + { + "epoch": 1.35, + "learning_rate": 9.727663954069148e-05, + "loss": 0.0076, + "step": 267880 + }, + { + "epoch": 1.35, + "learning_rate": 9.726907184767747e-05, + "loss": 0.0094, + "step": 267890 + }, + { + "epoch": 1.35, + "learning_rate": 9.726150415466347e-05, + "loss": 0.0069, + "step": 267900 + }, + { + "epoch": 1.35, + "learning_rate": 9.725393646164945e-05, + "loss": 0.0094, + "step": 267910 + }, + { + "epoch": 1.35, + "learning_rate": 9.724636876863544e-05, + "loss": 0.0084, + "step": 267920 + }, + { + "epoch": 1.35, + "learning_rate": 9.723880107562143e-05, + "loss": 0.0083, + "step": 267930 + }, + { + "epoch": 1.35, + "learning_rate": 9.723123338260742e-05, + "loss": 0.0065, + "step": 267940 + }, + { + "epoch": 1.35, + "learning_rate": 9.722366568959342e-05, + "loss": 0.0069, + "step": 267950 + }, + { + "epoch": 1.35, + "learning_rate": 9.72160979965794e-05, + "loss": 0.0082, + "step": 267960 + }, + { + "epoch": 1.35, + "learning_rate": 9.720853030356539e-05, + "loss": 0.0048, + "step": 267970 + }, + { + "epoch": 1.35, + "learning_rate": 9.720096261055139e-05, + "loss": 0.0075, + "step": 267980 + }, + { + "epoch": 1.35, + "learning_rate": 9.719339491753737e-05, + "loss": 0.0079, + "step": 267990 + }, + { + "epoch": 1.35, + "learning_rate": 9.718582722452336e-05, + "loss": 0.0097, + "step": 268000 + }, + { + "epoch": 1.35, + "eval_cer": 0.9144178545123905, + "eval_loss": 0.006040630396455526, + "eval_runtime": 116.1695, + "eval_samples_per_second": 17.216, + "eval_steps_per_second": 4.304, + "step": 268000 + }, + { + "epoch": 1.35, + "learning_rate": 9.717825953150934e-05, + "loss": 0.0077, + "step": 268010 + }, + { + "epoch": 1.35, + "learning_rate": 9.717069183849534e-05, + "loss": 0.0066, + "step": 268020 + }, + { + "epoch": 1.35, + "learning_rate": 9.716312414548133e-05, + "loss": 0.0069, + "step": 268030 + }, + { + "epoch": 1.35, + "learning_rate": 9.71555564524673e-05, + "loss": 0.0067, + "step": 268040 + }, + { + "epoch": 1.35, + "learning_rate": 9.71479887594533e-05, + "loss": 0.009, + "step": 268050 + }, + { + "epoch": 1.35, + "learning_rate": 9.714042106643928e-05, + "loss": 0.0094, + "step": 268060 + }, + { + "epoch": 1.35, + "learning_rate": 9.713285337342527e-05, + "loss": 0.0093, + "step": 268070 + }, + { + "epoch": 1.35, + "learning_rate": 9.712528568041127e-05, + "loss": 0.009, + "step": 268080 + }, + { + "epoch": 1.35, + "learning_rate": 9.711771798739725e-05, + "loss": 0.0085, + "step": 268090 + }, + { + "epoch": 1.35, + "learning_rate": 9.711015029438325e-05, + "loss": 0.006, + "step": 268100 + }, + { + "epoch": 1.35, + "learning_rate": 9.710258260136923e-05, + "loss": 0.0086, + "step": 268110 + }, + { + "epoch": 1.35, + "learning_rate": 9.709501490835522e-05, + "loss": 0.0087, + "step": 268120 + }, + { + "epoch": 1.35, + "learning_rate": 9.708744721534122e-05, + "loss": 0.0082, + "step": 268130 + }, + { + "epoch": 1.35, + "learning_rate": 9.70798795223272e-05, + "loss": 0.01, + "step": 268140 + }, + { + "epoch": 1.35, + "learning_rate": 9.707231182931319e-05, + "loss": 0.0074, + "step": 268150 + }, + { + "epoch": 1.35, + "learning_rate": 9.706474413629919e-05, + "loss": 0.0075, + "step": 268160 + }, + { + "epoch": 1.35, + "learning_rate": 9.705717644328517e-05, + "loss": 0.0093, + "step": 268170 + }, + { + "epoch": 1.35, + "learning_rate": 9.704960875027116e-05, + "loss": 0.0103, + "step": 268180 + }, + { + "epoch": 1.35, + "learning_rate": 9.704204105725715e-05, + "loss": 0.011, + "step": 268190 + }, + { + "epoch": 1.35, + "learning_rate": 9.703447336424314e-05, + "loss": 0.0117, + "step": 268200 + }, + { + "epoch": 1.35, + "learning_rate": 9.702690567122914e-05, + "loss": 0.0072, + "step": 268210 + }, + { + "epoch": 1.35, + "learning_rate": 9.701933797821512e-05, + "loss": 0.0082, + "step": 268220 + }, + { + "epoch": 1.35, + "learning_rate": 9.701177028520111e-05, + "loss": 0.0095, + "step": 268230 + }, + { + "epoch": 1.35, + "learning_rate": 9.700420259218711e-05, + "loss": 0.0063, + "step": 268240 + }, + { + "epoch": 1.35, + "learning_rate": 9.699663489917309e-05, + "loss": 0.0084, + "step": 268250 + }, + { + "epoch": 1.35, + "learning_rate": 9.698906720615908e-05, + "loss": 0.0082, + "step": 268260 + }, + { + "epoch": 1.35, + "learning_rate": 9.698149951314508e-05, + "loss": 0.0067, + "step": 268270 + }, + { + "epoch": 1.35, + "learning_rate": 9.697393182013106e-05, + "loss": 0.0108, + "step": 268280 + }, + { + "epoch": 1.35, + "learning_rate": 9.696636412711706e-05, + "loss": 0.0059, + "step": 268290 + }, + { + "epoch": 1.35, + "learning_rate": 9.695879643410304e-05, + "loss": 0.0091, + "step": 268300 + }, + { + "epoch": 1.35, + "learning_rate": 9.695122874108903e-05, + "loss": 0.0077, + "step": 268310 + }, + { + "epoch": 1.35, + "learning_rate": 9.694366104807503e-05, + "loss": 0.0072, + "step": 268320 + }, + { + "epoch": 1.35, + "learning_rate": 9.693609335506101e-05, + "loss": 0.0088, + "step": 268330 + }, + { + "epoch": 1.35, + "learning_rate": 9.6928525662047e-05, + "loss": 0.0086, + "step": 268340 + }, + { + "epoch": 1.35, + "learning_rate": 9.6920957969033e-05, + "loss": 0.0089, + "step": 268350 + }, + { + "epoch": 1.35, + "learning_rate": 9.691339027601898e-05, + "loss": 0.0096, + "step": 268360 + }, + { + "epoch": 1.35, + "learning_rate": 9.690582258300497e-05, + "loss": 0.0066, + "step": 268370 + }, + { + "epoch": 1.35, + "learning_rate": 9.689825488999096e-05, + "loss": 0.0087, + "step": 268380 + }, + { + "epoch": 1.35, + "learning_rate": 9.689068719697695e-05, + "loss": 0.0076, + "step": 268390 + }, + { + "epoch": 1.35, + "learning_rate": 9.688311950396295e-05, + "loss": 0.0084, + "step": 268400 + }, + { + "epoch": 1.35, + "learning_rate": 9.687555181094893e-05, + "loss": 0.0072, + "step": 268410 + }, + { + "epoch": 1.35, + "learning_rate": 9.686798411793492e-05, + "loss": 0.0071, + "step": 268420 + }, + { + "epoch": 1.35, + "learning_rate": 9.686041642492092e-05, + "loss": 0.0054, + "step": 268430 + }, + { + "epoch": 1.35, + "learning_rate": 9.68528487319069e-05, + "loss": 0.0069, + "step": 268440 + }, + { + "epoch": 1.35, + "learning_rate": 9.68452810388929e-05, + "loss": 0.0066, + "step": 268450 + }, + { + "epoch": 1.35, + "learning_rate": 9.683771334587888e-05, + "loss": 0.0079, + "step": 268460 + }, + { + "epoch": 1.35, + "learning_rate": 9.683014565286487e-05, + "loss": 0.0091, + "step": 268470 + }, + { + "epoch": 1.35, + "learning_rate": 9.682257795985087e-05, + "loss": 0.0072, + "step": 268480 + }, + { + "epoch": 1.35, + "learning_rate": 9.681501026683685e-05, + "loss": 0.0107, + "step": 268490 + }, + { + "epoch": 1.35, + "learning_rate": 9.680744257382284e-05, + "loss": 0.0106, + "step": 268500 + }, + { + "epoch": 1.35, + "learning_rate": 9.679987488080884e-05, + "loss": 0.0089, + "step": 268510 + }, + { + "epoch": 1.35, + "learning_rate": 9.679230718779482e-05, + "loss": 0.0089, + "step": 268520 + }, + { + "epoch": 1.35, + "learning_rate": 9.678473949478081e-05, + "loss": 0.0067, + "step": 268530 + }, + { + "epoch": 1.35, + "learning_rate": 9.67771718017668e-05, + "loss": 0.0096, + "step": 268540 + }, + { + "epoch": 1.35, + "learning_rate": 9.676960410875279e-05, + "loss": 0.0089, + "step": 268550 + }, + { + "epoch": 1.35, + "learning_rate": 9.676203641573878e-05, + "loss": 0.007, + "step": 268560 + }, + { + "epoch": 1.35, + "learning_rate": 9.675446872272477e-05, + "loss": 0.0088, + "step": 268570 + }, + { + "epoch": 1.36, + "learning_rate": 9.674690102971076e-05, + "loss": 0.0074, + "step": 268580 + }, + { + "epoch": 1.36, + "learning_rate": 9.673933333669676e-05, + "loss": 0.0077, + "step": 268590 + }, + { + "epoch": 1.36, + "learning_rate": 9.673176564368274e-05, + "loss": 0.008, + "step": 268600 + }, + { + "epoch": 1.36, + "learning_rate": 9.672419795066873e-05, + "loss": 0.0067, + "step": 268610 + }, + { + "epoch": 1.36, + "learning_rate": 9.671663025765471e-05, + "loss": 0.0069, + "step": 268620 + }, + { + "epoch": 1.36, + "learning_rate": 9.670906256464071e-05, + "loss": 0.008, + "step": 268630 + }, + { + "epoch": 1.36, + "learning_rate": 9.67014948716267e-05, + "loss": 0.008, + "step": 268640 + }, + { + "epoch": 1.36, + "learning_rate": 9.669392717861269e-05, + "loss": 0.0084, + "step": 268650 + }, + { + "epoch": 1.36, + "learning_rate": 9.668635948559867e-05, + "loss": 0.0067, + "step": 268660 + }, + { + "epoch": 1.36, + "learning_rate": 9.667879179258465e-05, + "loss": 0.0069, + "step": 268670 + }, + { + "epoch": 1.36, + "learning_rate": 9.667122409957064e-05, + "loss": 0.0072, + "step": 268680 + }, + { + "epoch": 1.36, + "learning_rate": 9.666365640655664e-05, + "loss": 0.0089, + "step": 268690 + }, + { + "epoch": 1.36, + "learning_rate": 9.665608871354262e-05, + "loss": 0.0101, + "step": 268700 + }, + { + "epoch": 1.36, + "learning_rate": 9.664852102052861e-05, + "loss": 0.0076, + "step": 268710 + }, + { + "epoch": 1.36, + "learning_rate": 9.664095332751461e-05, + "loss": 0.0063, + "step": 268720 + }, + { + "epoch": 1.36, + "learning_rate": 9.663338563450059e-05, + "loss": 0.0059, + "step": 268730 + }, + { + "epoch": 1.36, + "learning_rate": 9.662581794148659e-05, + "loss": 0.0095, + "step": 268740 + }, + { + "epoch": 1.36, + "learning_rate": 9.661825024847257e-05, + "loss": 0.0082, + "step": 268750 + }, + { + "epoch": 1.36, + "learning_rate": 9.661068255545856e-05, + "loss": 0.0068, + "step": 268760 + }, + { + "epoch": 1.36, + "learning_rate": 9.660311486244456e-05, + "loss": 0.0121, + "step": 268770 + }, + { + "epoch": 1.36, + "learning_rate": 9.659554716943054e-05, + "loss": 0.0091, + "step": 268780 + }, + { + "epoch": 1.36, + "learning_rate": 9.658797947641653e-05, + "loss": 0.0057, + "step": 268790 + }, + { + "epoch": 1.36, + "learning_rate": 9.658041178340253e-05, + "loss": 0.0102, + "step": 268800 + }, + { + "epoch": 1.36, + "learning_rate": 9.657284409038851e-05, + "loss": 0.012, + "step": 268810 + }, + { + "epoch": 1.36, + "learning_rate": 9.65652763973745e-05, + "loss": 0.0092, + "step": 268820 + }, + { + "epoch": 1.36, + "learning_rate": 9.655770870436049e-05, + "loss": 0.0078, + "step": 268830 + }, + { + "epoch": 1.36, + "learning_rate": 9.655014101134648e-05, + "loss": 0.0102, + "step": 268840 + }, + { + "epoch": 1.36, + "learning_rate": 9.654257331833248e-05, + "loss": 0.0084, + "step": 268850 + }, + { + "epoch": 1.36, + "learning_rate": 9.653500562531846e-05, + "loss": 0.0069, + "step": 268860 + }, + { + "epoch": 1.36, + "learning_rate": 9.652743793230445e-05, + "loss": 0.0055, + "step": 268870 + }, + { + "epoch": 1.36, + "learning_rate": 9.651987023929045e-05, + "loss": 0.0075, + "step": 268880 + }, + { + "epoch": 1.36, + "learning_rate": 9.651230254627643e-05, + "loss": 0.0062, + "step": 268890 + }, + { + "epoch": 1.36, + "learning_rate": 9.650473485326242e-05, + "loss": 0.0084, + "step": 268900 + }, + { + "epoch": 1.36, + "learning_rate": 9.64971671602484e-05, + "loss": 0.0083, + "step": 268910 + }, + { + "epoch": 1.36, + "learning_rate": 9.64895994672344e-05, + "loss": 0.0065, + "step": 268920 + }, + { + "epoch": 1.36, + "learning_rate": 9.64820317742204e-05, + "loss": 0.0084, + "step": 268930 + }, + { + "epoch": 1.36, + "learning_rate": 9.647446408120638e-05, + "loss": 0.0078, + "step": 268940 + }, + { + "epoch": 1.36, + "learning_rate": 9.646689638819237e-05, + "loss": 0.0071, + "step": 268950 + }, + { + "epoch": 1.36, + "learning_rate": 9.645932869517837e-05, + "loss": 0.007, + "step": 268960 + }, + { + "epoch": 1.36, + "learning_rate": 9.645176100216435e-05, + "loss": 0.008, + "step": 268970 + }, + { + "epoch": 1.36, + "learning_rate": 9.644419330915034e-05, + "loss": 0.007, + "step": 268980 + }, + { + "epoch": 1.36, + "learning_rate": 9.643662561613633e-05, + "loss": 0.0079, + "step": 268990 + }, + { + "epoch": 1.36, + "learning_rate": 9.642905792312232e-05, + "loss": 0.0084, + "step": 269000 + }, + { + "epoch": 1.36, + "eval_cer": 0.9144071801550111, + "eval_loss": 0.006098465994000435, + "eval_runtime": 116.3578, + "eval_samples_per_second": 17.188, + "eval_steps_per_second": 4.297, + "step": 269000 + }, + { + "epoch": 1.36, + "learning_rate": 9.642149023010832e-05, + "loss": 0.0086, + "step": 269010 + }, + { + "epoch": 1.36, + "learning_rate": 9.64139225370943e-05, + "loss": 0.0089, + "step": 269020 + }, + { + "epoch": 1.36, + "learning_rate": 9.640635484408029e-05, + "loss": 0.0087, + "step": 269030 + }, + { + "epoch": 1.36, + "learning_rate": 9.639878715106629e-05, + "loss": 0.0073, + "step": 269040 + }, + { + "epoch": 1.36, + "learning_rate": 9.639121945805227e-05, + "loss": 0.007, + "step": 269050 + }, + { + "epoch": 1.36, + "learning_rate": 9.638365176503826e-05, + "loss": 0.0061, + "step": 269060 + }, + { + "epoch": 1.36, + "learning_rate": 9.637608407202424e-05, + "loss": 0.0093, + "step": 269070 + }, + { + "epoch": 1.36, + "learning_rate": 9.636851637901024e-05, + "loss": 0.0096, + "step": 269080 + }, + { + "epoch": 1.36, + "learning_rate": 9.636094868599623e-05, + "loss": 0.0075, + "step": 269090 + }, + { + "epoch": 1.36, + "learning_rate": 9.635338099298222e-05, + "loss": 0.0059, + "step": 269100 + }, + { + "epoch": 1.36, + "learning_rate": 9.634581329996821e-05, + "loss": 0.0064, + "step": 269110 + }, + { + "epoch": 1.36, + "learning_rate": 9.63382456069542e-05, + "loss": 0.0079, + "step": 269120 + }, + { + "epoch": 1.36, + "learning_rate": 9.633067791394019e-05, + "loss": 0.0084, + "step": 269130 + }, + { + "epoch": 1.36, + "learning_rate": 9.632311022092618e-05, + "loss": 0.01, + "step": 269140 + }, + { + "epoch": 1.36, + "learning_rate": 9.631554252791216e-05, + "loss": 0.0084, + "step": 269150 + }, + { + "epoch": 1.36, + "learning_rate": 9.630797483489816e-05, + "loss": 0.0088, + "step": 269160 + }, + { + "epoch": 1.36, + "learning_rate": 9.630040714188415e-05, + "loss": 0.0103, + "step": 269170 + }, + { + "epoch": 1.36, + "learning_rate": 9.629283944887014e-05, + "loss": 0.0071, + "step": 269180 + }, + { + "epoch": 1.36, + "learning_rate": 9.628527175585613e-05, + "loss": 0.0075, + "step": 269190 + }, + { + "epoch": 1.36, + "learning_rate": 9.627770406284213e-05, + "loss": 0.01, + "step": 269200 + }, + { + "epoch": 1.36, + "learning_rate": 9.627013636982811e-05, + "loss": 0.0089, + "step": 269210 + }, + { + "epoch": 1.36, + "learning_rate": 9.62625686768141e-05, + "loss": 0.0079, + "step": 269220 + }, + { + "epoch": 1.36, + "learning_rate": 9.625500098380008e-05, + "loss": 0.0076, + "step": 269230 + }, + { + "epoch": 1.36, + "learning_rate": 9.624743329078608e-05, + "loss": 0.0089, + "step": 269240 + }, + { + "epoch": 1.36, + "learning_rate": 9.623986559777207e-05, + "loss": 0.0101, + "step": 269250 + }, + { + "epoch": 1.36, + "learning_rate": 9.623229790475805e-05, + "loss": 0.0067, + "step": 269260 + }, + { + "epoch": 1.36, + "learning_rate": 9.622473021174405e-05, + "loss": 0.0118, + "step": 269270 + }, + { + "epoch": 1.36, + "learning_rate": 9.621716251873004e-05, + "loss": 0.0084, + "step": 269280 + }, + { + "epoch": 1.36, + "learning_rate": 9.620959482571601e-05, + "loss": 0.0121, + "step": 269290 + }, + { + "epoch": 1.36, + "learning_rate": 9.620202713270201e-05, + "loss": 0.0075, + "step": 269300 + }, + { + "epoch": 1.36, + "learning_rate": 9.619445943968799e-05, + "loss": 0.0071, + "step": 269310 + }, + { + "epoch": 1.36, + "learning_rate": 9.618689174667398e-05, + "loss": 0.0084, + "step": 269320 + }, + { + "epoch": 1.36, + "learning_rate": 9.617932405365998e-05, + "loss": 0.0066, + "step": 269330 + }, + { + "epoch": 1.36, + "learning_rate": 9.617175636064596e-05, + "loss": 0.0132, + "step": 269340 + }, + { + "epoch": 1.36, + "learning_rate": 9.616418866763196e-05, + "loss": 0.0086, + "step": 269350 + }, + { + "epoch": 1.36, + "learning_rate": 9.615662097461794e-05, + "loss": 0.0085, + "step": 269360 + }, + { + "epoch": 1.36, + "learning_rate": 9.614905328160393e-05, + "loss": 0.0111, + "step": 269370 + }, + { + "epoch": 1.36, + "learning_rate": 9.614148558858993e-05, + "loss": 0.0076, + "step": 269380 + }, + { + "epoch": 1.36, + "learning_rate": 9.613391789557591e-05, + "loss": 0.0058, + "step": 269390 + }, + { + "epoch": 1.36, + "learning_rate": 9.61263502025619e-05, + "loss": 0.0119, + "step": 269400 + }, + { + "epoch": 1.36, + "learning_rate": 9.61187825095479e-05, + "loss": 0.008, + "step": 269410 + }, + { + "epoch": 1.36, + "learning_rate": 9.611121481653388e-05, + "loss": 0.0097, + "step": 269420 + }, + { + "epoch": 1.36, + "learning_rate": 9.610364712351987e-05, + "loss": 0.0094, + "step": 269430 + }, + { + "epoch": 1.36, + "learning_rate": 9.609607943050586e-05, + "loss": 0.0089, + "step": 269440 + }, + { + "epoch": 1.36, + "learning_rate": 9.608851173749185e-05, + "loss": 0.0077, + "step": 269450 + }, + { + "epoch": 1.36, + "learning_rate": 9.608094404447785e-05, + "loss": 0.0083, + "step": 269460 + }, + { + "epoch": 1.36, + "learning_rate": 9.607337635146383e-05, + "loss": 0.0076, + "step": 269470 + }, + { + "epoch": 1.36, + "learning_rate": 9.606580865844982e-05, + "loss": 0.0094, + "step": 269480 + }, + { + "epoch": 1.36, + "learning_rate": 9.605824096543582e-05, + "loss": 0.0062, + "step": 269490 + }, + { + "epoch": 1.36, + "learning_rate": 9.60506732724218e-05, + "loss": 0.0084, + "step": 269500 + }, + { + "epoch": 1.36, + "learning_rate": 9.60431055794078e-05, + "loss": 0.007, + "step": 269510 + }, + { + "epoch": 1.36, + "learning_rate": 9.603553788639378e-05, + "loss": 0.0101, + "step": 269520 + }, + { + "epoch": 1.36, + "learning_rate": 9.602797019337977e-05, + "loss": 0.0064, + "step": 269530 + }, + { + "epoch": 1.36, + "learning_rate": 9.602040250036577e-05, + "loss": 0.0061, + "step": 269540 + }, + { + "epoch": 1.36, + "learning_rate": 9.601283480735175e-05, + "loss": 0.0073, + "step": 269550 + }, + { + "epoch": 1.36, + "learning_rate": 9.600526711433774e-05, + "loss": 0.0067, + "step": 269560 + }, + { + "epoch": 1.36, + "learning_rate": 9.599769942132374e-05, + "loss": 0.007, + "step": 269570 + }, + { + "epoch": 1.36, + "learning_rate": 9.599013172830972e-05, + "loss": 0.0078, + "step": 269580 + }, + { + "epoch": 1.36, + "learning_rate": 9.598256403529571e-05, + "loss": 0.0085, + "step": 269590 + }, + { + "epoch": 1.36, + "learning_rate": 9.59749963422817e-05, + "loss": 0.0066, + "step": 269600 + }, + { + "epoch": 1.36, + "learning_rate": 9.596742864926769e-05, + "loss": 0.0091, + "step": 269610 + }, + { + "epoch": 1.36, + "learning_rate": 9.595986095625368e-05, + "loss": 0.0078, + "step": 269620 + }, + { + "epoch": 1.36, + "learning_rate": 9.595229326323967e-05, + "loss": 0.0072, + "step": 269630 + }, + { + "epoch": 1.36, + "learning_rate": 9.594472557022566e-05, + "loss": 0.0078, + "step": 269640 + }, + { + "epoch": 1.36, + "learning_rate": 9.593715787721166e-05, + "loss": 0.0075, + "step": 269650 + }, + { + "epoch": 1.36, + "learning_rate": 9.592959018419764e-05, + "loss": 0.008, + "step": 269660 + }, + { + "epoch": 1.36, + "learning_rate": 9.592202249118363e-05, + "loss": 0.0098, + "step": 269670 + }, + { + "epoch": 1.36, + "learning_rate": 9.591445479816961e-05, + "loss": 0.0063, + "step": 269680 + }, + { + "epoch": 1.36, + "learning_rate": 9.590688710515561e-05, + "loss": 0.0096, + "step": 269690 + }, + { + "epoch": 1.36, + "learning_rate": 9.58993194121416e-05, + "loss": 0.0078, + "step": 269700 + }, + { + "epoch": 1.36, + "learning_rate": 9.589175171912759e-05, + "loss": 0.0085, + "step": 269710 + }, + { + "epoch": 1.36, + "learning_rate": 9.588418402611358e-05, + "loss": 0.007, + "step": 269720 + }, + { + "epoch": 1.36, + "learning_rate": 9.587661633309958e-05, + "loss": 0.0074, + "step": 269730 + }, + { + "epoch": 1.36, + "learning_rate": 9.586904864008556e-05, + "loss": 0.0079, + "step": 269740 + }, + { + "epoch": 1.36, + "learning_rate": 9.586148094707155e-05, + "loss": 0.0071, + "step": 269750 + }, + { + "epoch": 1.36, + "learning_rate": 9.585391325405755e-05, + "loss": 0.0103, + "step": 269760 + }, + { + "epoch": 1.36, + "learning_rate": 9.584634556104353e-05, + "loss": 0.0076, + "step": 269770 + }, + { + "epoch": 1.36, + "learning_rate": 9.583877786802952e-05, + "loss": 0.0091, + "step": 269780 + }, + { + "epoch": 1.36, + "learning_rate": 9.58312101750155e-05, + "loss": 0.0077, + "step": 269790 + }, + { + "epoch": 1.36, + "learning_rate": 9.58236424820015e-05, + "loss": 0.0103, + "step": 269800 + }, + { + "epoch": 1.36, + "learning_rate": 9.58160747889875e-05, + "loss": 0.008, + "step": 269810 + }, + { + "epoch": 1.36, + "learning_rate": 9.580850709597348e-05, + "loss": 0.0086, + "step": 269820 + }, + { + "epoch": 1.36, + "learning_rate": 9.580093940295947e-05, + "loss": 0.0072, + "step": 269830 + }, + { + "epoch": 1.36, + "learning_rate": 9.579337170994547e-05, + "loss": 0.0057, + "step": 269840 + }, + { + "epoch": 1.36, + "learning_rate": 9.578580401693145e-05, + "loss": 0.0089, + "step": 269850 + }, + { + "epoch": 1.36, + "learning_rate": 9.577823632391744e-05, + "loss": 0.0089, + "step": 269860 + }, + { + "epoch": 1.36, + "learning_rate": 9.577066863090342e-05, + "loss": 0.0091, + "step": 269870 + }, + { + "epoch": 1.36, + "learning_rate": 9.576310093788942e-05, + "loss": 0.0081, + "step": 269880 + }, + { + "epoch": 1.36, + "learning_rate": 9.575553324487541e-05, + "loss": 0.0081, + "step": 269890 + }, + { + "epoch": 1.36, + "learning_rate": 9.57479655518614e-05, + "loss": 0.0074, + "step": 269900 + }, + { + "epoch": 1.36, + "learning_rate": 9.574039785884739e-05, + "loss": 0.0084, + "step": 269910 + }, + { + "epoch": 1.36, + "learning_rate": 9.573283016583336e-05, + "loss": 0.008, + "step": 269920 + }, + { + "epoch": 1.36, + "learning_rate": 9.572526247281935e-05, + "loss": 0.0081, + "step": 269930 + }, + { + "epoch": 1.36, + "learning_rate": 9.571769477980535e-05, + "loss": 0.0082, + "step": 269940 + }, + { + "epoch": 1.36, + "learning_rate": 9.571012708679133e-05, + "loss": 0.0071, + "step": 269950 + }, + { + "epoch": 1.36, + "learning_rate": 9.570255939377733e-05, + "loss": 0.0065, + "step": 269960 + }, + { + "epoch": 1.36, + "learning_rate": 9.56949917007633e-05, + "loss": 0.0084, + "step": 269970 + }, + { + "epoch": 1.36, + "learning_rate": 9.56874240077493e-05, + "loss": 0.0086, + "step": 269980 + }, + { + "epoch": 1.36, + "learning_rate": 9.56798563147353e-05, + "loss": 0.0087, + "step": 269990 + }, + { + "epoch": 1.36, + "learning_rate": 9.567228862172128e-05, + "loss": 0.0089, + "step": 270000 + }, + { + "epoch": 1.36, + "eval_cer": 0.9144333808503969, + "eval_loss": 0.006005189847201109, + "eval_runtime": 116.1544, + "eval_samples_per_second": 17.218, + "eval_steps_per_second": 4.305, + "step": 270000 + }, + { + "epoch": 1.36, + "learning_rate": 9.566472092870727e-05, + "loss": 0.009, + "step": 270010 + }, + { + "epoch": 1.36, + "learning_rate": 9.565715323569327e-05, + "loss": 0.0076, + "step": 270020 + }, + { + "epoch": 1.36, + "learning_rate": 9.564958554267925e-05, + "loss": 0.008, + "step": 270030 + }, + { + "epoch": 1.36, + "learning_rate": 9.564201784966524e-05, + "loss": 0.0072, + "step": 270040 + }, + { + "epoch": 1.36, + "learning_rate": 9.563445015665123e-05, + "loss": 0.007, + "step": 270050 + }, + { + "epoch": 1.36, + "learning_rate": 9.562688246363722e-05, + "loss": 0.0064, + "step": 270060 + }, + { + "epoch": 1.36, + "learning_rate": 9.561931477062322e-05, + "loss": 0.0069, + "step": 270070 + }, + { + "epoch": 1.36, + "learning_rate": 9.56117470776092e-05, + "loss": 0.0092, + "step": 270080 + }, + { + "epoch": 1.36, + "learning_rate": 9.560417938459519e-05, + "loss": 0.0101, + "step": 270090 + }, + { + "epoch": 1.36, + "learning_rate": 9.559661169158119e-05, + "loss": 0.0097, + "step": 270100 + }, + { + "epoch": 1.36, + "learning_rate": 9.558904399856717e-05, + "loss": 0.0091, + "step": 270110 + }, + { + "epoch": 1.36, + "learning_rate": 9.558147630555316e-05, + "loss": 0.007, + "step": 270120 + }, + { + "epoch": 1.36, + "learning_rate": 9.557390861253915e-05, + "loss": 0.0101, + "step": 270130 + }, + { + "epoch": 1.36, + "learning_rate": 9.556634091952514e-05, + "loss": 0.0088, + "step": 270140 + }, + { + "epoch": 1.36, + "learning_rate": 9.555877322651114e-05, + "loss": 0.0064, + "step": 270150 + }, + { + "epoch": 1.36, + "learning_rate": 9.555120553349712e-05, + "loss": 0.0073, + "step": 270160 + }, + { + "epoch": 1.36, + "learning_rate": 9.554363784048311e-05, + "loss": 0.0073, + "step": 270170 + }, + { + "epoch": 1.36, + "learning_rate": 9.55360701474691e-05, + "loss": 0.0063, + "step": 270180 + }, + { + "epoch": 1.36, + "learning_rate": 9.552850245445509e-05, + "loss": 0.0069, + "step": 270190 + }, + { + "epoch": 1.36, + "learning_rate": 9.552093476144108e-05, + "loss": 0.0084, + "step": 270200 + }, + { + "epoch": 1.36, + "learning_rate": 9.551336706842708e-05, + "loss": 0.0074, + "step": 270210 + }, + { + "epoch": 1.36, + "learning_rate": 9.550579937541306e-05, + "loss": 0.0074, + "step": 270220 + }, + { + "epoch": 1.36, + "learning_rate": 9.549823168239905e-05, + "loss": 0.0057, + "step": 270230 + }, + { + "epoch": 1.36, + "learning_rate": 9.549066398938504e-05, + "loss": 0.0102, + "step": 270240 + }, + { + "epoch": 1.36, + "learning_rate": 9.548309629637103e-05, + "loss": 0.0072, + "step": 270250 + }, + { + "epoch": 1.36, + "learning_rate": 9.547552860335703e-05, + "loss": 0.0056, + "step": 270260 + }, + { + "epoch": 1.36, + "learning_rate": 9.546796091034301e-05, + "loss": 0.0065, + "step": 270270 + }, + { + "epoch": 1.36, + "learning_rate": 9.5460393217329e-05, + "loss": 0.0075, + "step": 270280 + }, + { + "epoch": 1.36, + "learning_rate": 9.5452825524315e-05, + "loss": 0.0137, + "step": 270290 + }, + { + "epoch": 1.36, + "learning_rate": 9.544525783130098e-05, + "loss": 0.0086, + "step": 270300 + }, + { + "epoch": 1.36, + "learning_rate": 9.543769013828697e-05, + "loss": 0.0099, + "step": 270310 + }, + { + "epoch": 1.36, + "learning_rate": 9.543012244527296e-05, + "loss": 0.0071, + "step": 270320 + }, + { + "epoch": 1.36, + "learning_rate": 9.542255475225895e-05, + "loss": 0.0083, + "step": 270330 + }, + { + "epoch": 1.36, + "learning_rate": 9.541498705924495e-05, + "loss": 0.0088, + "step": 270340 + }, + { + "epoch": 1.36, + "learning_rate": 9.540741936623093e-05, + "loss": 0.0081, + "step": 270350 + }, + { + "epoch": 1.36, + "learning_rate": 9.539985167321692e-05, + "loss": 0.0068, + "step": 270360 + }, + { + "epoch": 1.36, + "learning_rate": 9.539228398020292e-05, + "loss": 0.009, + "step": 270370 + }, + { + "epoch": 1.36, + "learning_rate": 9.53847162871889e-05, + "loss": 0.0095, + "step": 270380 + }, + { + "epoch": 1.36, + "learning_rate": 9.537714859417489e-05, + "loss": 0.0088, + "step": 270390 + }, + { + "epoch": 1.36, + "learning_rate": 9.536958090116087e-05, + "loss": 0.0054, + "step": 270400 + }, + { + "epoch": 1.36, + "learning_rate": 9.536201320814687e-05, + "loss": 0.0095, + "step": 270410 + }, + { + "epoch": 1.36, + "learning_rate": 9.535444551513286e-05, + "loss": 0.0065, + "step": 270420 + }, + { + "epoch": 1.36, + "learning_rate": 9.534687782211885e-05, + "loss": 0.007, + "step": 270430 + }, + { + "epoch": 1.36, + "learning_rate": 9.533931012910484e-05, + "loss": 0.0067, + "step": 270440 + }, + { + "epoch": 1.36, + "learning_rate": 9.533174243609084e-05, + "loss": 0.0108, + "step": 270450 + }, + { + "epoch": 1.36, + "learning_rate": 9.532417474307682e-05, + "loss": 0.0086, + "step": 270460 + }, + { + "epoch": 1.36, + "learning_rate": 9.531660705006281e-05, + "loss": 0.0096, + "step": 270470 + }, + { + "epoch": 1.36, + "learning_rate": 9.53090393570488e-05, + "loss": 0.0108, + "step": 270480 + }, + { + "epoch": 1.36, + "learning_rate": 9.530147166403479e-05, + "loss": 0.0072, + "step": 270490 + }, + { + "epoch": 1.36, + "learning_rate": 9.529390397102078e-05, + "loss": 0.0075, + "step": 270500 + }, + { + "epoch": 1.36, + "learning_rate": 9.528633627800677e-05, + "loss": 0.0064, + "step": 270510 + }, + { + "epoch": 1.36, + "learning_rate": 9.527876858499276e-05, + "loss": 0.009, + "step": 270520 + }, + { + "epoch": 1.36, + "learning_rate": 9.527120089197876e-05, + "loss": 0.0097, + "step": 270530 + }, + { + "epoch": 1.36, + "learning_rate": 9.526363319896474e-05, + "loss": 0.0086, + "step": 270540 + }, + { + "epoch": 1.36, + "learning_rate": 9.525606550595072e-05, + "loss": 0.0065, + "step": 270550 + }, + { + "epoch": 1.37, + "learning_rate": 9.52484978129367e-05, + "loss": 0.0082, + "step": 270560 + }, + { + "epoch": 1.37, + "learning_rate": 9.52409301199227e-05, + "loss": 0.0068, + "step": 270570 + }, + { + "epoch": 1.37, + "learning_rate": 9.523336242690868e-05, + "loss": 0.0097, + "step": 270580 + }, + { + "epoch": 1.37, + "learning_rate": 9.522579473389467e-05, + "loss": 0.0063, + "step": 270590 + }, + { + "epoch": 1.37, + "learning_rate": 9.521822704088067e-05, + "loss": 0.0072, + "step": 270600 + }, + { + "epoch": 1.37, + "learning_rate": 9.521065934786665e-05, + "loss": 0.0096, + "step": 270610 + }, + { + "epoch": 1.37, + "learning_rate": 9.520309165485264e-05, + "loss": 0.0068, + "step": 270620 + }, + { + "epoch": 1.37, + "learning_rate": 9.519552396183864e-05, + "loss": 0.0065, + "step": 270630 + }, + { + "epoch": 1.37, + "learning_rate": 9.518795626882462e-05, + "loss": 0.0081, + "step": 270640 + }, + { + "epoch": 1.37, + "learning_rate": 9.518038857581061e-05, + "loss": 0.0074, + "step": 270650 + }, + { + "epoch": 1.37, + "learning_rate": 9.517282088279661e-05, + "loss": 0.0066, + "step": 270660 + }, + { + "epoch": 1.37, + "learning_rate": 9.516525318978259e-05, + "loss": 0.0092, + "step": 270670 + }, + { + "epoch": 1.37, + "learning_rate": 9.515768549676859e-05, + "loss": 0.0133, + "step": 270680 + }, + { + "epoch": 1.37, + "learning_rate": 9.515011780375457e-05, + "loss": 0.0075, + "step": 270690 + }, + { + "epoch": 1.37, + "learning_rate": 9.514255011074056e-05, + "loss": 0.0079, + "step": 270700 + }, + { + "epoch": 1.37, + "learning_rate": 9.513498241772656e-05, + "loss": 0.0083, + "step": 270710 + }, + { + "epoch": 1.37, + "learning_rate": 9.512741472471254e-05, + "loss": 0.0081, + "step": 270720 + }, + { + "epoch": 1.37, + "learning_rate": 9.511984703169853e-05, + "loss": 0.0077, + "step": 270730 + }, + { + "epoch": 1.37, + "learning_rate": 9.511227933868453e-05, + "loss": 0.0062, + "step": 270740 + }, + { + "epoch": 1.37, + "learning_rate": 9.510471164567051e-05, + "loss": 0.0069, + "step": 270750 + }, + { + "epoch": 1.37, + "learning_rate": 9.50971439526565e-05, + "loss": 0.007, + "step": 270760 + }, + { + "epoch": 1.37, + "learning_rate": 9.508957625964249e-05, + "loss": 0.0087, + "step": 270770 + }, + { + "epoch": 1.37, + "learning_rate": 9.508200856662848e-05, + "loss": 0.0093, + "step": 270780 + }, + { + "epoch": 1.37, + "learning_rate": 9.507444087361448e-05, + "loss": 0.0117, + "step": 270790 + }, + { + "epoch": 1.37, + "learning_rate": 9.506687318060046e-05, + "loss": 0.0083, + "step": 270800 + }, + { + "epoch": 1.37, + "learning_rate": 9.505930548758645e-05, + "loss": 0.0069, + "step": 270810 + }, + { + "epoch": 1.37, + "learning_rate": 9.505173779457245e-05, + "loss": 0.0078, + "step": 270820 + }, + { + "epoch": 1.37, + "learning_rate": 9.504417010155843e-05, + "loss": 0.0079, + "step": 270830 + }, + { + "epoch": 1.37, + "learning_rate": 9.503660240854442e-05, + "loss": 0.0082, + "step": 270840 + }, + { + "epoch": 1.37, + "learning_rate": 9.50290347155304e-05, + "loss": 0.0089, + "step": 270850 + }, + { + "epoch": 1.37, + "learning_rate": 9.50214670225164e-05, + "loss": 0.0098, + "step": 270860 + }, + { + "epoch": 1.37, + "learning_rate": 9.50138993295024e-05, + "loss": 0.006, + "step": 270870 + }, + { + "epoch": 1.37, + "learning_rate": 9.500633163648838e-05, + "loss": 0.0139, + "step": 270880 + }, + { + "epoch": 1.37, + "learning_rate": 9.499876394347437e-05, + "loss": 0.0072, + "step": 270890 + }, + { + "epoch": 1.37, + "learning_rate": 9.499119625046037e-05, + "loss": 0.0115, + "step": 270900 + }, + { + "epoch": 1.37, + "learning_rate": 9.498362855744635e-05, + "loss": 0.0098, + "step": 270910 + }, + { + "epoch": 1.37, + "learning_rate": 9.497606086443234e-05, + "loss": 0.0091, + "step": 270920 + }, + { + "epoch": 1.37, + "learning_rate": 9.496849317141832e-05, + "loss": 0.0077, + "step": 270930 + }, + { + "epoch": 1.37, + "learning_rate": 9.496092547840432e-05, + "loss": 0.007, + "step": 270940 + }, + { + "epoch": 1.37, + "learning_rate": 9.495335778539031e-05, + "loss": 0.0098, + "step": 270950 + }, + { + "epoch": 1.37, + "learning_rate": 9.49457900923763e-05, + "loss": 0.0077, + "step": 270960 + }, + { + "epoch": 1.37, + "learning_rate": 9.493822239936229e-05, + "loss": 0.0075, + "step": 270970 + }, + { + "epoch": 1.37, + "learning_rate": 9.493065470634829e-05, + "loss": 0.0089, + "step": 270980 + }, + { + "epoch": 1.37, + "learning_rate": 9.492308701333427e-05, + "loss": 0.0077, + "step": 270990 + }, + { + "epoch": 1.37, + "learning_rate": 9.491551932032026e-05, + "loss": 0.012, + "step": 271000 + }, + { + "epoch": 1.37, + "eval_cer": 0.9144411440194001, + "eval_loss": 0.0061246431432664394, + "eval_runtime": 116.2526, + "eval_samples_per_second": 17.204, + "eval_steps_per_second": 4.301, + "step": 271000 + }, + { + "epoch": 1.37, + "learning_rate": 9.490795162730624e-05, + "loss": 0.0075, + "step": 271010 + }, + { + "epoch": 1.37, + "learning_rate": 9.490038393429224e-05, + "loss": 0.0075, + "step": 271020 + }, + { + "epoch": 1.37, + "learning_rate": 9.489281624127823e-05, + "loss": 0.0087, + "step": 271030 + }, + { + "epoch": 1.37, + "learning_rate": 9.488524854826422e-05, + "loss": 0.0078, + "step": 271040 + }, + { + "epoch": 1.37, + "learning_rate": 9.487768085525021e-05, + "loss": 0.0111, + "step": 271050 + }, + { + "epoch": 1.37, + "learning_rate": 9.48701131622362e-05, + "loss": 0.008, + "step": 271060 + }, + { + "epoch": 1.37, + "learning_rate": 9.486254546922219e-05, + "loss": 0.0117, + "step": 271070 + }, + { + "epoch": 1.37, + "learning_rate": 9.485497777620818e-05, + "loss": 0.005, + "step": 271080 + }, + { + "epoch": 1.37, + "learning_rate": 9.484741008319416e-05, + "loss": 0.009, + "step": 271090 + }, + { + "epoch": 1.37, + "learning_rate": 9.483984239018016e-05, + "loss": 0.0068, + "step": 271100 + }, + { + "epoch": 1.37, + "learning_rate": 9.483227469716615e-05, + "loss": 0.007, + "step": 271110 + }, + { + "epoch": 1.37, + "learning_rate": 9.482470700415213e-05, + "loss": 0.0074, + "step": 271120 + }, + { + "epoch": 1.37, + "learning_rate": 9.481713931113813e-05, + "loss": 0.0065, + "step": 271130 + }, + { + "epoch": 1.37, + "learning_rate": 9.480957161812412e-05, + "loss": 0.0068, + "step": 271140 + }, + { + "epoch": 1.37, + "learning_rate": 9.48020039251101e-05, + "loss": 0.0091, + "step": 271150 + }, + { + "epoch": 1.37, + "learning_rate": 9.47944362320961e-05, + "loss": 0.007, + "step": 271160 + }, + { + "epoch": 1.37, + "learning_rate": 9.478686853908208e-05, + "loss": 0.0083, + "step": 271170 + }, + { + "epoch": 1.37, + "learning_rate": 9.477930084606806e-05, + "loss": 0.009, + "step": 271180 + }, + { + "epoch": 1.37, + "learning_rate": 9.477173315305406e-05, + "loss": 0.0062, + "step": 271190 + }, + { + "epoch": 1.37, + "learning_rate": 9.476416546004004e-05, + "loss": 0.0092, + "step": 271200 + }, + { + "epoch": 1.37, + "learning_rate": 9.475659776702604e-05, + "loss": 0.0084, + "step": 271210 + }, + { + "epoch": 1.37, + "learning_rate": 9.474903007401202e-05, + "loss": 0.0113, + "step": 271220 + }, + { + "epoch": 1.37, + "learning_rate": 9.474146238099801e-05, + "loss": 0.0079, + "step": 271230 + }, + { + "epoch": 1.37, + "learning_rate": 9.473389468798401e-05, + "loss": 0.0083, + "step": 271240 + }, + { + "epoch": 1.37, + "learning_rate": 9.472632699496999e-05, + "loss": 0.0095, + "step": 271250 + }, + { + "epoch": 1.37, + "learning_rate": 9.471875930195598e-05, + "loss": 0.0082, + "step": 271260 + }, + { + "epoch": 1.37, + "learning_rate": 9.471119160894198e-05, + "loss": 0.009, + "step": 271270 + }, + { + "epoch": 1.37, + "learning_rate": 9.470362391592796e-05, + "loss": 0.0114, + "step": 271280 + }, + { + "epoch": 1.37, + "learning_rate": 9.469605622291395e-05, + "loss": 0.0084, + "step": 271290 + }, + { + "epoch": 1.37, + "learning_rate": 9.468848852989994e-05, + "loss": 0.007, + "step": 271300 + }, + { + "epoch": 1.37, + "learning_rate": 9.468092083688593e-05, + "loss": 0.0064, + "step": 271310 + }, + { + "epoch": 1.37, + "learning_rate": 9.467335314387193e-05, + "loss": 0.0104, + "step": 271320 + }, + { + "epoch": 1.37, + "learning_rate": 9.466578545085791e-05, + "loss": 0.0073, + "step": 271330 + }, + { + "epoch": 1.37, + "learning_rate": 9.46582177578439e-05, + "loss": 0.0086, + "step": 271340 + }, + { + "epoch": 1.37, + "learning_rate": 9.46506500648299e-05, + "loss": 0.0073, + "step": 271350 + }, + { + "epoch": 1.37, + "learning_rate": 9.464308237181588e-05, + "loss": 0.0072, + "step": 271360 + }, + { + "epoch": 1.37, + "learning_rate": 9.463551467880187e-05, + "loss": 0.0088, + "step": 271370 + }, + { + "epoch": 1.37, + "learning_rate": 9.462794698578786e-05, + "loss": 0.0065, + "step": 271380 + }, + { + "epoch": 1.37, + "learning_rate": 9.462037929277385e-05, + "loss": 0.0062, + "step": 271390 + }, + { + "epoch": 1.37, + "learning_rate": 9.461281159975985e-05, + "loss": 0.0115, + "step": 271400 + }, + { + "epoch": 1.37, + "learning_rate": 9.460524390674583e-05, + "loss": 0.0074, + "step": 271410 + }, + { + "epoch": 1.37, + "learning_rate": 9.459767621373182e-05, + "loss": 0.0073, + "step": 271420 + }, + { + "epoch": 1.37, + "learning_rate": 9.459010852071782e-05, + "loss": 0.01, + "step": 271430 + }, + { + "epoch": 1.37, + "learning_rate": 9.45825408277038e-05, + "loss": 0.0072, + "step": 271440 + }, + { + "epoch": 1.37, + "learning_rate": 9.45749731346898e-05, + "loss": 0.008, + "step": 271450 + }, + { + "epoch": 1.37, + "learning_rate": 9.456740544167577e-05, + "loss": 0.0094, + "step": 271460 + }, + { + "epoch": 1.37, + "learning_rate": 9.455983774866177e-05, + "loss": 0.0077, + "step": 271470 + }, + { + "epoch": 1.37, + "learning_rate": 9.455227005564776e-05, + "loss": 0.0082, + "step": 271480 + }, + { + "epoch": 1.37, + "learning_rate": 9.454470236263375e-05, + "loss": 0.0071, + "step": 271490 + }, + { + "epoch": 1.37, + "learning_rate": 9.453713466961974e-05, + "loss": 0.0099, + "step": 271500 + }, + { + "epoch": 1.37, + "learning_rate": 9.452956697660574e-05, + "loss": 0.0083, + "step": 271510 + }, + { + "epoch": 1.37, + "learning_rate": 9.452199928359172e-05, + "loss": 0.0072, + "step": 271520 + }, + { + "epoch": 1.37, + "learning_rate": 9.451443159057771e-05, + "loss": 0.0083, + "step": 271530 + }, + { + "epoch": 1.37, + "learning_rate": 9.45068638975637e-05, + "loss": 0.0101, + "step": 271540 + }, + { + "epoch": 1.37, + "learning_rate": 9.449929620454969e-05, + "loss": 0.0081, + "step": 271550 + }, + { + "epoch": 1.37, + "learning_rate": 9.449172851153568e-05, + "loss": 0.007, + "step": 271560 + }, + { + "epoch": 1.37, + "learning_rate": 9.448416081852167e-05, + "loss": 0.0088, + "step": 271570 + }, + { + "epoch": 1.37, + "learning_rate": 9.447659312550766e-05, + "loss": 0.0093, + "step": 271580 + }, + { + "epoch": 1.37, + "learning_rate": 9.446902543249366e-05, + "loss": 0.0113, + "step": 271590 + }, + { + "epoch": 1.37, + "learning_rate": 9.446145773947964e-05, + "loss": 0.0093, + "step": 271600 + }, + { + "epoch": 1.37, + "learning_rate": 9.445389004646563e-05, + "loss": 0.0099, + "step": 271610 + }, + { + "epoch": 1.37, + "learning_rate": 9.444632235345161e-05, + "loss": 0.0067, + "step": 271620 + }, + { + "epoch": 1.37, + "learning_rate": 9.443875466043761e-05, + "loss": 0.0093, + "step": 271630 + }, + { + "epoch": 1.37, + "learning_rate": 9.44311869674236e-05, + "loss": 0.0079, + "step": 271640 + }, + { + "epoch": 1.37, + "learning_rate": 9.442361927440958e-05, + "loss": 0.0093, + "step": 271650 + }, + { + "epoch": 1.37, + "learning_rate": 9.441605158139558e-05, + "loss": 0.0091, + "step": 271660 + }, + { + "epoch": 1.37, + "learning_rate": 9.440848388838157e-05, + "loss": 0.0064, + "step": 271670 + }, + { + "epoch": 1.37, + "learning_rate": 9.440091619536756e-05, + "loss": 0.0096, + "step": 271680 + }, + { + "epoch": 1.37, + "learning_rate": 9.439334850235355e-05, + "loss": 0.0059, + "step": 271690 + }, + { + "epoch": 1.37, + "learning_rate": 9.438578080933955e-05, + "loss": 0.0094, + "step": 271700 + }, + { + "epoch": 1.37, + "learning_rate": 9.437821311632553e-05, + "loss": 0.0067, + "step": 271710 + }, + { + "epoch": 1.37, + "learning_rate": 9.437064542331152e-05, + "loss": 0.0079, + "step": 271720 + }, + { + "epoch": 1.37, + "learning_rate": 9.43630777302975e-05, + "loss": 0.0076, + "step": 271730 + }, + { + "epoch": 1.37, + "learning_rate": 9.43555100372835e-05, + "loss": 0.0068, + "step": 271740 + }, + { + "epoch": 1.37, + "learning_rate": 9.43479423442695e-05, + "loss": 0.0091, + "step": 271750 + }, + { + "epoch": 1.37, + "learning_rate": 9.434037465125548e-05, + "loss": 0.0053, + "step": 271760 + }, + { + "epoch": 1.37, + "learning_rate": 9.433280695824147e-05, + "loss": 0.0085, + "step": 271770 + }, + { + "epoch": 1.37, + "learning_rate": 9.432523926522747e-05, + "loss": 0.0073, + "step": 271780 + }, + { + "epoch": 1.37, + "learning_rate": 9.431767157221345e-05, + "loss": 0.0087, + "step": 271790 + }, + { + "epoch": 1.37, + "learning_rate": 9.431010387919944e-05, + "loss": 0.0074, + "step": 271800 + }, + { + "epoch": 1.37, + "learning_rate": 9.430253618618541e-05, + "loss": 0.0061, + "step": 271810 + }, + { + "epoch": 1.37, + "learning_rate": 9.42949684931714e-05, + "loss": 0.0081, + "step": 271820 + }, + { + "epoch": 1.37, + "learning_rate": 9.428740080015739e-05, + "loss": 0.0084, + "step": 271830 + }, + { + "epoch": 1.37, + "learning_rate": 9.427983310714338e-05, + "loss": 0.0134, + "step": 271840 + }, + { + "epoch": 1.37, + "learning_rate": 9.427226541412938e-05, + "loss": 0.0075, + "step": 271850 + }, + { + "epoch": 1.37, + "learning_rate": 9.426469772111536e-05, + "loss": 0.0069, + "step": 271860 + }, + { + "epoch": 1.37, + "learning_rate": 9.425713002810135e-05, + "loss": 0.0091, + "step": 271870 + }, + { + "epoch": 1.37, + "learning_rate": 9.424956233508735e-05, + "loss": 0.0076, + "step": 271880 + }, + { + "epoch": 1.37, + "learning_rate": 9.424199464207333e-05, + "loss": 0.009, + "step": 271890 + }, + { + "epoch": 1.37, + "learning_rate": 9.423442694905932e-05, + "loss": 0.0088, + "step": 271900 + }, + { + "epoch": 1.37, + "learning_rate": 9.42268592560453e-05, + "loss": 0.008, + "step": 271910 + }, + { + "epoch": 1.37, + "learning_rate": 9.42192915630313e-05, + "loss": 0.0059, + "step": 271920 + }, + { + "epoch": 1.37, + "learning_rate": 9.42117238700173e-05, + "loss": 0.0109, + "step": 271930 + }, + { + "epoch": 1.37, + "learning_rate": 9.420415617700328e-05, + "loss": 0.0077, + "step": 271940 + }, + { + "epoch": 1.37, + "learning_rate": 9.419658848398927e-05, + "loss": 0.0073, + "step": 271950 + }, + { + "epoch": 1.37, + "learning_rate": 9.418902079097527e-05, + "loss": 0.0094, + "step": 271960 + }, + { + "epoch": 1.37, + "learning_rate": 9.418145309796125e-05, + "loss": 0.0062, + "step": 271970 + }, + { + "epoch": 1.37, + "learning_rate": 9.417388540494724e-05, + "loss": 0.0092, + "step": 271980 + }, + { + "epoch": 1.37, + "learning_rate": 9.416631771193322e-05, + "loss": 0.0069, + "step": 271990 + }, + { + "epoch": 1.37, + "learning_rate": 9.415875001891922e-05, + "loss": 0.0082, + "step": 272000 + }, + { + "epoch": 1.37, + "eval_cer": 0.9144265880775191, + "eval_loss": 0.006095241755247116, + "eval_runtime": 116.2589, + "eval_samples_per_second": 17.203, + "eval_steps_per_second": 4.301, + "step": 272000 + }, + { + "epoch": 1.37, + "learning_rate": 9.415118232590521e-05, + "loss": 0.0073, + "step": 272010 + }, + { + "epoch": 1.37, + "learning_rate": 9.41436146328912e-05, + "loss": 0.0076, + "step": 272020 + }, + { + "epoch": 1.37, + "learning_rate": 9.413604693987719e-05, + "loss": 0.0072, + "step": 272030 + }, + { + "epoch": 1.37, + "learning_rate": 9.412847924686319e-05, + "loss": 0.007, + "step": 272040 + }, + { + "epoch": 1.37, + "learning_rate": 9.412091155384917e-05, + "loss": 0.0083, + "step": 272050 + }, + { + "epoch": 1.37, + "learning_rate": 9.411334386083516e-05, + "loss": 0.0082, + "step": 272060 + }, + { + "epoch": 1.37, + "learning_rate": 9.410577616782114e-05, + "loss": 0.0097, + "step": 272070 + }, + { + "epoch": 1.37, + "learning_rate": 9.409820847480714e-05, + "loss": 0.0093, + "step": 272080 + }, + { + "epoch": 1.37, + "learning_rate": 9.409064078179313e-05, + "loss": 0.0096, + "step": 272090 + }, + { + "epoch": 1.37, + "learning_rate": 9.408307308877912e-05, + "loss": 0.0073, + "step": 272100 + }, + { + "epoch": 1.37, + "learning_rate": 9.407550539576511e-05, + "loss": 0.0092, + "step": 272110 + }, + { + "epoch": 1.37, + "learning_rate": 9.40679377027511e-05, + "loss": 0.0085, + "step": 272120 + }, + { + "epoch": 1.37, + "learning_rate": 9.406037000973709e-05, + "loss": 0.0071, + "step": 272130 + }, + { + "epoch": 1.37, + "learning_rate": 9.405280231672308e-05, + "loss": 0.0066, + "step": 272140 + }, + { + "epoch": 1.37, + "learning_rate": 9.404523462370908e-05, + "loss": 0.0074, + "step": 272150 + }, + { + "epoch": 1.37, + "learning_rate": 9.403766693069506e-05, + "loss": 0.0072, + "step": 272160 + }, + { + "epoch": 1.37, + "learning_rate": 9.403009923768105e-05, + "loss": 0.0103, + "step": 272170 + }, + { + "epoch": 1.37, + "learning_rate": 9.402253154466703e-05, + "loss": 0.0086, + "step": 272180 + }, + { + "epoch": 1.37, + "learning_rate": 9.401496385165303e-05, + "loss": 0.0081, + "step": 272190 + }, + { + "epoch": 1.37, + "learning_rate": 9.400739615863902e-05, + "loss": 0.0071, + "step": 272200 + }, + { + "epoch": 1.37, + "learning_rate": 9.3999828465625e-05, + "loss": 0.0072, + "step": 272210 + }, + { + "epoch": 1.37, + "learning_rate": 9.3992260772611e-05, + "loss": 0.0096, + "step": 272220 + }, + { + "epoch": 1.37, + "learning_rate": 9.3984693079597e-05, + "loss": 0.0064, + "step": 272230 + }, + { + "epoch": 1.37, + "learning_rate": 9.397712538658298e-05, + "loss": 0.009, + "step": 272240 + }, + { + "epoch": 1.37, + "learning_rate": 9.396955769356897e-05, + "loss": 0.0081, + "step": 272250 + }, + { + "epoch": 1.37, + "learning_rate": 9.396199000055495e-05, + "loss": 0.0076, + "step": 272260 + }, + { + "epoch": 1.37, + "learning_rate": 9.395442230754095e-05, + "loss": 0.0074, + "step": 272270 + }, + { + "epoch": 1.37, + "learning_rate": 9.394685461452694e-05, + "loss": 0.0106, + "step": 272280 + }, + { + "epoch": 1.37, + "learning_rate": 9.393928692151293e-05, + "loss": 0.0071, + "step": 272290 + }, + { + "epoch": 1.37, + "learning_rate": 9.393171922849892e-05, + "loss": 0.0125, + "step": 272300 + }, + { + "epoch": 1.37, + "learning_rate": 9.392415153548492e-05, + "loss": 0.0077, + "step": 272310 + }, + { + "epoch": 1.37, + "learning_rate": 9.39165838424709e-05, + "loss": 0.0095, + "step": 272320 + }, + { + "epoch": 1.37, + "learning_rate": 9.390901614945689e-05, + "loss": 0.0074, + "step": 272330 + }, + { + "epoch": 1.37, + "learning_rate": 9.390144845644287e-05, + "loss": 0.007, + "step": 272340 + }, + { + "epoch": 1.37, + "learning_rate": 9.389388076342887e-05, + "loss": 0.0068, + "step": 272350 + }, + { + "epoch": 1.37, + "learning_rate": 9.388631307041486e-05, + "loss": 0.0066, + "step": 272360 + }, + { + "epoch": 1.37, + "learning_rate": 9.387874537740084e-05, + "loss": 0.0082, + "step": 272370 + }, + { + "epoch": 1.37, + "learning_rate": 9.387117768438684e-05, + "loss": 0.0056, + "step": 272380 + }, + { + "epoch": 1.37, + "learning_rate": 9.386360999137283e-05, + "loss": 0.008, + "step": 272390 + }, + { + "epoch": 1.37, + "learning_rate": 9.385604229835882e-05, + "loss": 0.0074, + "step": 272400 + }, + { + "epoch": 1.37, + "learning_rate": 9.384847460534481e-05, + "loss": 0.0077, + "step": 272410 + }, + { + "epoch": 1.37, + "learning_rate": 9.384090691233079e-05, + "loss": 0.0081, + "step": 272420 + }, + { + "epoch": 1.37, + "learning_rate": 9.383333921931679e-05, + "loss": 0.0084, + "step": 272430 + }, + { + "epoch": 1.37, + "learning_rate": 9.382577152630276e-05, + "loss": 0.0084, + "step": 272440 + }, + { + "epoch": 1.37, + "learning_rate": 9.381820383328875e-05, + "loss": 0.0067, + "step": 272450 + }, + { + "epoch": 1.37, + "learning_rate": 9.381063614027475e-05, + "loss": 0.0077, + "step": 272460 + }, + { + "epoch": 1.37, + "learning_rate": 9.380306844726073e-05, + "loss": 0.0076, + "step": 272470 + }, + { + "epoch": 1.37, + "learning_rate": 9.379550075424672e-05, + "loss": 0.01, + "step": 272480 + }, + { + "epoch": 1.37, + "learning_rate": 9.378793306123272e-05, + "loss": 0.0071, + "step": 272490 + }, + { + "epoch": 1.37, + "learning_rate": 9.37803653682187e-05, + "loss": 0.0084, + "step": 272500 + }, + { + "epoch": 1.37, + "learning_rate": 9.37727976752047e-05, + "loss": 0.011, + "step": 272510 + }, + { + "epoch": 1.37, + "learning_rate": 9.376522998219067e-05, + "loss": 0.007, + "step": 272520 + }, + { + "epoch": 1.37, + "learning_rate": 9.375766228917667e-05, + "loss": 0.0083, + "step": 272530 + }, + { + "epoch": 1.37, + "learning_rate": 9.375009459616266e-05, + "loss": 0.0069, + "step": 272540 + }, + { + "epoch": 1.38, + "learning_rate": 9.374252690314865e-05, + "loss": 0.0123, + "step": 272550 + }, + { + "epoch": 1.38, + "learning_rate": 9.373495921013464e-05, + "loss": 0.0067, + "step": 272560 + }, + { + "epoch": 1.38, + "learning_rate": 9.372739151712064e-05, + "loss": 0.01, + "step": 272570 + }, + { + "epoch": 1.38, + "learning_rate": 9.371982382410662e-05, + "loss": 0.0076, + "step": 272580 + }, + { + "epoch": 1.38, + "learning_rate": 9.371225613109261e-05, + "loss": 0.0083, + "step": 272590 + }, + { + "epoch": 1.38, + "learning_rate": 9.370468843807861e-05, + "loss": 0.0054, + "step": 272600 + }, + { + "epoch": 1.38, + "learning_rate": 9.369712074506459e-05, + "loss": 0.0102, + "step": 272610 + }, + { + "epoch": 1.38, + "learning_rate": 9.368955305205058e-05, + "loss": 0.0083, + "step": 272620 + }, + { + "epoch": 1.38, + "learning_rate": 9.368198535903657e-05, + "loss": 0.0091, + "step": 272630 + }, + { + "epoch": 1.38, + "learning_rate": 9.367441766602256e-05, + "loss": 0.0084, + "step": 272640 + }, + { + "epoch": 1.38, + "learning_rate": 9.366684997300856e-05, + "loss": 0.0076, + "step": 272650 + }, + { + "epoch": 1.38, + "learning_rate": 9.365928227999454e-05, + "loss": 0.0069, + "step": 272660 + }, + { + "epoch": 1.38, + "learning_rate": 9.365171458698053e-05, + "loss": 0.0089, + "step": 272670 + }, + { + "epoch": 1.38, + "learning_rate": 9.364414689396653e-05, + "loss": 0.0073, + "step": 272680 + }, + { + "epoch": 1.38, + "learning_rate": 9.363657920095251e-05, + "loss": 0.0088, + "step": 272690 + }, + { + "epoch": 1.38, + "learning_rate": 9.36290115079385e-05, + "loss": 0.0068, + "step": 272700 + }, + { + "epoch": 1.38, + "learning_rate": 9.362144381492449e-05, + "loss": 0.0073, + "step": 272710 + }, + { + "epoch": 1.38, + "learning_rate": 9.361387612191048e-05, + "loss": 0.01, + "step": 272720 + }, + { + "epoch": 1.38, + "learning_rate": 9.360630842889648e-05, + "loss": 0.0082, + "step": 272730 + }, + { + "epoch": 1.38, + "learning_rate": 9.359874073588246e-05, + "loss": 0.0086, + "step": 272740 + }, + { + "epoch": 1.38, + "learning_rate": 9.359117304286845e-05, + "loss": 0.0065, + "step": 272750 + }, + { + "epoch": 1.38, + "learning_rate": 9.358360534985445e-05, + "loss": 0.0087, + "step": 272760 + }, + { + "epoch": 1.38, + "learning_rate": 9.357603765684043e-05, + "loss": 0.0076, + "step": 272770 + }, + { + "epoch": 1.38, + "learning_rate": 9.356846996382642e-05, + "loss": 0.0071, + "step": 272780 + }, + { + "epoch": 1.38, + "learning_rate": 9.35609022708124e-05, + "loss": 0.007, + "step": 272790 + }, + { + "epoch": 1.38, + "learning_rate": 9.35533345777984e-05, + "loss": 0.0075, + "step": 272800 + }, + { + "epoch": 1.38, + "learning_rate": 9.35457668847844e-05, + "loss": 0.0081, + "step": 272810 + }, + { + "epoch": 1.38, + "learning_rate": 9.353819919177038e-05, + "loss": 0.0082, + "step": 272820 + }, + { + "epoch": 1.38, + "learning_rate": 9.353063149875637e-05, + "loss": 0.0053, + "step": 272830 + }, + { + "epoch": 1.38, + "learning_rate": 9.352306380574237e-05, + "loss": 0.0099, + "step": 272840 + }, + { + "epoch": 1.38, + "learning_rate": 9.351549611272835e-05, + "loss": 0.0074, + "step": 272850 + }, + { + "epoch": 1.38, + "learning_rate": 9.350792841971434e-05, + "loss": 0.0065, + "step": 272860 + }, + { + "epoch": 1.38, + "learning_rate": 9.350036072670032e-05, + "loss": 0.0073, + "step": 272870 + }, + { + "epoch": 1.38, + "learning_rate": 9.349279303368632e-05, + "loss": 0.006, + "step": 272880 + }, + { + "epoch": 1.38, + "learning_rate": 9.348522534067231e-05, + "loss": 0.0061, + "step": 272890 + }, + { + "epoch": 1.38, + "learning_rate": 9.34776576476583e-05, + "loss": 0.0102, + "step": 272900 + }, + { + "epoch": 1.38, + "learning_rate": 9.347008995464429e-05, + "loss": 0.0057, + "step": 272910 + }, + { + "epoch": 1.38, + "learning_rate": 9.346252226163029e-05, + "loss": 0.0077, + "step": 272920 + }, + { + "epoch": 1.38, + "learning_rate": 9.345495456861627e-05, + "loss": 0.0068, + "step": 272930 + }, + { + "epoch": 1.38, + "learning_rate": 9.344738687560226e-05, + "loss": 0.007, + "step": 272940 + }, + { + "epoch": 1.38, + "learning_rate": 9.343981918258824e-05, + "loss": 0.0072, + "step": 272950 + }, + { + "epoch": 1.38, + "learning_rate": 9.343225148957424e-05, + "loss": 0.0077, + "step": 272960 + }, + { + "epoch": 1.38, + "learning_rate": 9.342468379656023e-05, + "loss": 0.0072, + "step": 272970 + }, + { + "epoch": 1.38, + "learning_rate": 9.341711610354621e-05, + "loss": 0.0084, + "step": 272980 + }, + { + "epoch": 1.38, + "learning_rate": 9.340954841053221e-05, + "loss": 0.0084, + "step": 272990 + }, + { + "epoch": 1.38, + "learning_rate": 9.34019807175182e-05, + "loss": 0.008, + "step": 273000 + }, + { + "epoch": 1.38, + "eval_cer": 0.9144256176813937, + "eval_loss": 0.005903230048716068, + "eval_runtime": 116.3214, + "eval_samples_per_second": 17.194, + "eval_steps_per_second": 4.298, + "step": 273000 + }, + { + "epoch": 1.38, + "learning_rate": 9.339441302450419e-05, + "loss": 0.0064, + "step": 273010 + }, + { + "epoch": 1.38, + "learning_rate": 9.338684533149018e-05, + "loss": 0.0092, + "step": 273020 + }, + { + "epoch": 1.38, + "learning_rate": 9.337927763847616e-05, + "loss": 0.0106, + "step": 273030 + }, + { + "epoch": 1.38, + "learning_rate": 9.337170994546216e-05, + "loss": 0.0071, + "step": 273040 + }, + { + "epoch": 1.38, + "learning_rate": 9.336414225244815e-05, + "loss": 0.0089, + "step": 273050 + }, + { + "epoch": 1.38, + "learning_rate": 9.335657455943412e-05, + "loss": 0.0078, + "step": 273060 + }, + { + "epoch": 1.38, + "learning_rate": 9.334900686642012e-05, + "loss": 0.0094, + "step": 273070 + }, + { + "epoch": 1.38, + "learning_rate": 9.33414391734061e-05, + "loss": 0.0096, + "step": 273080 + }, + { + "epoch": 1.38, + "learning_rate": 9.333387148039209e-05, + "loss": 0.0079, + "step": 273090 + }, + { + "epoch": 1.38, + "learning_rate": 9.332630378737809e-05, + "loss": 0.0095, + "step": 273100 + }, + { + "epoch": 1.38, + "learning_rate": 9.331873609436407e-05, + "loss": 0.0078, + "step": 273110 + }, + { + "epoch": 1.38, + "learning_rate": 9.331116840135006e-05, + "loss": 0.0068, + "step": 273120 + }, + { + "epoch": 1.38, + "learning_rate": 9.330360070833606e-05, + "loss": 0.0071, + "step": 273130 + }, + { + "epoch": 1.38, + "learning_rate": 9.329603301532204e-05, + "loss": 0.0081, + "step": 273140 + }, + { + "epoch": 1.38, + "learning_rate": 9.328846532230803e-05, + "loss": 0.0064, + "step": 273150 + }, + { + "epoch": 1.38, + "learning_rate": 9.328089762929402e-05, + "loss": 0.009, + "step": 273160 + }, + { + "epoch": 1.38, + "learning_rate": 9.327332993628001e-05, + "loss": 0.009, + "step": 273170 + }, + { + "epoch": 1.38, + "learning_rate": 9.3265762243266e-05, + "loss": 0.0086, + "step": 273180 + }, + { + "epoch": 1.38, + "learning_rate": 9.325819455025199e-05, + "loss": 0.0071, + "step": 273190 + }, + { + "epoch": 1.38, + "learning_rate": 9.325062685723798e-05, + "loss": 0.0079, + "step": 273200 + }, + { + "epoch": 1.38, + "learning_rate": 9.324305916422398e-05, + "loss": 0.0075, + "step": 273210 + }, + { + "epoch": 1.38, + "learning_rate": 9.323549147120996e-05, + "loss": 0.0088, + "step": 273220 + }, + { + "epoch": 1.38, + "learning_rate": 9.322792377819595e-05, + "loss": 0.0063, + "step": 273230 + }, + { + "epoch": 1.38, + "learning_rate": 9.322035608518194e-05, + "loss": 0.0077, + "step": 273240 + }, + { + "epoch": 1.38, + "learning_rate": 9.321278839216793e-05, + "loss": 0.0092, + "step": 273250 + }, + { + "epoch": 1.38, + "learning_rate": 9.320522069915393e-05, + "loss": 0.0082, + "step": 273260 + }, + { + "epoch": 1.38, + "learning_rate": 9.31976530061399e-05, + "loss": 0.0068, + "step": 273270 + }, + { + "epoch": 1.38, + "learning_rate": 9.31900853131259e-05, + "loss": 0.0071, + "step": 273280 + }, + { + "epoch": 1.38, + "learning_rate": 9.31825176201119e-05, + "loss": 0.0058, + "step": 273290 + }, + { + "epoch": 1.38, + "learning_rate": 9.317494992709788e-05, + "loss": 0.0077, + "step": 273300 + }, + { + "epoch": 1.38, + "learning_rate": 9.316738223408387e-05, + "loss": 0.0089, + "step": 273310 + }, + { + "epoch": 1.38, + "learning_rate": 9.315981454106985e-05, + "loss": 0.0059, + "step": 273320 + }, + { + "epoch": 1.38, + "learning_rate": 9.315224684805585e-05, + "loss": 0.0069, + "step": 273330 + }, + { + "epoch": 1.38, + "learning_rate": 9.314467915504184e-05, + "loss": 0.0072, + "step": 273340 + }, + { + "epoch": 1.38, + "learning_rate": 9.313711146202783e-05, + "loss": 0.0094, + "step": 273350 + }, + { + "epoch": 1.38, + "learning_rate": 9.312954376901382e-05, + "loss": 0.0096, + "step": 273360 + }, + { + "epoch": 1.38, + "learning_rate": 9.312197607599982e-05, + "loss": 0.0047, + "step": 273370 + }, + { + "epoch": 1.38, + "learning_rate": 9.31144083829858e-05, + "loss": 0.0077, + "step": 273380 + }, + { + "epoch": 1.38, + "learning_rate": 9.310684068997179e-05, + "loss": 0.0069, + "step": 273390 + }, + { + "epoch": 1.38, + "learning_rate": 9.309927299695777e-05, + "loss": 0.0081, + "step": 273400 + }, + { + "epoch": 1.38, + "learning_rate": 9.309170530394377e-05, + "loss": 0.0089, + "step": 273410 + }, + { + "epoch": 1.38, + "learning_rate": 9.308413761092976e-05, + "loss": 0.007, + "step": 273420 + }, + { + "epoch": 1.38, + "learning_rate": 9.307656991791575e-05, + "loss": 0.0067, + "step": 273430 + }, + { + "epoch": 1.38, + "learning_rate": 9.306900222490174e-05, + "loss": 0.0077, + "step": 273440 + }, + { + "epoch": 1.38, + "learning_rate": 9.306143453188774e-05, + "loss": 0.0075, + "step": 273450 + }, + { + "epoch": 1.38, + "learning_rate": 9.305386683887372e-05, + "loss": 0.0076, + "step": 273460 + }, + { + "epoch": 1.38, + "learning_rate": 9.304629914585971e-05, + "loss": 0.0085, + "step": 273470 + }, + { + "epoch": 1.38, + "learning_rate": 9.303873145284569e-05, + "loss": 0.0079, + "step": 273480 + }, + { + "epoch": 1.38, + "learning_rate": 9.303116375983169e-05, + "loss": 0.007, + "step": 273490 + }, + { + "epoch": 1.38, + "learning_rate": 9.302359606681768e-05, + "loss": 0.0117, + "step": 273500 + }, + { + "epoch": 1.38, + "learning_rate": 9.301602837380366e-05, + "loss": 0.0087, + "step": 273510 + }, + { + "epoch": 1.38, + "learning_rate": 9.300846068078966e-05, + "loss": 0.0091, + "step": 273520 + }, + { + "epoch": 1.38, + "learning_rate": 9.300089298777565e-05, + "loss": 0.0072, + "step": 273530 + }, + { + "epoch": 1.38, + "learning_rate": 9.299332529476164e-05, + "loss": 0.0056, + "step": 273540 + }, + { + "epoch": 1.38, + "learning_rate": 9.298575760174763e-05, + "loss": 0.0063, + "step": 273550 + }, + { + "epoch": 1.38, + "learning_rate": 9.297818990873361e-05, + "loss": 0.0069, + "step": 273560 + }, + { + "epoch": 1.38, + "learning_rate": 9.297062221571961e-05, + "loss": 0.0079, + "step": 273570 + }, + { + "epoch": 1.38, + "learning_rate": 9.29630545227056e-05, + "loss": 0.0087, + "step": 273580 + }, + { + "epoch": 1.38, + "learning_rate": 9.295548682969158e-05, + "loss": 0.0075, + "step": 273590 + }, + { + "epoch": 1.38, + "learning_rate": 9.294791913667758e-05, + "loss": 0.0083, + "step": 273600 + }, + { + "epoch": 1.38, + "learning_rate": 9.294035144366357e-05, + "loss": 0.0074, + "step": 273610 + }, + { + "epoch": 1.38, + "learning_rate": 9.293278375064956e-05, + "loss": 0.0096, + "step": 273620 + }, + { + "epoch": 1.38, + "learning_rate": 9.292521605763555e-05, + "loss": 0.0082, + "step": 273630 + }, + { + "epoch": 1.38, + "learning_rate": 9.291764836462155e-05, + "loss": 0.0089, + "step": 273640 + }, + { + "epoch": 1.38, + "learning_rate": 9.291008067160753e-05, + "loss": 0.0084, + "step": 273650 + }, + { + "epoch": 1.38, + "learning_rate": 9.290251297859352e-05, + "loss": 0.0084, + "step": 273660 + }, + { + "epoch": 1.38, + "learning_rate": 9.28949452855795e-05, + "loss": 0.0074, + "step": 273670 + }, + { + "epoch": 1.38, + "learning_rate": 9.28873775925655e-05, + "loss": 0.0092, + "step": 273680 + }, + { + "epoch": 1.38, + "learning_rate": 9.287980989955147e-05, + "loss": 0.0077, + "step": 273690 + }, + { + "epoch": 1.38, + "learning_rate": 9.287224220653746e-05, + "loss": 0.0074, + "step": 273700 + }, + { + "epoch": 1.38, + "learning_rate": 9.286467451352346e-05, + "loss": 0.0059, + "step": 273710 + }, + { + "epoch": 1.38, + "learning_rate": 9.285710682050944e-05, + "loss": 0.0105, + "step": 273720 + }, + { + "epoch": 1.38, + "learning_rate": 9.284953912749543e-05, + "loss": 0.0079, + "step": 273730 + }, + { + "epoch": 1.38, + "learning_rate": 9.284197143448143e-05, + "loss": 0.0083, + "step": 273740 + }, + { + "epoch": 1.38, + "learning_rate": 9.283440374146741e-05, + "loss": 0.0091, + "step": 273750 + }, + { + "epoch": 1.38, + "learning_rate": 9.28268360484534e-05, + "loss": 0.0071, + "step": 273760 + }, + { + "epoch": 1.38, + "learning_rate": 9.281926835543939e-05, + "loss": 0.0085, + "step": 273770 + }, + { + "epoch": 1.38, + "learning_rate": 9.281170066242538e-05, + "loss": 0.0087, + "step": 273780 + }, + { + "epoch": 1.38, + "learning_rate": 9.280413296941138e-05, + "loss": 0.0084, + "step": 273790 + }, + { + "epoch": 1.38, + "learning_rate": 9.279656527639736e-05, + "loss": 0.0074, + "step": 273800 + }, + { + "epoch": 1.38, + "learning_rate": 9.278899758338335e-05, + "loss": 0.0109, + "step": 273810 + }, + { + "epoch": 1.38, + "learning_rate": 9.278142989036935e-05, + "loss": 0.0089, + "step": 273820 + }, + { + "epoch": 1.38, + "learning_rate": 9.277386219735533e-05, + "loss": 0.0079, + "step": 273830 + }, + { + "epoch": 1.38, + "learning_rate": 9.276629450434132e-05, + "loss": 0.0094, + "step": 273840 + }, + { + "epoch": 1.38, + "learning_rate": 9.27587268113273e-05, + "loss": 0.0089, + "step": 273850 + }, + { + "epoch": 1.38, + "learning_rate": 9.27511591183133e-05, + "loss": 0.0064, + "step": 273860 + }, + { + "epoch": 1.38, + "learning_rate": 9.27435914252993e-05, + "loss": 0.0079, + "step": 273870 + }, + { + "epoch": 1.38, + "learning_rate": 9.273602373228528e-05, + "loss": 0.0088, + "step": 273880 + }, + { + "epoch": 1.38, + "learning_rate": 9.272845603927127e-05, + "loss": 0.0091, + "step": 273890 + }, + { + "epoch": 1.38, + "learning_rate": 9.272088834625727e-05, + "loss": 0.0071, + "step": 273900 + }, + { + "epoch": 1.38, + "learning_rate": 9.271332065324325e-05, + "loss": 0.0075, + "step": 273910 + }, + { + "epoch": 1.38, + "learning_rate": 9.270575296022924e-05, + "loss": 0.006, + "step": 273920 + }, + { + "epoch": 1.38, + "learning_rate": 9.269818526721522e-05, + "loss": 0.007, + "step": 273930 + }, + { + "epoch": 1.38, + "learning_rate": 9.269061757420122e-05, + "loss": 0.0062, + "step": 273940 + }, + { + "epoch": 1.38, + "learning_rate": 9.268304988118721e-05, + "loss": 0.0068, + "step": 273950 + }, + { + "epoch": 1.38, + "learning_rate": 9.26754821881732e-05, + "loss": 0.0064, + "step": 273960 + }, + { + "epoch": 1.38, + "learning_rate": 9.266791449515919e-05, + "loss": 0.0055, + "step": 273970 + }, + { + "epoch": 1.38, + "learning_rate": 9.266034680214519e-05, + "loss": 0.0063, + "step": 273980 + }, + { + "epoch": 1.38, + "learning_rate": 9.265277910913117e-05, + "loss": 0.0087, + "step": 273990 + }, + { + "epoch": 1.38, + "learning_rate": 9.264521141611716e-05, + "loss": 0.0063, + "step": 274000 + }, + { + "epoch": 1.38, + "eval_cer": 0.9144392032271493, + "eval_loss": 0.005893085617572069, + "eval_runtime": 116.3239, + "eval_samples_per_second": 17.193, + "eval_steps_per_second": 4.298, + "step": 274000 + }, + { + "epoch": 1.38, + "learning_rate": 9.263764372310314e-05, + "loss": 0.005, + "step": 274010 + }, + { + "epoch": 1.38, + "learning_rate": 9.263007603008914e-05, + "loss": 0.0073, + "step": 274020 + }, + { + "epoch": 1.38, + "learning_rate": 9.262250833707513e-05, + "loss": 0.0083, + "step": 274030 + }, + { + "epoch": 1.38, + "learning_rate": 9.261494064406111e-05, + "loss": 0.0101, + "step": 274040 + }, + { + "epoch": 1.38, + "learning_rate": 9.260737295104711e-05, + "loss": 0.0059, + "step": 274050 + }, + { + "epoch": 1.38, + "learning_rate": 9.25998052580331e-05, + "loss": 0.0083, + "step": 274060 + }, + { + "epoch": 1.38, + "learning_rate": 9.259223756501909e-05, + "loss": 0.0075, + "step": 274070 + }, + { + "epoch": 1.38, + "learning_rate": 9.258466987200508e-05, + "loss": 0.0155, + "step": 274080 + }, + { + "epoch": 1.38, + "learning_rate": 9.257710217899108e-05, + "loss": 0.0085, + "step": 274090 + }, + { + "epoch": 1.38, + "learning_rate": 9.256953448597706e-05, + "loss": 0.0081, + "step": 274100 + }, + { + "epoch": 1.38, + "learning_rate": 9.256196679296305e-05, + "loss": 0.0065, + "step": 274110 + }, + { + "epoch": 1.38, + "learning_rate": 9.255439909994903e-05, + "loss": 0.01, + "step": 274120 + }, + { + "epoch": 1.38, + "learning_rate": 9.254683140693503e-05, + "loss": 0.0083, + "step": 274130 + }, + { + "epoch": 1.38, + "learning_rate": 9.253926371392102e-05, + "loss": 0.0069, + "step": 274140 + }, + { + "epoch": 1.38, + "learning_rate": 9.2531696020907e-05, + "loss": 0.0068, + "step": 274150 + }, + { + "epoch": 1.38, + "learning_rate": 9.2524128327893e-05, + "loss": 0.007, + "step": 274160 + }, + { + "epoch": 1.38, + "learning_rate": 9.2516560634879e-05, + "loss": 0.0096, + "step": 274170 + }, + { + "epoch": 1.38, + "learning_rate": 9.250899294186498e-05, + "loss": 0.0076, + "step": 274180 + }, + { + "epoch": 1.38, + "learning_rate": 9.250142524885097e-05, + "loss": 0.0089, + "step": 274190 + }, + { + "epoch": 1.38, + "learning_rate": 9.249385755583695e-05, + "loss": 0.0082, + "step": 274200 + }, + { + "epoch": 1.38, + "learning_rate": 9.248628986282295e-05, + "loss": 0.0074, + "step": 274210 + }, + { + "epoch": 1.38, + "learning_rate": 9.247872216980894e-05, + "loss": 0.0074, + "step": 274220 + }, + { + "epoch": 1.38, + "learning_rate": 9.247115447679492e-05, + "loss": 0.0075, + "step": 274230 + }, + { + "epoch": 1.38, + "learning_rate": 9.246358678378092e-05, + "loss": 0.0085, + "step": 274240 + }, + { + "epoch": 1.38, + "learning_rate": 9.245601909076691e-05, + "loss": 0.0087, + "step": 274250 + }, + { + "epoch": 1.38, + "learning_rate": 9.24484513977529e-05, + "loss": 0.0078, + "step": 274260 + }, + { + "epoch": 1.38, + "learning_rate": 9.244088370473889e-05, + "loss": 0.0086, + "step": 274270 + }, + { + "epoch": 1.38, + "learning_rate": 9.243331601172487e-05, + "loss": 0.0117, + "step": 274280 + }, + { + "epoch": 1.38, + "learning_rate": 9.242574831871087e-05, + "loss": 0.0084, + "step": 274290 + }, + { + "epoch": 1.38, + "learning_rate": 9.241818062569686e-05, + "loss": 0.0077, + "step": 274300 + }, + { + "epoch": 1.38, + "learning_rate": 9.241061293268284e-05, + "loss": 0.0069, + "step": 274310 + }, + { + "epoch": 1.38, + "learning_rate": 9.240304523966883e-05, + "loss": 0.0099, + "step": 274320 + }, + { + "epoch": 1.38, + "learning_rate": 9.239547754665481e-05, + "loss": 0.0086, + "step": 274330 + }, + { + "epoch": 1.38, + "learning_rate": 9.23879098536408e-05, + "loss": 0.0081, + "step": 274340 + }, + { + "epoch": 1.38, + "learning_rate": 9.23803421606268e-05, + "loss": 0.0064, + "step": 274350 + }, + { + "epoch": 1.38, + "learning_rate": 9.237277446761278e-05, + "loss": 0.011, + "step": 274360 + }, + { + "epoch": 1.38, + "learning_rate": 9.236520677459877e-05, + "loss": 0.0071, + "step": 274370 + }, + { + "epoch": 1.38, + "learning_rate": 9.235763908158475e-05, + "loss": 0.0081, + "step": 274380 + }, + { + "epoch": 1.38, + "learning_rate": 9.235007138857075e-05, + "loss": 0.0097, + "step": 274390 + }, + { + "epoch": 1.38, + "learning_rate": 9.234250369555674e-05, + "loss": 0.0087, + "step": 274400 + }, + { + "epoch": 1.38, + "learning_rate": 9.233493600254273e-05, + "loss": 0.006, + "step": 274410 + }, + { + "epoch": 1.38, + "learning_rate": 9.232736830952872e-05, + "loss": 0.0097, + "step": 274420 + }, + { + "epoch": 1.38, + "learning_rate": 9.231980061651472e-05, + "loss": 0.0087, + "step": 274430 + }, + { + "epoch": 1.38, + "learning_rate": 9.23122329235007e-05, + "loss": 0.0083, + "step": 274440 + }, + { + "epoch": 1.38, + "learning_rate": 9.230466523048669e-05, + "loss": 0.0096, + "step": 274450 + }, + { + "epoch": 1.38, + "learning_rate": 9.229709753747267e-05, + "loss": 0.0078, + "step": 274460 + }, + { + "epoch": 1.38, + "learning_rate": 9.228952984445867e-05, + "loss": 0.0051, + "step": 274470 + }, + { + "epoch": 1.38, + "learning_rate": 9.228196215144466e-05, + "loss": 0.0083, + "step": 274480 + }, + { + "epoch": 1.38, + "learning_rate": 9.227439445843065e-05, + "loss": 0.0075, + "step": 274490 + }, + { + "epoch": 1.38, + "learning_rate": 9.226682676541664e-05, + "loss": 0.0085, + "step": 274500 + }, + { + "epoch": 1.38, + "learning_rate": 9.225925907240264e-05, + "loss": 0.0061, + "step": 274510 + }, + { + "epoch": 1.38, + "learning_rate": 9.225169137938862e-05, + "loss": 0.0071, + "step": 274520 + }, + { + "epoch": 1.39, + "learning_rate": 9.224412368637461e-05, + "loss": 0.0066, + "step": 274530 + }, + { + "epoch": 1.39, + "learning_rate": 9.223655599336061e-05, + "loss": 0.0066, + "step": 274540 + }, + { + "epoch": 1.39, + "learning_rate": 9.222898830034659e-05, + "loss": 0.0072, + "step": 274550 + }, + { + "epoch": 1.39, + "learning_rate": 9.222142060733258e-05, + "loss": 0.0098, + "step": 274560 + }, + { + "epoch": 1.39, + "learning_rate": 9.221385291431856e-05, + "loss": 0.0073, + "step": 274570 + }, + { + "epoch": 1.39, + "learning_rate": 9.220628522130456e-05, + "loss": 0.0073, + "step": 274580 + }, + { + "epoch": 1.39, + "learning_rate": 9.219871752829055e-05, + "loss": 0.0083, + "step": 274590 + }, + { + "epoch": 1.39, + "learning_rate": 9.219114983527654e-05, + "loss": 0.007, + "step": 274600 + }, + { + "epoch": 1.39, + "learning_rate": 9.218358214226253e-05, + "loss": 0.009, + "step": 274610 + }, + { + "epoch": 1.39, + "learning_rate": 9.217601444924853e-05, + "loss": 0.0087, + "step": 274620 + }, + { + "epoch": 1.39, + "learning_rate": 9.216844675623451e-05, + "loss": 0.0063, + "step": 274630 + }, + { + "epoch": 1.39, + "learning_rate": 9.21608790632205e-05, + "loss": 0.0066, + "step": 274640 + }, + { + "epoch": 1.39, + "learning_rate": 9.215331137020648e-05, + "loss": 0.0061, + "step": 274650 + }, + { + "epoch": 1.39, + "learning_rate": 9.214574367719248e-05, + "loss": 0.0116, + "step": 274660 + }, + { + "epoch": 1.39, + "learning_rate": 9.213817598417847e-05, + "loss": 0.0063, + "step": 274670 + }, + { + "epoch": 1.39, + "learning_rate": 9.213060829116446e-05, + "loss": 0.0069, + "step": 274680 + }, + { + "epoch": 1.39, + "learning_rate": 9.212304059815045e-05, + "loss": 0.0085, + "step": 274690 + }, + { + "epoch": 1.39, + "learning_rate": 9.211547290513645e-05, + "loss": 0.0107, + "step": 274700 + }, + { + "epoch": 1.39, + "learning_rate": 9.210790521212243e-05, + "loss": 0.0087, + "step": 274710 + }, + { + "epoch": 1.39, + "learning_rate": 9.210033751910842e-05, + "loss": 0.0091, + "step": 274720 + }, + { + "epoch": 1.39, + "learning_rate": 9.20927698260944e-05, + "loss": 0.007, + "step": 274730 + }, + { + "epoch": 1.39, + "learning_rate": 9.20852021330804e-05, + "loss": 0.0074, + "step": 274740 + }, + { + "epoch": 1.39, + "learning_rate": 9.20776344400664e-05, + "loss": 0.0076, + "step": 274750 + }, + { + "epoch": 1.39, + "learning_rate": 9.207006674705237e-05, + "loss": 0.007, + "step": 274760 + }, + { + "epoch": 1.39, + "learning_rate": 9.206249905403837e-05, + "loss": 0.008, + "step": 274770 + }, + { + "epoch": 1.39, + "learning_rate": 9.205493136102436e-05, + "loss": 0.0072, + "step": 274780 + }, + { + "epoch": 1.39, + "learning_rate": 9.204736366801035e-05, + "loss": 0.008, + "step": 274790 + }, + { + "epoch": 1.39, + "learning_rate": 9.203979597499634e-05, + "loss": 0.0075, + "step": 274800 + }, + { + "epoch": 1.39, + "learning_rate": 9.203222828198232e-05, + "loss": 0.0087, + "step": 274810 + }, + { + "epoch": 1.39, + "learning_rate": 9.202466058896832e-05, + "loss": 0.0072, + "step": 274820 + }, + { + "epoch": 1.39, + "learning_rate": 9.201709289595431e-05, + "loss": 0.0056, + "step": 274830 + }, + { + "epoch": 1.39, + "learning_rate": 9.20095252029403e-05, + "loss": 0.0086, + "step": 274840 + }, + { + "epoch": 1.39, + "learning_rate": 9.200195750992629e-05, + "loss": 0.0078, + "step": 274850 + }, + { + "epoch": 1.39, + "learning_rate": 9.199438981691228e-05, + "loss": 0.0084, + "step": 274860 + }, + { + "epoch": 1.39, + "learning_rate": 9.198682212389827e-05, + "loss": 0.0085, + "step": 274870 + }, + { + "epoch": 1.39, + "learning_rate": 9.197925443088426e-05, + "loss": 0.008, + "step": 274880 + }, + { + "epoch": 1.39, + "learning_rate": 9.197168673787024e-05, + "loss": 0.0087, + "step": 274890 + }, + { + "epoch": 1.39, + "learning_rate": 9.196411904485624e-05, + "loss": 0.0097, + "step": 274900 + }, + { + "epoch": 1.39, + "learning_rate": 9.195655135184223e-05, + "loss": 0.0067, + "step": 274910 + }, + { + "epoch": 1.39, + "learning_rate": 9.194898365882821e-05, + "loss": 0.0095, + "step": 274920 + }, + { + "epoch": 1.39, + "learning_rate": 9.194141596581421e-05, + "loss": 0.0104, + "step": 274930 + }, + { + "epoch": 1.39, + "learning_rate": 9.19338482728002e-05, + "loss": 0.006, + "step": 274940 + }, + { + "epoch": 1.39, + "learning_rate": 9.192628057978617e-05, + "loss": 0.0074, + "step": 274950 + }, + { + "epoch": 1.39, + "learning_rate": 9.191871288677217e-05, + "loss": 0.0066, + "step": 274960 + }, + { + "epoch": 1.39, + "learning_rate": 9.191114519375815e-05, + "loss": 0.0074, + "step": 274970 + }, + { + "epoch": 1.39, + "learning_rate": 9.190357750074414e-05, + "loss": 0.0072, + "step": 274980 + }, + { + "epoch": 1.39, + "learning_rate": 9.189600980773014e-05, + "loss": 0.0077, + "step": 274990 + }, + { + "epoch": 1.39, + "learning_rate": 9.188844211471612e-05, + "loss": 0.0088, + "step": 275000 + }, + { + "epoch": 1.39, + "eval_cer": 0.9144459960000272, + "eval_loss": 0.005970404949039221, + "eval_runtime": 116.7373, + "eval_samples_per_second": 17.132, + "eval_steps_per_second": 4.283, + "step": 275000 + }, + { + "epoch": 1.39, + "learning_rate": 9.188087442170211e-05, + "loss": 0.0106, + "step": 275010 + }, + { + "epoch": 1.39, + "learning_rate": 9.18733067286881e-05, + "loss": 0.0089, + "step": 275020 + }, + { + "epoch": 1.39, + "learning_rate": 9.186573903567409e-05, + "loss": 0.0075, + "step": 275030 + }, + { + "epoch": 1.39, + "learning_rate": 9.185817134266009e-05, + "loss": 0.0061, + "step": 275040 + }, + { + "epoch": 1.39, + "learning_rate": 9.185060364964607e-05, + "loss": 0.0067, + "step": 275050 + }, + { + "epoch": 1.39, + "learning_rate": 9.184303595663206e-05, + "loss": 0.0075, + "step": 275060 + }, + { + "epoch": 1.39, + "learning_rate": 9.183546826361806e-05, + "loss": 0.0072, + "step": 275070 + }, + { + "epoch": 1.39, + "learning_rate": 9.182790057060404e-05, + "loss": 0.0077, + "step": 275080 + }, + { + "epoch": 1.39, + "learning_rate": 9.182033287759003e-05, + "loss": 0.0062, + "step": 275090 + }, + { + "epoch": 1.39, + "learning_rate": 9.181276518457601e-05, + "loss": 0.0077, + "step": 275100 + }, + { + "epoch": 1.39, + "learning_rate": 9.180519749156201e-05, + "loss": 0.0062, + "step": 275110 + }, + { + "epoch": 1.39, + "learning_rate": 9.1797629798548e-05, + "loss": 0.0079, + "step": 275120 + }, + { + "epoch": 1.39, + "learning_rate": 9.179006210553399e-05, + "loss": 0.0115, + "step": 275130 + }, + { + "epoch": 1.39, + "learning_rate": 9.178249441251998e-05, + "loss": 0.0108, + "step": 275140 + }, + { + "epoch": 1.39, + "learning_rate": 9.177492671950598e-05, + "loss": 0.0073, + "step": 275150 + }, + { + "epoch": 1.39, + "learning_rate": 9.176735902649196e-05, + "loss": 0.0085, + "step": 275160 + }, + { + "epoch": 1.39, + "learning_rate": 9.175979133347795e-05, + "loss": 0.0111, + "step": 275170 + }, + { + "epoch": 1.39, + "learning_rate": 9.175222364046393e-05, + "loss": 0.0105, + "step": 275180 + }, + { + "epoch": 1.39, + "learning_rate": 9.174465594744993e-05, + "loss": 0.0073, + "step": 275190 + }, + { + "epoch": 1.39, + "learning_rate": 9.173708825443592e-05, + "loss": 0.0091, + "step": 275200 + }, + { + "epoch": 1.39, + "learning_rate": 9.17295205614219e-05, + "loss": 0.008, + "step": 275210 + }, + { + "epoch": 1.39, + "learning_rate": 9.17219528684079e-05, + "loss": 0.0051, + "step": 275220 + }, + { + "epoch": 1.39, + "learning_rate": 9.17143851753939e-05, + "loss": 0.0074, + "step": 275230 + }, + { + "epoch": 1.39, + "learning_rate": 9.170681748237988e-05, + "loss": 0.007, + "step": 275240 + }, + { + "epoch": 1.39, + "learning_rate": 9.169924978936587e-05, + "loss": 0.0097, + "step": 275250 + }, + { + "epoch": 1.39, + "learning_rate": 9.169168209635185e-05, + "loss": 0.0075, + "step": 275260 + }, + { + "epoch": 1.39, + "learning_rate": 9.168411440333785e-05, + "loss": 0.008, + "step": 275270 + }, + { + "epoch": 1.39, + "learning_rate": 9.167654671032384e-05, + "loss": 0.0059, + "step": 275280 + }, + { + "epoch": 1.39, + "learning_rate": 9.166897901730982e-05, + "loss": 0.0047, + "step": 275290 + }, + { + "epoch": 1.39, + "learning_rate": 9.166141132429582e-05, + "loss": 0.0081, + "step": 275300 + }, + { + "epoch": 1.39, + "learning_rate": 9.165384363128181e-05, + "loss": 0.0081, + "step": 275310 + }, + { + "epoch": 1.39, + "learning_rate": 9.16462759382678e-05, + "loss": 0.0101, + "step": 275320 + }, + { + "epoch": 1.39, + "learning_rate": 9.163870824525379e-05, + "loss": 0.0071, + "step": 275330 + }, + { + "epoch": 1.39, + "learning_rate": 9.163114055223977e-05, + "loss": 0.0074, + "step": 275340 + }, + { + "epoch": 1.39, + "learning_rate": 9.162357285922577e-05, + "loss": 0.009, + "step": 275350 + }, + { + "epoch": 1.39, + "learning_rate": 9.161600516621176e-05, + "loss": 0.0082, + "step": 275360 + }, + { + "epoch": 1.39, + "learning_rate": 9.160843747319774e-05, + "loss": 0.0074, + "step": 275370 + }, + { + "epoch": 1.39, + "learning_rate": 9.160086978018374e-05, + "loss": 0.0071, + "step": 275380 + }, + { + "epoch": 1.39, + "learning_rate": 9.159330208716973e-05, + "loss": 0.0094, + "step": 275390 + }, + { + "epoch": 1.39, + "learning_rate": 9.158573439415572e-05, + "loss": 0.0085, + "step": 275400 + }, + { + "epoch": 1.39, + "learning_rate": 9.157816670114171e-05, + "loss": 0.0069, + "step": 275410 + }, + { + "epoch": 1.39, + "learning_rate": 9.157059900812769e-05, + "loss": 0.0078, + "step": 275420 + }, + { + "epoch": 1.39, + "learning_rate": 9.156303131511369e-05, + "loss": 0.0096, + "step": 275430 + }, + { + "epoch": 1.39, + "learning_rate": 9.155546362209968e-05, + "loss": 0.0082, + "step": 275440 + }, + { + "epoch": 1.39, + "learning_rate": 9.154789592908566e-05, + "loss": 0.0068, + "step": 275450 + }, + { + "epoch": 1.39, + "learning_rate": 9.154032823607166e-05, + "loss": 0.007, + "step": 275460 + }, + { + "epoch": 1.39, + "learning_rate": 9.153276054305765e-05, + "loss": 0.0097, + "step": 275470 + }, + { + "epoch": 1.39, + "learning_rate": 9.152519285004363e-05, + "loss": 0.0078, + "step": 275480 + }, + { + "epoch": 1.39, + "learning_rate": 9.151762515702963e-05, + "loss": 0.0117, + "step": 275490 + }, + { + "epoch": 1.39, + "learning_rate": 9.151005746401561e-05, + "loss": 0.0085, + "step": 275500 + }, + { + "epoch": 1.39, + "learning_rate": 9.15024897710016e-05, + "loss": 0.0064, + "step": 275510 + }, + { + "epoch": 1.39, + "learning_rate": 9.14949220779876e-05, + "loss": 0.009, + "step": 275520 + }, + { + "epoch": 1.39, + "learning_rate": 9.148735438497358e-05, + "loss": 0.0085, + "step": 275530 + }, + { + "epoch": 1.39, + "learning_rate": 9.147978669195958e-05, + "loss": 0.0081, + "step": 275540 + }, + { + "epoch": 1.39, + "learning_rate": 9.147221899894557e-05, + "loss": 0.0066, + "step": 275550 + }, + { + "epoch": 1.39, + "learning_rate": 9.146465130593155e-05, + "loss": 0.0073, + "step": 275560 + }, + { + "epoch": 1.39, + "learning_rate": 9.145708361291755e-05, + "loss": 0.0081, + "step": 275570 + }, + { + "epoch": 1.39, + "learning_rate": 9.144951591990352e-05, + "loss": 0.009, + "step": 275580 + }, + { + "epoch": 1.39, + "learning_rate": 9.144194822688951e-05, + "loss": 0.0093, + "step": 275590 + }, + { + "epoch": 1.39, + "learning_rate": 9.143438053387551e-05, + "loss": 0.0077, + "step": 275600 + }, + { + "epoch": 1.39, + "learning_rate": 9.142681284086149e-05, + "loss": 0.0091, + "step": 275610 + }, + { + "epoch": 1.39, + "learning_rate": 9.141924514784748e-05, + "loss": 0.0078, + "step": 275620 + }, + { + "epoch": 1.39, + "learning_rate": 9.141167745483347e-05, + "loss": 0.006, + "step": 275630 + }, + { + "epoch": 1.39, + "learning_rate": 9.140410976181946e-05, + "loss": 0.0066, + "step": 275640 + }, + { + "epoch": 1.39, + "learning_rate": 9.139654206880546e-05, + "loss": 0.0082, + "step": 275650 + }, + { + "epoch": 1.39, + "learning_rate": 9.138897437579144e-05, + "loss": 0.0071, + "step": 275660 + }, + { + "epoch": 1.39, + "learning_rate": 9.138140668277743e-05, + "loss": 0.0107, + "step": 275670 + }, + { + "epoch": 1.39, + "learning_rate": 9.137383898976343e-05, + "loss": 0.0103, + "step": 275680 + }, + { + "epoch": 1.39, + "learning_rate": 9.136627129674941e-05, + "loss": 0.0091, + "step": 275690 + }, + { + "epoch": 1.39, + "learning_rate": 9.13587036037354e-05, + "loss": 0.0083, + "step": 275700 + }, + { + "epoch": 1.39, + "learning_rate": 9.135113591072138e-05, + "loss": 0.0082, + "step": 275710 + }, + { + "epoch": 1.39, + "learning_rate": 9.134356821770738e-05, + "loss": 0.0095, + "step": 275720 + }, + { + "epoch": 1.39, + "learning_rate": 9.133600052469337e-05, + "loss": 0.0103, + "step": 275730 + }, + { + "epoch": 1.39, + "learning_rate": 9.132843283167936e-05, + "loss": 0.0112, + "step": 275740 + }, + { + "epoch": 1.39, + "learning_rate": 9.132086513866535e-05, + "loss": 0.0059, + "step": 275750 + }, + { + "epoch": 1.39, + "learning_rate": 9.131329744565135e-05, + "loss": 0.01, + "step": 275760 + }, + { + "epoch": 1.39, + "learning_rate": 9.130572975263733e-05, + "loss": 0.0091, + "step": 275770 + }, + { + "epoch": 1.39, + "learning_rate": 9.129816205962332e-05, + "loss": 0.0085, + "step": 275780 + }, + { + "epoch": 1.39, + "learning_rate": 9.12905943666093e-05, + "loss": 0.007, + "step": 275790 + }, + { + "epoch": 1.39, + "learning_rate": 9.12830266735953e-05, + "loss": 0.0058, + "step": 275800 + }, + { + "epoch": 1.39, + "learning_rate": 9.12754589805813e-05, + "loss": 0.0095, + "step": 275810 + }, + { + "epoch": 1.39, + "learning_rate": 9.126789128756728e-05, + "loss": 0.0068, + "step": 275820 + }, + { + "epoch": 1.39, + "learning_rate": 9.126032359455327e-05, + "loss": 0.0052, + "step": 275830 + }, + { + "epoch": 1.39, + "learning_rate": 9.125275590153927e-05, + "loss": 0.0089, + "step": 275840 + }, + { + "epoch": 1.39, + "learning_rate": 9.124518820852525e-05, + "loss": 0.007, + "step": 275850 + }, + { + "epoch": 1.39, + "learning_rate": 9.123762051551124e-05, + "loss": 0.0087, + "step": 275860 + }, + { + "epoch": 1.39, + "learning_rate": 9.123005282249722e-05, + "loss": 0.0083, + "step": 275870 + }, + { + "epoch": 1.39, + "learning_rate": 9.122248512948322e-05, + "loss": 0.0081, + "step": 275880 + }, + { + "epoch": 1.39, + "learning_rate": 9.121491743646921e-05, + "loss": 0.0067, + "step": 275890 + }, + { + "epoch": 1.39, + "learning_rate": 9.12073497434552e-05, + "loss": 0.0093, + "step": 275900 + }, + { + "epoch": 1.39, + "learning_rate": 9.119978205044119e-05, + "loss": 0.006, + "step": 275910 + }, + { + "epoch": 1.39, + "learning_rate": 9.119221435742718e-05, + "loss": 0.0068, + "step": 275920 + }, + { + "epoch": 1.39, + "learning_rate": 9.118464666441317e-05, + "loss": 0.008, + "step": 275930 + }, + { + "epoch": 1.39, + "learning_rate": 9.117707897139916e-05, + "loss": 0.0077, + "step": 275940 + }, + { + "epoch": 1.39, + "learning_rate": 9.116951127838514e-05, + "loss": 0.0091, + "step": 275950 + }, + { + "epoch": 1.39, + "learning_rate": 9.116194358537114e-05, + "loss": 0.0095, + "step": 275960 + }, + { + "epoch": 1.39, + "learning_rate": 9.115437589235713e-05, + "loss": 0.0101, + "step": 275970 + }, + { + "epoch": 1.39, + "learning_rate": 9.114680819934311e-05, + "loss": 0.0085, + "step": 275980 + }, + { + "epoch": 1.39, + "learning_rate": 9.113924050632911e-05, + "loss": 0.007, + "step": 275990 + }, + { + "epoch": 1.39, + "learning_rate": 9.11316728133151e-05, + "loss": 0.0081, + "step": 276000 + }, + { + "epoch": 1.39, + "eval_cer": 0.9144159137201398, + "eval_loss": 0.006024388130754232, + "eval_runtime": 116.144, + "eval_samples_per_second": 17.22, + "eval_steps_per_second": 4.305, + "step": 276000 + }, + { + "epoch": 1.39, + "learning_rate": 9.112410512030109e-05, + "loss": 0.0067, + "step": 276010 + }, + { + "epoch": 1.39, + "learning_rate": 9.111653742728708e-05, + "loss": 0.008, + "step": 276020 + }, + { + "epoch": 1.39, + "learning_rate": 9.110896973427308e-05, + "loss": 0.0073, + "step": 276030 + }, + { + "epoch": 1.39, + "learning_rate": 9.110140204125906e-05, + "loss": 0.0059, + "step": 276040 + }, + { + "epoch": 1.39, + "learning_rate": 9.109383434824505e-05, + "loss": 0.0076, + "step": 276050 + }, + { + "epoch": 1.39, + "learning_rate": 9.108626665523103e-05, + "loss": 0.0077, + "step": 276060 + }, + { + "epoch": 1.39, + "learning_rate": 9.107869896221703e-05, + "loss": 0.0095, + "step": 276070 + }, + { + "epoch": 1.39, + "learning_rate": 9.107113126920302e-05, + "loss": 0.008, + "step": 276080 + }, + { + "epoch": 1.39, + "learning_rate": 9.1063563576189e-05, + "loss": 0.0068, + "step": 276090 + }, + { + "epoch": 1.39, + "learning_rate": 9.1055995883175e-05, + "loss": 0.009, + "step": 276100 + }, + { + "epoch": 1.39, + "learning_rate": 9.1048428190161e-05, + "loss": 0.0076, + "step": 276110 + }, + { + "epoch": 1.39, + "learning_rate": 9.104086049714698e-05, + "loss": 0.008, + "step": 276120 + }, + { + "epoch": 1.39, + "learning_rate": 9.103329280413297e-05, + "loss": 0.0088, + "step": 276130 + }, + { + "epoch": 1.39, + "learning_rate": 9.102572511111895e-05, + "loss": 0.0075, + "step": 276140 + }, + { + "epoch": 1.39, + "learning_rate": 9.101815741810495e-05, + "loss": 0.0066, + "step": 276150 + }, + { + "epoch": 1.39, + "learning_rate": 9.101058972509094e-05, + "loss": 0.0072, + "step": 276160 + }, + { + "epoch": 1.39, + "learning_rate": 9.100302203207692e-05, + "loss": 0.0086, + "step": 276170 + }, + { + "epoch": 1.39, + "learning_rate": 9.099545433906292e-05, + "loss": 0.0081, + "step": 276180 + }, + { + "epoch": 1.39, + "learning_rate": 9.098788664604891e-05, + "loss": 0.0111, + "step": 276190 + }, + { + "epoch": 1.39, + "learning_rate": 9.09803189530349e-05, + "loss": 0.0076, + "step": 276200 + }, + { + "epoch": 1.39, + "learning_rate": 9.097275126002088e-05, + "loss": 0.0082, + "step": 276210 + }, + { + "epoch": 1.39, + "learning_rate": 9.096518356700686e-05, + "loss": 0.0066, + "step": 276220 + }, + { + "epoch": 1.39, + "learning_rate": 9.095761587399285e-05, + "loss": 0.006, + "step": 276230 + }, + { + "epoch": 1.39, + "learning_rate": 9.095004818097883e-05, + "loss": 0.008, + "step": 276240 + }, + { + "epoch": 1.39, + "learning_rate": 9.094248048796483e-05, + "loss": 0.0087, + "step": 276250 + }, + { + "epoch": 1.39, + "learning_rate": 9.093491279495082e-05, + "loss": 0.0075, + "step": 276260 + }, + { + "epoch": 1.39, + "learning_rate": 9.09273451019368e-05, + "loss": 0.0082, + "step": 276270 + }, + { + "epoch": 1.39, + "learning_rate": 9.09197774089228e-05, + "loss": 0.008, + "step": 276280 + }, + { + "epoch": 1.39, + "learning_rate": 9.09122097159088e-05, + "loss": 0.0081, + "step": 276290 + }, + { + "epoch": 1.39, + "learning_rate": 9.090464202289478e-05, + "loss": 0.0065, + "step": 276300 + }, + { + "epoch": 1.39, + "learning_rate": 9.089707432988077e-05, + "loss": 0.0072, + "step": 276310 + }, + { + "epoch": 1.39, + "learning_rate": 9.088950663686675e-05, + "loss": 0.0103, + "step": 276320 + }, + { + "epoch": 1.39, + "learning_rate": 9.088193894385275e-05, + "loss": 0.0092, + "step": 276330 + }, + { + "epoch": 1.39, + "learning_rate": 9.087437125083874e-05, + "loss": 0.0075, + "step": 276340 + }, + { + "epoch": 1.39, + "learning_rate": 9.086680355782473e-05, + "loss": 0.0072, + "step": 276350 + }, + { + "epoch": 1.39, + "learning_rate": 9.085923586481072e-05, + "loss": 0.0077, + "step": 276360 + }, + { + "epoch": 1.39, + "learning_rate": 9.085166817179672e-05, + "loss": 0.0074, + "step": 276370 + }, + { + "epoch": 1.39, + "learning_rate": 9.08441004787827e-05, + "loss": 0.0067, + "step": 276380 + }, + { + "epoch": 1.39, + "learning_rate": 9.083653278576869e-05, + "loss": 0.0082, + "step": 276390 + }, + { + "epoch": 1.39, + "learning_rate": 9.082896509275467e-05, + "loss": 0.008, + "step": 276400 + }, + { + "epoch": 1.39, + "learning_rate": 9.082139739974067e-05, + "loss": 0.0094, + "step": 276410 + }, + { + "epoch": 1.39, + "learning_rate": 9.081382970672666e-05, + "loss": 0.0074, + "step": 276420 + }, + { + "epoch": 1.39, + "learning_rate": 9.080626201371264e-05, + "loss": 0.007, + "step": 276430 + }, + { + "epoch": 1.39, + "learning_rate": 9.079869432069864e-05, + "loss": 0.009, + "step": 276440 + }, + { + "epoch": 1.39, + "learning_rate": 9.079112662768463e-05, + "loss": 0.0074, + "step": 276450 + }, + { + "epoch": 1.39, + "learning_rate": 9.078355893467062e-05, + "loss": 0.0067, + "step": 276460 + }, + { + "epoch": 1.39, + "learning_rate": 9.077599124165661e-05, + "loss": 0.0085, + "step": 276470 + }, + { + "epoch": 1.39, + "learning_rate": 9.07684235486426e-05, + "loss": 0.0057, + "step": 276480 + }, + { + "epoch": 1.39, + "learning_rate": 9.076085585562859e-05, + "loss": 0.0088, + "step": 276490 + }, + { + "epoch": 1.39, + "learning_rate": 9.075328816261458e-05, + "loss": 0.0063, + "step": 276500 + }, + { + "epoch": 1.4, + "learning_rate": 9.074572046960056e-05, + "loss": 0.0112, + "step": 276510 + }, + { + "epoch": 1.4, + "learning_rate": 9.073815277658656e-05, + "loss": 0.0102, + "step": 276520 + }, + { + "epoch": 1.4, + "learning_rate": 9.073058508357255e-05, + "loss": 0.0064, + "step": 276530 + }, + { + "epoch": 1.4, + "learning_rate": 9.072301739055854e-05, + "loss": 0.0093, + "step": 276540 + }, + { + "epoch": 1.4, + "learning_rate": 9.071544969754453e-05, + "loss": 0.0077, + "step": 276550 + }, + { + "epoch": 1.4, + "learning_rate": 9.070788200453053e-05, + "loss": 0.0068, + "step": 276560 + }, + { + "epoch": 1.4, + "learning_rate": 9.07003143115165e-05, + "loss": 0.0073, + "step": 276570 + }, + { + "epoch": 1.4, + "learning_rate": 9.06927466185025e-05, + "loss": 0.0084, + "step": 276580 + }, + { + "epoch": 1.4, + "learning_rate": 9.068517892548848e-05, + "loss": 0.006, + "step": 276590 + }, + { + "epoch": 1.4, + "learning_rate": 9.067761123247448e-05, + "loss": 0.0082, + "step": 276600 + }, + { + "epoch": 1.4, + "learning_rate": 9.067004353946047e-05, + "loss": 0.0066, + "step": 276610 + }, + { + "epoch": 1.4, + "learning_rate": 9.066247584644645e-05, + "loss": 0.0082, + "step": 276620 + }, + { + "epoch": 1.4, + "learning_rate": 9.065490815343245e-05, + "loss": 0.0056, + "step": 276630 + }, + { + "epoch": 1.4, + "learning_rate": 9.064734046041844e-05, + "loss": 0.0073, + "step": 276640 + }, + { + "epoch": 1.4, + "learning_rate": 9.063977276740443e-05, + "loss": 0.0062, + "step": 276650 + }, + { + "epoch": 1.4, + "learning_rate": 9.063220507439042e-05, + "loss": 0.0068, + "step": 276660 + }, + { + "epoch": 1.4, + "learning_rate": 9.06246373813764e-05, + "loss": 0.0082, + "step": 276670 + }, + { + "epoch": 1.4, + "learning_rate": 9.06170696883624e-05, + "loss": 0.0087, + "step": 276680 + }, + { + "epoch": 1.4, + "learning_rate": 9.060950199534839e-05, + "loss": 0.0092, + "step": 276690 + }, + { + "epoch": 1.4, + "learning_rate": 9.060193430233437e-05, + "loss": 0.0095, + "step": 276700 + }, + { + "epoch": 1.4, + "learning_rate": 9.059436660932037e-05, + "loss": 0.0076, + "step": 276710 + }, + { + "epoch": 1.4, + "learning_rate": 9.058679891630636e-05, + "loss": 0.0083, + "step": 276720 + }, + { + "epoch": 1.4, + "learning_rate": 9.057923122329235e-05, + "loss": 0.0076, + "step": 276730 + }, + { + "epoch": 1.4, + "learning_rate": 9.057166353027834e-05, + "loss": 0.0095, + "step": 276740 + }, + { + "epoch": 1.4, + "learning_rate": 9.056409583726432e-05, + "loss": 0.0075, + "step": 276750 + }, + { + "epoch": 1.4, + "learning_rate": 9.055652814425032e-05, + "loss": 0.009, + "step": 276760 + }, + { + "epoch": 1.4, + "learning_rate": 9.054896045123631e-05, + "loss": 0.009, + "step": 276770 + }, + { + "epoch": 1.4, + "learning_rate": 9.054139275822229e-05, + "loss": 0.0081, + "step": 276780 + }, + { + "epoch": 1.4, + "learning_rate": 9.053382506520829e-05, + "loss": 0.0057, + "step": 276790 + }, + { + "epoch": 1.4, + "learning_rate": 9.052625737219428e-05, + "loss": 0.0069, + "step": 276800 + }, + { + "epoch": 1.4, + "learning_rate": 9.051868967918026e-05, + "loss": 0.008, + "step": 276810 + }, + { + "epoch": 1.4, + "learning_rate": 9.051112198616626e-05, + "loss": 0.0081, + "step": 276820 + }, + { + "epoch": 1.4, + "learning_rate": 9.050355429315223e-05, + "loss": 0.0084, + "step": 276830 + }, + { + "epoch": 1.4, + "learning_rate": 9.049598660013822e-05, + "loss": 0.0085, + "step": 276840 + }, + { + "epoch": 1.4, + "learning_rate": 9.04884189071242e-05, + "loss": 0.0064, + "step": 276850 + }, + { + "epoch": 1.4, + "learning_rate": 9.04808512141102e-05, + "loss": 0.0084, + "step": 276860 + }, + { + "epoch": 1.4, + "learning_rate": 9.04732835210962e-05, + "loss": 0.0075, + "step": 276870 + }, + { + "epoch": 1.4, + "learning_rate": 9.046571582808218e-05, + "loss": 0.0063, + "step": 276880 + }, + { + "epoch": 1.4, + "learning_rate": 9.045814813506817e-05, + "loss": 0.0092, + "step": 276890 + }, + { + "epoch": 1.4, + "learning_rate": 9.045058044205417e-05, + "loss": 0.0066, + "step": 276900 + }, + { + "epoch": 1.4, + "learning_rate": 9.044301274904015e-05, + "loss": 0.0101, + "step": 276910 + }, + { + "epoch": 1.4, + "learning_rate": 9.043544505602614e-05, + "loss": 0.0095, + "step": 276920 + }, + { + "epoch": 1.4, + "learning_rate": 9.042787736301214e-05, + "loss": 0.0066, + "step": 276930 + }, + { + "epoch": 1.4, + "learning_rate": 9.042030966999812e-05, + "loss": 0.0063, + "step": 276940 + }, + { + "epoch": 1.4, + "learning_rate": 9.041274197698411e-05, + "loss": 0.0063, + "step": 276950 + }, + { + "epoch": 1.4, + "learning_rate": 9.04051742839701e-05, + "loss": 0.0074, + "step": 276960 + }, + { + "epoch": 1.4, + "learning_rate": 9.039760659095609e-05, + "loss": 0.0064, + "step": 276970 + }, + { + "epoch": 1.4, + "learning_rate": 9.039003889794208e-05, + "loss": 0.0076, + "step": 276980 + }, + { + "epoch": 1.4, + "learning_rate": 9.038247120492807e-05, + "loss": 0.0109, + "step": 276990 + }, + { + "epoch": 1.4, + "learning_rate": 9.037490351191406e-05, + "loss": 0.008, + "step": 277000 + }, + { + "epoch": 1.4, + "eval_cer": 0.9144246472852683, + "eval_loss": 0.0058305272832512856, + "eval_runtime": 115.9259, + "eval_samples_per_second": 17.252, + "eval_steps_per_second": 4.313, + "step": 277000 + }, + { + "epoch": 1.4, + "learning_rate": 9.036733581890006e-05, + "loss": 0.0067, + "step": 277010 + }, + { + "epoch": 1.4, + "learning_rate": 9.035976812588604e-05, + "loss": 0.0072, + "step": 277020 + }, + { + "epoch": 1.4, + "learning_rate": 9.035220043287203e-05, + "loss": 0.0073, + "step": 277030 + }, + { + "epoch": 1.4, + "learning_rate": 9.034463273985801e-05, + "loss": 0.0185, + "step": 277040 + }, + { + "epoch": 1.4, + "learning_rate": 9.033706504684401e-05, + "loss": 0.0088, + "step": 277050 + }, + { + "epoch": 1.4, + "learning_rate": 9.032949735383e-05, + "loss": 0.0105, + "step": 277060 + }, + { + "epoch": 1.4, + "learning_rate": 9.032192966081599e-05, + "loss": 0.0067, + "step": 277070 + }, + { + "epoch": 1.4, + "learning_rate": 9.031436196780198e-05, + "loss": 0.0099, + "step": 277080 + }, + { + "epoch": 1.4, + "learning_rate": 9.030679427478798e-05, + "loss": 0.0111, + "step": 277090 + }, + { + "epoch": 1.4, + "learning_rate": 9.029922658177396e-05, + "loss": 0.0069, + "step": 277100 + }, + { + "epoch": 1.4, + "learning_rate": 9.029165888875995e-05, + "loss": 0.0076, + "step": 277110 + }, + { + "epoch": 1.4, + "learning_rate": 9.028409119574593e-05, + "loss": 0.0072, + "step": 277120 + }, + { + "epoch": 1.4, + "learning_rate": 9.027652350273193e-05, + "loss": 0.0106, + "step": 277130 + }, + { + "epoch": 1.4, + "learning_rate": 9.026895580971792e-05, + "loss": 0.0064, + "step": 277140 + }, + { + "epoch": 1.4, + "learning_rate": 9.02613881167039e-05, + "loss": 0.0084, + "step": 277150 + }, + { + "epoch": 1.4, + "learning_rate": 9.02538204236899e-05, + "loss": 0.0092, + "step": 277160 + }, + { + "epoch": 1.4, + "learning_rate": 9.02462527306759e-05, + "loss": 0.0072, + "step": 277170 + }, + { + "epoch": 1.4, + "learning_rate": 9.023868503766188e-05, + "loss": 0.0079, + "step": 277180 + }, + { + "epoch": 1.4, + "learning_rate": 9.023111734464787e-05, + "loss": 0.0056, + "step": 277190 + }, + { + "epoch": 1.4, + "learning_rate": 9.022354965163385e-05, + "loss": 0.0073, + "step": 277200 + }, + { + "epoch": 1.4, + "learning_rate": 9.021598195861985e-05, + "loss": 0.0073, + "step": 277210 + }, + { + "epoch": 1.4, + "learning_rate": 9.020841426560584e-05, + "loss": 0.0074, + "step": 277220 + }, + { + "epoch": 1.4, + "learning_rate": 9.020084657259182e-05, + "loss": 0.0068, + "step": 277230 + }, + { + "epoch": 1.4, + "learning_rate": 9.019327887957782e-05, + "loss": 0.0076, + "step": 277240 + }, + { + "epoch": 1.4, + "learning_rate": 9.018571118656381e-05, + "loss": 0.0081, + "step": 277250 + }, + { + "epoch": 1.4, + "learning_rate": 9.01781434935498e-05, + "loss": 0.0079, + "step": 277260 + }, + { + "epoch": 1.4, + "learning_rate": 9.017057580053579e-05, + "loss": 0.0062, + "step": 277270 + }, + { + "epoch": 1.4, + "learning_rate": 9.016300810752177e-05, + "loss": 0.0101, + "step": 277280 + }, + { + "epoch": 1.4, + "learning_rate": 9.015544041450777e-05, + "loss": 0.0067, + "step": 277290 + }, + { + "epoch": 1.4, + "learning_rate": 9.014787272149376e-05, + "loss": 0.0109, + "step": 277300 + }, + { + "epoch": 1.4, + "learning_rate": 9.014030502847974e-05, + "loss": 0.008, + "step": 277310 + }, + { + "epoch": 1.4, + "learning_rate": 9.013273733546574e-05, + "loss": 0.008, + "step": 277320 + }, + { + "epoch": 1.4, + "learning_rate": 9.012516964245173e-05, + "loss": 0.0079, + "step": 277330 + }, + { + "epoch": 1.4, + "learning_rate": 9.011760194943771e-05, + "loss": 0.0073, + "step": 277340 + }, + { + "epoch": 1.4, + "learning_rate": 9.011003425642371e-05, + "loss": 0.0077, + "step": 277350 + }, + { + "epoch": 1.4, + "learning_rate": 9.010246656340969e-05, + "loss": 0.0074, + "step": 277360 + }, + { + "epoch": 1.4, + "learning_rate": 9.009489887039569e-05, + "loss": 0.0094, + "step": 277370 + }, + { + "epoch": 1.4, + "learning_rate": 9.008733117738168e-05, + "loss": 0.0087, + "step": 277380 + }, + { + "epoch": 1.4, + "learning_rate": 9.007976348436766e-05, + "loss": 0.0059, + "step": 277390 + }, + { + "epoch": 1.4, + "learning_rate": 9.007219579135366e-05, + "loss": 0.0082, + "step": 277400 + }, + { + "epoch": 1.4, + "learning_rate": 9.006462809833965e-05, + "loss": 0.0079, + "step": 277410 + }, + { + "epoch": 1.4, + "learning_rate": 9.005706040532563e-05, + "loss": 0.0069, + "step": 277420 + }, + { + "epoch": 1.4, + "learning_rate": 9.004949271231163e-05, + "loss": 0.0078, + "step": 277430 + }, + { + "epoch": 1.4, + "learning_rate": 9.004192501929761e-05, + "loss": 0.0102, + "step": 277440 + }, + { + "epoch": 1.4, + "learning_rate": 9.00343573262836e-05, + "loss": 0.0081, + "step": 277450 + }, + { + "epoch": 1.4, + "learning_rate": 9.002678963326959e-05, + "loss": 0.0075, + "step": 277460 + }, + { + "epoch": 1.4, + "learning_rate": 9.001922194025557e-05, + "loss": 0.0065, + "step": 277470 + }, + { + "epoch": 1.4, + "learning_rate": 9.001165424724156e-05, + "loss": 0.0087, + "step": 277480 + }, + { + "epoch": 1.4, + "learning_rate": 9.000408655422754e-05, + "loss": 0.008, + "step": 277490 + }, + { + "epoch": 1.4, + "learning_rate": 8.999651886121354e-05, + "loss": 0.0082, + "step": 277500 + }, + { + "epoch": 1.4, + "learning_rate": 8.998895116819953e-05, + "loss": 0.0089, + "step": 277510 + }, + { + "epoch": 1.4, + "learning_rate": 8.998138347518552e-05, + "loss": 0.0079, + "step": 277520 + }, + { + "epoch": 1.4, + "learning_rate": 8.997381578217151e-05, + "loss": 0.0101, + "step": 277530 + }, + { + "epoch": 1.4, + "learning_rate": 8.99662480891575e-05, + "loss": 0.0087, + "step": 277540 + }, + { + "epoch": 1.4, + "learning_rate": 8.995868039614349e-05, + "loss": 0.0067, + "step": 277550 + }, + { + "epoch": 1.4, + "learning_rate": 8.995111270312948e-05, + "loss": 0.009, + "step": 277560 + }, + { + "epoch": 1.4, + "learning_rate": 8.994354501011546e-05, + "loss": 0.0071, + "step": 277570 + }, + { + "epoch": 1.4, + "learning_rate": 8.993597731710146e-05, + "loss": 0.0085, + "step": 277580 + }, + { + "epoch": 1.4, + "learning_rate": 8.992840962408745e-05, + "loss": 0.0066, + "step": 277590 + }, + { + "epoch": 1.4, + "learning_rate": 8.992084193107344e-05, + "loss": 0.0073, + "step": 277600 + }, + { + "epoch": 1.4, + "learning_rate": 8.991327423805943e-05, + "loss": 0.0068, + "step": 277610 + }, + { + "epoch": 1.4, + "learning_rate": 8.990570654504543e-05, + "loss": 0.0081, + "step": 277620 + }, + { + "epoch": 1.4, + "learning_rate": 8.989813885203141e-05, + "loss": 0.0061, + "step": 277630 + }, + { + "epoch": 1.4, + "learning_rate": 8.98905711590174e-05, + "loss": 0.0068, + "step": 277640 + }, + { + "epoch": 1.4, + "learning_rate": 8.988300346600338e-05, + "loss": 0.0055, + "step": 277650 + }, + { + "epoch": 1.4, + "learning_rate": 8.987543577298938e-05, + "loss": 0.0089, + "step": 277660 + }, + { + "epoch": 1.4, + "learning_rate": 8.986786807997537e-05, + "loss": 0.007, + "step": 277670 + }, + { + "epoch": 1.4, + "learning_rate": 8.986030038696135e-05, + "loss": 0.0072, + "step": 277680 + }, + { + "epoch": 1.4, + "learning_rate": 8.985273269394735e-05, + "loss": 0.0063, + "step": 277690 + }, + { + "epoch": 1.4, + "learning_rate": 8.984516500093334e-05, + "loss": 0.0089, + "step": 277700 + }, + { + "epoch": 1.4, + "learning_rate": 8.983759730791933e-05, + "loss": 0.0078, + "step": 277710 + }, + { + "epoch": 1.4, + "learning_rate": 8.983002961490532e-05, + "loss": 0.0084, + "step": 277720 + }, + { + "epoch": 1.4, + "learning_rate": 8.98224619218913e-05, + "loss": 0.0073, + "step": 277730 + }, + { + "epoch": 1.4, + "learning_rate": 8.98148942288773e-05, + "loss": 0.0081, + "step": 277740 + }, + { + "epoch": 1.4, + "learning_rate": 8.980732653586329e-05, + "loss": 0.0077, + "step": 277750 + }, + { + "epoch": 1.4, + "learning_rate": 8.979975884284927e-05, + "loss": 0.0083, + "step": 277760 + }, + { + "epoch": 1.4, + "learning_rate": 8.979219114983527e-05, + "loss": 0.0084, + "step": 277770 + }, + { + "epoch": 1.4, + "learning_rate": 8.978462345682126e-05, + "loss": 0.0089, + "step": 277780 + }, + { + "epoch": 1.4, + "learning_rate": 8.977705576380725e-05, + "loss": 0.0069, + "step": 277790 + }, + { + "epoch": 1.4, + "learning_rate": 8.976948807079324e-05, + "loss": 0.0067, + "step": 277800 + }, + { + "epoch": 1.4, + "learning_rate": 8.976192037777922e-05, + "loss": 0.0079, + "step": 277810 + }, + { + "epoch": 1.4, + "learning_rate": 8.975435268476522e-05, + "loss": 0.0098, + "step": 277820 + }, + { + "epoch": 1.4, + "learning_rate": 8.974678499175121e-05, + "loss": 0.0071, + "step": 277830 + }, + { + "epoch": 1.4, + "learning_rate": 8.97392172987372e-05, + "loss": 0.0104, + "step": 277840 + }, + { + "epoch": 1.4, + "learning_rate": 8.973164960572319e-05, + "loss": 0.0064, + "step": 277850 + }, + { + "epoch": 1.4, + "learning_rate": 8.972408191270918e-05, + "loss": 0.007, + "step": 277860 + }, + { + "epoch": 1.4, + "learning_rate": 8.971651421969516e-05, + "loss": 0.0072, + "step": 277870 + }, + { + "epoch": 1.4, + "learning_rate": 8.970894652668116e-05, + "loss": 0.0095, + "step": 277880 + }, + { + "epoch": 1.4, + "learning_rate": 8.970137883366714e-05, + "loss": 0.0055, + "step": 277890 + }, + { + "epoch": 1.4, + "learning_rate": 8.969381114065314e-05, + "loss": 0.0072, + "step": 277900 + }, + { + "epoch": 1.4, + "learning_rate": 8.968624344763913e-05, + "loss": 0.007, + "step": 277910 + }, + { + "epoch": 1.4, + "learning_rate": 8.967867575462511e-05, + "loss": 0.0077, + "step": 277920 + }, + { + "epoch": 1.4, + "learning_rate": 8.967110806161111e-05, + "loss": 0.008, + "step": 277930 + }, + { + "epoch": 1.4, + "learning_rate": 8.96635403685971e-05, + "loss": 0.0076, + "step": 277940 + }, + { + "epoch": 1.4, + "learning_rate": 8.965597267558308e-05, + "loss": 0.0095, + "step": 277950 + }, + { + "epoch": 1.4, + "learning_rate": 8.964840498256908e-05, + "loss": 0.0068, + "step": 277960 + }, + { + "epoch": 1.4, + "learning_rate": 8.964083728955507e-05, + "loss": 0.007, + "step": 277970 + }, + { + "epoch": 1.4, + "learning_rate": 8.963326959654106e-05, + "loss": 0.0061, + "step": 277980 + }, + { + "epoch": 1.4, + "learning_rate": 8.962570190352705e-05, + "loss": 0.0084, + "step": 277990 + }, + { + "epoch": 1.4, + "learning_rate": 8.961813421051303e-05, + "loss": 0.0072, + "step": 278000 + }, + { + "epoch": 1.4, + "eval_cer": 0.9144246472852683, + "eval_loss": 0.0060167377814650536, + "eval_runtime": 116.7043, + "eval_samples_per_second": 17.137, + "eval_steps_per_second": 4.284, + "step": 278000 + }, + { + "epoch": 1.4, + "learning_rate": 8.961056651749903e-05, + "loss": 0.0077, + "step": 278010 + }, + { + "epoch": 1.4, + "learning_rate": 8.960299882448502e-05, + "loss": 0.0077, + "step": 278020 + }, + { + "epoch": 1.4, + "learning_rate": 8.9595431131471e-05, + "loss": 0.0079, + "step": 278030 + }, + { + "epoch": 1.4, + "learning_rate": 8.9587863438457e-05, + "loss": 0.0053, + "step": 278040 + }, + { + "epoch": 1.4, + "learning_rate": 8.9580295745443e-05, + "loss": 0.0078, + "step": 278050 + }, + { + "epoch": 1.4, + "learning_rate": 8.957272805242897e-05, + "loss": 0.0081, + "step": 278060 + }, + { + "epoch": 1.4, + "learning_rate": 8.956516035941497e-05, + "loss": 0.0333, + "step": 278070 + }, + { + "epoch": 1.4, + "learning_rate": 8.955759266640095e-05, + "loss": 0.0085, + "step": 278080 + }, + { + "epoch": 1.4, + "learning_rate": 8.955002497338693e-05, + "loss": 0.0099, + "step": 278090 + }, + { + "epoch": 1.4, + "learning_rate": 8.954245728037291e-05, + "loss": 0.0075, + "step": 278100 + }, + { + "epoch": 1.4, + "learning_rate": 8.953488958735891e-05, + "loss": 0.0079, + "step": 278110 + }, + { + "epoch": 1.4, + "learning_rate": 8.95273218943449e-05, + "loss": 0.006, + "step": 278120 + }, + { + "epoch": 1.4, + "learning_rate": 8.951975420133089e-05, + "loss": 0.0086, + "step": 278130 + }, + { + "epoch": 1.4, + "learning_rate": 8.951218650831688e-05, + "loss": 0.0102, + "step": 278140 + }, + { + "epoch": 1.4, + "learning_rate": 8.950461881530288e-05, + "loss": 0.0066, + "step": 278150 + }, + { + "epoch": 1.4, + "learning_rate": 8.949705112228886e-05, + "loss": 0.0067, + "step": 278160 + }, + { + "epoch": 1.4, + "learning_rate": 8.948948342927485e-05, + "loss": 0.0073, + "step": 278170 + }, + { + "epoch": 1.4, + "learning_rate": 8.948191573626083e-05, + "loss": 0.0079, + "step": 278180 + }, + { + "epoch": 1.4, + "learning_rate": 8.947434804324683e-05, + "loss": 0.0069, + "step": 278190 + }, + { + "epoch": 1.4, + "learning_rate": 8.946678035023282e-05, + "loss": 0.0076, + "step": 278200 + }, + { + "epoch": 1.4, + "learning_rate": 8.94592126572188e-05, + "loss": 0.0058, + "step": 278210 + }, + { + "epoch": 1.4, + "learning_rate": 8.94516449642048e-05, + "loss": 0.0093, + "step": 278220 + }, + { + "epoch": 1.4, + "learning_rate": 8.94440772711908e-05, + "loss": 0.0097, + "step": 278230 + }, + { + "epoch": 1.4, + "learning_rate": 8.943650957817678e-05, + "loss": 0.0078, + "step": 278240 + }, + { + "epoch": 1.4, + "learning_rate": 8.942894188516277e-05, + "loss": 0.0091, + "step": 278250 + }, + { + "epoch": 1.4, + "learning_rate": 8.942137419214875e-05, + "loss": 0.009, + "step": 278260 + }, + { + "epoch": 1.4, + "learning_rate": 8.941380649913475e-05, + "loss": 0.0104, + "step": 278270 + }, + { + "epoch": 1.4, + "learning_rate": 8.940623880612074e-05, + "loss": 0.0088, + "step": 278280 + }, + { + "epoch": 1.4, + "learning_rate": 8.939867111310672e-05, + "loss": 0.0088, + "step": 278290 + }, + { + "epoch": 1.4, + "learning_rate": 8.939110342009272e-05, + "loss": 0.0064, + "step": 278300 + }, + { + "epoch": 1.4, + "learning_rate": 8.938353572707871e-05, + "loss": 0.0117, + "step": 278310 + }, + { + "epoch": 1.4, + "learning_rate": 8.93759680340647e-05, + "loss": 0.0091, + "step": 278320 + }, + { + "epoch": 1.4, + "learning_rate": 8.936840034105069e-05, + "loss": 0.0065, + "step": 278330 + }, + { + "epoch": 1.4, + "learning_rate": 8.936083264803667e-05, + "loss": 0.0086, + "step": 278340 + }, + { + "epoch": 1.4, + "learning_rate": 8.935326495502267e-05, + "loss": 0.01, + "step": 278350 + }, + { + "epoch": 1.4, + "learning_rate": 8.934569726200866e-05, + "loss": 0.0098, + "step": 278360 + }, + { + "epoch": 1.4, + "learning_rate": 8.933812956899464e-05, + "loss": 0.0073, + "step": 278370 + }, + { + "epoch": 1.4, + "learning_rate": 8.933056187598064e-05, + "loss": 0.0072, + "step": 278380 + }, + { + "epoch": 1.4, + "learning_rate": 8.932299418296663e-05, + "loss": 0.009, + "step": 278390 + }, + { + "epoch": 1.4, + "learning_rate": 8.931542648995261e-05, + "loss": 0.0078, + "step": 278400 + }, + { + "epoch": 1.4, + "learning_rate": 8.930785879693861e-05, + "loss": 0.0084, + "step": 278410 + }, + { + "epoch": 1.4, + "learning_rate": 8.93002911039246e-05, + "loss": 0.0071, + "step": 278420 + }, + { + "epoch": 1.4, + "learning_rate": 8.929272341091059e-05, + "loss": 0.0102, + "step": 278430 + }, + { + "epoch": 1.4, + "learning_rate": 8.928515571789658e-05, + "loss": 0.0086, + "step": 278440 + }, + { + "epoch": 1.4, + "learning_rate": 8.927758802488256e-05, + "loss": 0.0069, + "step": 278450 + }, + { + "epoch": 1.4, + "learning_rate": 8.927002033186856e-05, + "loss": 0.0084, + "step": 278460 + }, + { + "epoch": 1.4, + "learning_rate": 8.926245263885455e-05, + "loss": 0.007, + "step": 278470 + }, + { + "epoch": 1.4, + "learning_rate": 8.925488494584053e-05, + "loss": 0.0083, + "step": 278480 + }, + { + "epoch": 1.41, + "learning_rate": 8.924731725282653e-05, + "loss": 0.0057, + "step": 278490 + }, + { + "epoch": 1.41, + "learning_rate": 8.923974955981252e-05, + "loss": 0.0076, + "step": 278500 + }, + { + "epoch": 1.41, + "learning_rate": 8.92321818667985e-05, + "loss": 0.0075, + "step": 278510 + }, + { + "epoch": 1.41, + "learning_rate": 8.92246141737845e-05, + "loss": 0.0074, + "step": 278520 + }, + { + "epoch": 1.41, + "learning_rate": 8.921704648077048e-05, + "loss": 0.0076, + "step": 278530 + }, + { + "epoch": 1.41, + "learning_rate": 8.920947878775648e-05, + "loss": 0.0058, + "step": 278540 + }, + { + "epoch": 1.41, + "learning_rate": 8.920191109474247e-05, + "loss": 0.0066, + "step": 278550 + }, + { + "epoch": 1.41, + "learning_rate": 8.919434340172845e-05, + "loss": 0.0095, + "step": 278560 + }, + { + "epoch": 1.41, + "learning_rate": 8.918677570871445e-05, + "loss": 0.006, + "step": 278570 + }, + { + "epoch": 1.41, + "learning_rate": 8.917920801570044e-05, + "loss": 0.0083, + "step": 278580 + }, + { + "epoch": 1.41, + "learning_rate": 8.917164032268643e-05, + "loss": 0.0092, + "step": 278590 + }, + { + "epoch": 1.41, + "learning_rate": 8.916407262967242e-05, + "loss": 0.0093, + "step": 278600 + }, + { + "epoch": 1.41, + "learning_rate": 8.91565049366584e-05, + "loss": 0.0077, + "step": 278610 + }, + { + "epoch": 1.41, + "learning_rate": 8.91489372436444e-05, + "loss": 0.0076, + "step": 278620 + }, + { + "epoch": 1.41, + "learning_rate": 8.914136955063039e-05, + "loss": 0.0093, + "step": 278630 + }, + { + "epoch": 1.41, + "learning_rate": 8.913380185761637e-05, + "loss": 0.0081, + "step": 278640 + }, + { + "epoch": 1.41, + "learning_rate": 8.912623416460237e-05, + "loss": 0.0067, + "step": 278650 + }, + { + "epoch": 1.41, + "learning_rate": 8.911866647158836e-05, + "loss": 0.0076, + "step": 278660 + }, + { + "epoch": 1.41, + "learning_rate": 8.911109877857434e-05, + "loss": 0.0068, + "step": 278670 + }, + { + "epoch": 1.41, + "learning_rate": 8.910353108556034e-05, + "loss": 0.0163, + "step": 278680 + }, + { + "epoch": 1.41, + "learning_rate": 8.909596339254632e-05, + "loss": 0.0074, + "step": 278690 + }, + { + "epoch": 1.41, + "learning_rate": 8.908839569953232e-05, + "loss": 0.0058, + "step": 278700 + }, + { + "epoch": 1.41, + "learning_rate": 8.908082800651831e-05, + "loss": 0.0087, + "step": 278710 + }, + { + "epoch": 1.41, + "learning_rate": 8.907326031350428e-05, + "loss": 0.0092, + "step": 278720 + }, + { + "epoch": 1.41, + "learning_rate": 8.906569262049027e-05, + "loss": 0.006, + "step": 278730 + }, + { + "epoch": 1.41, + "learning_rate": 8.905812492747626e-05, + "loss": 0.0092, + "step": 278740 + }, + { + "epoch": 1.41, + "learning_rate": 8.905055723446225e-05, + "loss": 0.0081, + "step": 278750 + }, + { + "epoch": 1.41, + "learning_rate": 8.904298954144825e-05, + "loss": 0.0115, + "step": 278760 + }, + { + "epoch": 1.41, + "learning_rate": 8.903542184843423e-05, + "loss": 0.0111, + "step": 278770 + }, + { + "epoch": 1.41, + "learning_rate": 8.902785415542022e-05, + "loss": 0.0076, + "step": 278780 + }, + { + "epoch": 1.41, + "learning_rate": 8.90202864624062e-05, + "loss": 0.0093, + "step": 278790 + }, + { + "epoch": 1.41, + "learning_rate": 8.90127187693922e-05, + "loss": 0.0068, + "step": 278800 + }, + { + "epoch": 1.41, + "learning_rate": 8.900515107637819e-05, + "loss": 0.0084, + "step": 278810 + }, + { + "epoch": 1.41, + "learning_rate": 8.899758338336417e-05, + "loss": 0.009, + "step": 278820 + }, + { + "epoch": 1.41, + "learning_rate": 8.899001569035017e-05, + "loss": 0.0107, + "step": 278830 + }, + { + "epoch": 1.41, + "learning_rate": 8.898244799733616e-05, + "loss": 0.0064, + "step": 278840 + }, + { + "epoch": 1.41, + "learning_rate": 8.897488030432215e-05, + "loss": 0.0068, + "step": 278850 + }, + { + "epoch": 1.41, + "learning_rate": 8.896731261130814e-05, + "loss": 0.0069, + "step": 278860 + }, + { + "epoch": 1.41, + "learning_rate": 8.895974491829414e-05, + "loss": 0.0059, + "step": 278870 + }, + { + "epoch": 1.41, + "learning_rate": 8.895217722528012e-05, + "loss": 0.0076, + "step": 278880 + }, + { + "epoch": 1.41, + "learning_rate": 8.894460953226611e-05, + "loss": 0.0083, + "step": 278890 + }, + { + "epoch": 1.41, + "learning_rate": 8.89370418392521e-05, + "loss": 0.0081, + "step": 278900 + }, + { + "epoch": 1.41, + "learning_rate": 8.892947414623809e-05, + "loss": 0.0057, + "step": 278910 + }, + { + "epoch": 1.41, + "learning_rate": 8.892190645322408e-05, + "loss": 0.0089, + "step": 278920 + }, + { + "epoch": 1.41, + "learning_rate": 8.891433876021007e-05, + "loss": 0.0064, + "step": 278930 + }, + { + "epoch": 1.41, + "learning_rate": 8.890677106719606e-05, + "loss": 0.0072, + "step": 278940 + }, + { + "epoch": 1.41, + "learning_rate": 8.889920337418206e-05, + "loss": 0.006, + "step": 278950 + }, + { + "epoch": 1.41, + "learning_rate": 8.889163568116804e-05, + "loss": 0.0081, + "step": 278960 + }, + { + "epoch": 1.41, + "learning_rate": 8.888406798815403e-05, + "loss": 0.0066, + "step": 278970 + }, + { + "epoch": 1.41, + "learning_rate": 8.887650029514001e-05, + "loss": 0.0074, + "step": 278980 + }, + { + "epoch": 1.41, + "learning_rate": 8.886893260212601e-05, + "loss": 0.0054, + "step": 278990 + }, + { + "epoch": 1.41, + "learning_rate": 8.8861364909112e-05, + "loss": 0.0108, + "step": 279000 + }, + { + "epoch": 1.41, + "eval_cer": 0.9144304696620207, + "eval_loss": 0.005943993106484413, + "eval_runtime": 116.6988, + "eval_samples_per_second": 17.138, + "eval_steps_per_second": 4.285, + "step": 279000 + }, + { + "epoch": 1.41, + "learning_rate": 8.885379721609798e-05, + "loss": 0.0093, + "step": 279010 + }, + { + "epoch": 1.41, + "learning_rate": 8.884622952308398e-05, + "loss": 0.0072, + "step": 279020 + }, + { + "epoch": 1.41, + "learning_rate": 8.883866183006997e-05, + "loss": 0.0059, + "step": 279030 + }, + { + "epoch": 1.41, + "learning_rate": 8.883109413705596e-05, + "loss": 0.0074, + "step": 279040 + }, + { + "epoch": 1.41, + "learning_rate": 8.882352644404195e-05, + "loss": 0.008, + "step": 279050 + }, + { + "epoch": 1.41, + "learning_rate": 8.881595875102793e-05, + "loss": 0.006, + "step": 279060 + }, + { + "epoch": 1.41, + "learning_rate": 8.880839105801393e-05, + "loss": 0.0079, + "step": 279070 + }, + { + "epoch": 1.41, + "learning_rate": 8.880082336499992e-05, + "loss": 0.0054, + "step": 279080 + }, + { + "epoch": 1.41, + "learning_rate": 8.87932556719859e-05, + "loss": 0.0101, + "step": 279090 + }, + { + "epoch": 1.41, + "learning_rate": 8.87856879789719e-05, + "loss": 0.0071, + "step": 279100 + }, + { + "epoch": 1.41, + "learning_rate": 8.87781202859579e-05, + "loss": 0.0065, + "step": 279110 + }, + { + "epoch": 1.41, + "learning_rate": 8.877055259294388e-05, + "loss": 0.0083, + "step": 279120 + }, + { + "epoch": 1.41, + "learning_rate": 8.876298489992987e-05, + "loss": 0.0102, + "step": 279130 + }, + { + "epoch": 1.41, + "learning_rate": 8.875541720691585e-05, + "loss": 0.0076, + "step": 279140 + }, + { + "epoch": 1.41, + "learning_rate": 8.874784951390185e-05, + "loss": 0.008, + "step": 279150 + }, + { + "epoch": 1.41, + "learning_rate": 8.874028182088784e-05, + "loss": 0.0103, + "step": 279160 + }, + { + "epoch": 1.41, + "learning_rate": 8.873271412787382e-05, + "loss": 0.0114, + "step": 279170 + }, + { + "epoch": 1.41, + "learning_rate": 8.872514643485982e-05, + "loss": 0.011, + "step": 279180 + }, + { + "epoch": 1.41, + "learning_rate": 8.871757874184581e-05, + "loss": 0.0088, + "step": 279190 + }, + { + "epoch": 1.41, + "learning_rate": 8.87100110488318e-05, + "loss": 0.0078, + "step": 279200 + }, + { + "epoch": 1.41, + "learning_rate": 8.870244335581779e-05, + "loss": 0.0108, + "step": 279210 + }, + { + "epoch": 1.41, + "learning_rate": 8.869487566280377e-05, + "loss": 0.01, + "step": 279220 + }, + { + "epoch": 1.41, + "learning_rate": 8.868730796978977e-05, + "loss": 0.0081, + "step": 279230 + }, + { + "epoch": 1.41, + "learning_rate": 8.867974027677576e-05, + "loss": 0.0081, + "step": 279240 + }, + { + "epoch": 1.41, + "learning_rate": 8.867217258376174e-05, + "loss": 0.0055, + "step": 279250 + }, + { + "epoch": 1.41, + "learning_rate": 8.866460489074774e-05, + "loss": 0.0071, + "step": 279260 + }, + { + "epoch": 1.41, + "learning_rate": 8.865703719773373e-05, + "loss": 0.0096, + "step": 279270 + }, + { + "epoch": 1.41, + "learning_rate": 8.864946950471971e-05, + "loss": 0.0088, + "step": 279280 + }, + { + "epoch": 1.41, + "learning_rate": 8.864190181170571e-05, + "loss": 0.0068, + "step": 279290 + }, + { + "epoch": 1.41, + "learning_rate": 8.863433411869169e-05, + "loss": 0.0068, + "step": 279300 + }, + { + "epoch": 1.41, + "learning_rate": 8.862676642567769e-05, + "loss": 0.0074, + "step": 279310 + }, + { + "epoch": 1.41, + "learning_rate": 8.861919873266368e-05, + "loss": 0.0099, + "step": 279320 + }, + { + "epoch": 1.41, + "learning_rate": 8.861163103964966e-05, + "loss": 0.0091, + "step": 279330 + }, + { + "epoch": 1.41, + "learning_rate": 8.860406334663566e-05, + "loss": 0.0082, + "step": 279340 + }, + { + "epoch": 1.41, + "learning_rate": 8.859649565362162e-05, + "loss": 0.0097, + "step": 279350 + }, + { + "epoch": 1.41, + "learning_rate": 8.858892796060762e-05, + "loss": 0.0079, + "step": 279360 + }, + { + "epoch": 1.41, + "learning_rate": 8.858136026759361e-05, + "loss": 0.0092, + "step": 279370 + }, + { + "epoch": 1.41, + "learning_rate": 8.85737925745796e-05, + "loss": 0.0101, + "step": 279380 + }, + { + "epoch": 1.41, + "learning_rate": 8.856622488156559e-05, + "loss": 0.0099, + "step": 279390 + }, + { + "epoch": 1.41, + "learning_rate": 8.855865718855159e-05, + "loss": 0.01, + "step": 279400 + }, + { + "epoch": 1.41, + "learning_rate": 8.855108949553757e-05, + "loss": 0.0079, + "step": 279410 + }, + { + "epoch": 1.41, + "learning_rate": 8.854352180252356e-05, + "loss": 0.0092, + "step": 279420 + }, + { + "epoch": 1.41, + "learning_rate": 8.853595410950954e-05, + "loss": 0.0098, + "step": 279430 + }, + { + "epoch": 1.41, + "learning_rate": 8.852838641649554e-05, + "loss": 0.0073, + "step": 279440 + }, + { + "epoch": 1.41, + "learning_rate": 8.852081872348153e-05, + "loss": 0.0056, + "step": 279450 + }, + { + "epoch": 1.41, + "learning_rate": 8.851325103046752e-05, + "loss": 0.0063, + "step": 279460 + }, + { + "epoch": 1.41, + "learning_rate": 8.850568333745351e-05, + "loss": 0.0073, + "step": 279470 + }, + { + "epoch": 1.41, + "learning_rate": 8.84981156444395e-05, + "loss": 0.0077, + "step": 279480 + }, + { + "epoch": 1.41, + "learning_rate": 8.849054795142549e-05, + "loss": 0.0109, + "step": 279490 + }, + { + "epoch": 1.41, + "learning_rate": 8.848298025841148e-05, + "loss": 0.0085, + "step": 279500 + }, + { + "epoch": 1.41, + "learning_rate": 8.847541256539746e-05, + "loss": 0.0091, + "step": 279510 + }, + { + "epoch": 1.41, + "learning_rate": 8.846784487238346e-05, + "loss": 0.0081, + "step": 279520 + }, + { + "epoch": 1.41, + "learning_rate": 8.846027717936945e-05, + "loss": 0.0068, + "step": 279530 + }, + { + "epoch": 1.41, + "learning_rate": 8.845270948635543e-05, + "loss": 0.0084, + "step": 279540 + }, + { + "epoch": 1.41, + "learning_rate": 8.844514179334143e-05, + "loss": 0.0085, + "step": 279550 + }, + { + "epoch": 1.41, + "learning_rate": 8.843757410032742e-05, + "loss": 0.0079, + "step": 279560 + }, + { + "epoch": 1.41, + "learning_rate": 8.84300064073134e-05, + "loss": 0.0079, + "step": 279570 + }, + { + "epoch": 1.41, + "learning_rate": 8.84224387142994e-05, + "loss": 0.0062, + "step": 279580 + }, + { + "epoch": 1.41, + "learning_rate": 8.841487102128538e-05, + "loss": 0.0073, + "step": 279590 + }, + { + "epoch": 1.41, + "learning_rate": 8.840730332827138e-05, + "loss": 0.006, + "step": 279600 + }, + { + "epoch": 1.41, + "learning_rate": 8.839973563525737e-05, + "loss": 0.0069, + "step": 279610 + }, + { + "epoch": 1.41, + "learning_rate": 8.839216794224335e-05, + "loss": 0.0088, + "step": 279620 + }, + { + "epoch": 1.41, + "learning_rate": 8.838460024922935e-05, + "loss": 0.0078, + "step": 279630 + }, + { + "epoch": 1.41, + "learning_rate": 8.837703255621534e-05, + "loss": 0.0078, + "step": 279640 + }, + { + "epoch": 1.41, + "learning_rate": 8.836946486320133e-05, + "loss": 0.0078, + "step": 279650 + }, + { + "epoch": 1.41, + "learning_rate": 8.836189717018732e-05, + "loss": 0.0093, + "step": 279660 + }, + { + "epoch": 1.41, + "learning_rate": 8.83543294771733e-05, + "loss": 0.0081, + "step": 279670 + }, + { + "epoch": 1.41, + "learning_rate": 8.83467617841593e-05, + "loss": 0.0066, + "step": 279680 + }, + { + "epoch": 1.41, + "learning_rate": 8.833919409114529e-05, + "loss": 0.0081, + "step": 279690 + }, + { + "epoch": 1.41, + "learning_rate": 8.833162639813127e-05, + "loss": 0.0074, + "step": 279700 + }, + { + "epoch": 1.41, + "learning_rate": 8.832405870511727e-05, + "loss": 0.0071, + "step": 279710 + }, + { + "epoch": 1.41, + "learning_rate": 8.831649101210326e-05, + "loss": 0.0065, + "step": 279720 + }, + { + "epoch": 1.41, + "learning_rate": 8.830892331908924e-05, + "loss": 0.0079, + "step": 279730 + }, + { + "epoch": 1.41, + "learning_rate": 8.830135562607524e-05, + "loss": 0.0097, + "step": 279740 + }, + { + "epoch": 1.41, + "learning_rate": 8.829378793306122e-05, + "loss": 0.0058, + "step": 279750 + }, + { + "epoch": 1.41, + "learning_rate": 8.828622024004722e-05, + "loss": 0.0074, + "step": 279760 + }, + { + "epoch": 1.41, + "learning_rate": 8.827865254703321e-05, + "loss": 0.0084, + "step": 279770 + }, + { + "epoch": 1.41, + "learning_rate": 8.827108485401919e-05, + "loss": 0.0069, + "step": 279780 + }, + { + "epoch": 1.41, + "learning_rate": 8.826351716100519e-05, + "loss": 0.0096, + "step": 279790 + }, + { + "epoch": 1.41, + "learning_rate": 8.825594946799118e-05, + "loss": 0.0073, + "step": 279800 + }, + { + "epoch": 1.41, + "learning_rate": 8.824838177497716e-05, + "loss": 0.007, + "step": 279810 + }, + { + "epoch": 1.41, + "learning_rate": 8.824081408196316e-05, + "loss": 0.0091, + "step": 279820 + }, + { + "epoch": 1.41, + "learning_rate": 8.823324638894914e-05, + "loss": 0.0073, + "step": 279830 + }, + { + "epoch": 1.41, + "learning_rate": 8.822567869593514e-05, + "loss": 0.008, + "step": 279840 + }, + { + "epoch": 1.41, + "learning_rate": 8.821811100292113e-05, + "loss": 0.0069, + "step": 279850 + }, + { + "epoch": 1.41, + "learning_rate": 8.821054330990711e-05, + "loss": 0.0103, + "step": 279860 + }, + { + "epoch": 1.41, + "learning_rate": 8.820297561689311e-05, + "loss": 0.0126, + "step": 279870 + }, + { + "epoch": 1.41, + "learning_rate": 8.81954079238791e-05, + "loss": 0.0068, + "step": 279880 + }, + { + "epoch": 1.41, + "learning_rate": 8.818784023086508e-05, + "loss": 0.0083, + "step": 279890 + }, + { + "epoch": 1.41, + "learning_rate": 8.818027253785108e-05, + "loss": 0.0071, + "step": 279900 + }, + { + "epoch": 1.41, + "learning_rate": 8.817270484483707e-05, + "loss": 0.0073, + "step": 279910 + }, + { + "epoch": 1.41, + "learning_rate": 8.816513715182305e-05, + "loss": 0.006, + "step": 279920 + }, + { + "epoch": 1.41, + "learning_rate": 8.815756945880905e-05, + "loss": 0.0077, + "step": 279930 + }, + { + "epoch": 1.41, + "learning_rate": 8.815000176579503e-05, + "loss": 0.009, + "step": 279940 + }, + { + "epoch": 1.41, + "learning_rate": 8.814243407278103e-05, + "loss": 0.0081, + "step": 279950 + }, + { + "epoch": 1.41, + "learning_rate": 8.813486637976702e-05, + "loss": 0.0089, + "step": 279960 + }, + { + "epoch": 1.41, + "learning_rate": 8.8127298686753e-05, + "loss": 0.0083, + "step": 279970 + }, + { + "epoch": 1.41, + "learning_rate": 8.811973099373898e-05, + "loss": 0.0079, + "step": 279980 + }, + { + "epoch": 1.41, + "learning_rate": 8.811216330072497e-05, + "loss": 0.0088, + "step": 279990 + }, + { + "epoch": 1.41, + "learning_rate": 8.810459560771096e-05, + "loss": 0.0067, + "step": 280000 + }, + { + "epoch": 1.41, + "eval_cer": 0.914423676889143, + "eval_loss": 0.005915849469602108, + "eval_runtime": 116.6786, + "eval_samples_per_second": 17.141, + "eval_steps_per_second": 4.285, + "step": 280000 + }, + { + "epoch": 1.41, + "learning_rate": 8.809702791469696e-05, + "loss": 0.0075, + "step": 280010 + }, + { + "epoch": 1.41, + "learning_rate": 8.808946022168294e-05, + "loss": 0.0087, + "step": 280020 + }, + { + "epoch": 1.41, + "learning_rate": 8.808189252866893e-05, + "loss": 0.0069, + "step": 280030 + }, + { + "epoch": 1.41, + "learning_rate": 8.807432483565491e-05, + "loss": 0.0081, + "step": 280040 + }, + { + "epoch": 1.41, + "learning_rate": 8.806675714264091e-05, + "loss": 0.0091, + "step": 280050 + }, + { + "epoch": 1.41, + "learning_rate": 8.80591894496269e-05, + "loss": 0.0067, + "step": 280060 + }, + { + "epoch": 1.41, + "learning_rate": 8.805162175661288e-05, + "loss": 0.0065, + "step": 280070 + }, + { + "epoch": 1.41, + "learning_rate": 8.804405406359888e-05, + "loss": 0.0092, + "step": 280080 + }, + { + "epoch": 1.41, + "learning_rate": 8.803648637058487e-05, + "loss": 0.0086, + "step": 280090 + }, + { + "epoch": 1.41, + "learning_rate": 8.802891867757086e-05, + "loss": 0.0066, + "step": 280100 + }, + { + "epoch": 1.41, + "learning_rate": 8.802135098455685e-05, + "loss": 0.0096, + "step": 280110 + }, + { + "epoch": 1.41, + "learning_rate": 8.801378329154283e-05, + "loss": 0.0122, + "step": 280120 + }, + { + "epoch": 1.41, + "learning_rate": 8.800621559852883e-05, + "loss": 0.0083, + "step": 280130 + }, + { + "epoch": 1.41, + "learning_rate": 8.799864790551482e-05, + "loss": 0.0074, + "step": 280140 + }, + { + "epoch": 1.41, + "learning_rate": 8.79910802125008e-05, + "loss": 0.0068, + "step": 280150 + }, + { + "epoch": 1.41, + "learning_rate": 8.79835125194868e-05, + "loss": 0.0067, + "step": 280160 + }, + { + "epoch": 1.41, + "learning_rate": 8.79759448264728e-05, + "loss": 0.007, + "step": 280170 + }, + { + "epoch": 1.41, + "learning_rate": 8.796837713345878e-05, + "loss": 0.0065, + "step": 280180 + }, + { + "epoch": 1.41, + "learning_rate": 8.796080944044477e-05, + "loss": 0.0076, + "step": 280190 + }, + { + "epoch": 1.41, + "learning_rate": 8.795324174743075e-05, + "loss": 0.0083, + "step": 280200 + }, + { + "epoch": 1.41, + "learning_rate": 8.794567405441675e-05, + "loss": 0.0071, + "step": 280210 + }, + { + "epoch": 1.41, + "learning_rate": 8.793810636140274e-05, + "loss": 0.0096, + "step": 280220 + }, + { + "epoch": 1.41, + "learning_rate": 8.793053866838872e-05, + "loss": 0.0086, + "step": 280230 + }, + { + "epoch": 1.41, + "learning_rate": 8.792297097537472e-05, + "loss": 0.0073, + "step": 280240 + }, + { + "epoch": 1.41, + "learning_rate": 8.791540328236071e-05, + "loss": 0.0096, + "step": 280250 + }, + { + "epoch": 1.41, + "learning_rate": 8.79078355893467e-05, + "loss": 0.0091, + "step": 280260 + }, + { + "epoch": 1.41, + "learning_rate": 8.790026789633269e-05, + "loss": 0.0068, + "step": 280270 + }, + { + "epoch": 1.41, + "learning_rate": 8.789270020331867e-05, + "loss": 0.0076, + "step": 280280 + }, + { + "epoch": 1.41, + "learning_rate": 8.788513251030467e-05, + "loss": 0.0065, + "step": 280290 + }, + { + "epoch": 1.41, + "learning_rate": 8.787756481729066e-05, + "loss": 0.0112, + "step": 280300 + }, + { + "epoch": 1.41, + "learning_rate": 8.786999712427664e-05, + "loss": 0.0057, + "step": 280310 + }, + { + "epoch": 1.41, + "learning_rate": 8.786242943126264e-05, + "loss": 0.0099, + "step": 280320 + }, + { + "epoch": 1.41, + "learning_rate": 8.785486173824863e-05, + "loss": 0.0113, + "step": 280330 + }, + { + "epoch": 1.41, + "learning_rate": 8.784729404523461e-05, + "loss": 0.0066, + "step": 280340 + }, + { + "epoch": 1.41, + "learning_rate": 8.783972635222061e-05, + "loss": 0.0084, + "step": 280350 + }, + { + "epoch": 1.41, + "learning_rate": 8.78321586592066e-05, + "loss": 0.0072, + "step": 280360 + }, + { + "epoch": 1.41, + "learning_rate": 8.782459096619259e-05, + "loss": 0.0094, + "step": 280370 + }, + { + "epoch": 1.41, + "learning_rate": 8.781702327317858e-05, + "loss": 0.008, + "step": 280380 + }, + { + "epoch": 1.41, + "learning_rate": 8.780945558016456e-05, + "loss": 0.0075, + "step": 280390 + }, + { + "epoch": 1.41, + "learning_rate": 8.780188788715056e-05, + "loss": 0.0078, + "step": 280400 + }, + { + "epoch": 1.41, + "learning_rate": 8.779432019413655e-05, + "loss": 0.0072, + "step": 280410 + }, + { + "epoch": 1.41, + "learning_rate": 8.778675250112253e-05, + "loss": 0.0064, + "step": 280420 + }, + { + "epoch": 1.41, + "learning_rate": 8.777918480810853e-05, + "loss": 0.0049, + "step": 280430 + }, + { + "epoch": 1.41, + "learning_rate": 8.777161711509452e-05, + "loss": 0.0099, + "step": 280440 + }, + { + "epoch": 1.41, + "learning_rate": 8.77640494220805e-05, + "loss": 0.0074, + "step": 280450 + }, + { + "epoch": 1.41, + "learning_rate": 8.77564817290665e-05, + "loss": 0.0061, + "step": 280460 + }, + { + "epoch": 1.42, + "learning_rate": 8.774891403605248e-05, + "loss": 0.0074, + "step": 280470 + }, + { + "epoch": 1.42, + "learning_rate": 8.774134634303848e-05, + "loss": 0.0063, + "step": 280480 + }, + { + "epoch": 1.42, + "learning_rate": 8.773377865002447e-05, + "loss": 0.0077, + "step": 280490 + }, + { + "epoch": 1.42, + "learning_rate": 8.772621095701045e-05, + "loss": 0.0076, + "step": 280500 + }, + { + "epoch": 1.42, + "learning_rate": 8.771864326399645e-05, + "loss": 0.0074, + "step": 280510 + }, + { + "epoch": 1.42, + "learning_rate": 8.771107557098244e-05, + "loss": 0.0058, + "step": 280520 + }, + { + "epoch": 1.42, + "learning_rate": 8.770350787796842e-05, + "loss": 0.0072, + "step": 280530 + }, + { + "epoch": 1.42, + "learning_rate": 8.769594018495442e-05, + "loss": 0.0066, + "step": 280540 + }, + { + "epoch": 1.42, + "learning_rate": 8.76883724919404e-05, + "loss": 0.0074, + "step": 280550 + }, + { + "epoch": 1.42, + "learning_rate": 8.76808047989264e-05, + "loss": 0.0075, + "step": 280560 + }, + { + "epoch": 1.42, + "learning_rate": 8.767323710591239e-05, + "loss": 0.0091, + "step": 280570 + }, + { + "epoch": 1.42, + "learning_rate": 8.766566941289837e-05, + "loss": 0.006, + "step": 280580 + }, + { + "epoch": 1.42, + "learning_rate": 8.765810171988437e-05, + "loss": 0.0088, + "step": 280590 + }, + { + "epoch": 1.42, + "learning_rate": 8.765053402687033e-05, + "loss": 0.0076, + "step": 280600 + }, + { + "epoch": 1.42, + "learning_rate": 8.764296633385633e-05, + "loss": 0.009, + "step": 280610 + }, + { + "epoch": 1.42, + "learning_rate": 8.763539864084232e-05, + "loss": 0.0063, + "step": 280620 + }, + { + "epoch": 1.42, + "learning_rate": 8.76278309478283e-05, + "loss": 0.0081, + "step": 280630 + }, + { + "epoch": 1.42, + "learning_rate": 8.76202632548143e-05, + "loss": 0.0071, + "step": 280640 + }, + { + "epoch": 1.42, + "learning_rate": 8.761269556180028e-05, + "loss": 0.0088, + "step": 280650 + }, + { + "epoch": 1.42, + "learning_rate": 8.760512786878628e-05, + "loss": 0.0095, + "step": 280660 + }, + { + "epoch": 1.42, + "learning_rate": 8.759756017577227e-05, + "loss": 0.0079, + "step": 280670 + }, + { + "epoch": 1.42, + "learning_rate": 8.758999248275825e-05, + "loss": 0.0133, + "step": 280680 + }, + { + "epoch": 1.42, + "learning_rate": 8.758242478974425e-05, + "loss": 0.0079, + "step": 280690 + }, + { + "epoch": 1.42, + "learning_rate": 8.757485709673024e-05, + "loss": 0.0084, + "step": 280700 + }, + { + "epoch": 1.42, + "learning_rate": 8.756728940371623e-05, + "loss": 0.0092, + "step": 280710 + }, + { + "epoch": 1.42, + "learning_rate": 8.755972171070222e-05, + "loss": 0.0055, + "step": 280720 + }, + { + "epoch": 1.42, + "learning_rate": 8.75521540176882e-05, + "loss": 0.0091, + "step": 280730 + }, + { + "epoch": 1.42, + "learning_rate": 8.75445863246742e-05, + "loss": 0.0068, + "step": 280740 + }, + { + "epoch": 1.42, + "learning_rate": 8.753701863166019e-05, + "loss": 0.0069, + "step": 280750 + }, + { + "epoch": 1.42, + "learning_rate": 8.752945093864617e-05, + "loss": 0.0091, + "step": 280760 + }, + { + "epoch": 1.42, + "learning_rate": 8.752188324563217e-05, + "loss": 0.0101, + "step": 280770 + }, + { + "epoch": 1.42, + "learning_rate": 8.751431555261816e-05, + "loss": 0.0064, + "step": 280780 + }, + { + "epoch": 1.42, + "learning_rate": 8.750674785960414e-05, + "loss": 0.0068, + "step": 280790 + }, + { + "epoch": 1.42, + "learning_rate": 8.749918016659014e-05, + "loss": 0.0088, + "step": 280800 + }, + { + "epoch": 1.42, + "learning_rate": 8.749161247357613e-05, + "loss": 0.008, + "step": 280810 + }, + { + "epoch": 1.42, + "learning_rate": 8.748404478056212e-05, + "loss": 0.0075, + "step": 280820 + }, + { + "epoch": 1.42, + "learning_rate": 8.747647708754811e-05, + "loss": 0.0063, + "step": 280830 + }, + { + "epoch": 1.42, + "learning_rate": 8.746890939453409e-05, + "loss": 0.0058, + "step": 280840 + }, + { + "epoch": 1.42, + "learning_rate": 8.746134170152009e-05, + "loss": 0.0066, + "step": 280850 + }, + { + "epoch": 1.42, + "learning_rate": 8.745377400850608e-05, + "loss": 0.0055, + "step": 280860 + }, + { + "epoch": 1.42, + "learning_rate": 8.744620631549206e-05, + "loss": 0.011, + "step": 280870 + }, + { + "epoch": 1.42, + "learning_rate": 8.743863862247806e-05, + "loss": 0.0079, + "step": 280880 + }, + { + "epoch": 1.42, + "learning_rate": 8.743107092946405e-05, + "loss": 0.008, + "step": 280890 + }, + { + "epoch": 1.42, + "learning_rate": 8.742350323645004e-05, + "loss": 0.0079, + "step": 280900 + }, + { + "epoch": 1.42, + "learning_rate": 8.741593554343603e-05, + "loss": 0.006, + "step": 280910 + }, + { + "epoch": 1.42, + "learning_rate": 8.740836785042201e-05, + "loss": 0.0065, + "step": 280920 + }, + { + "epoch": 1.42, + "learning_rate": 8.740080015740801e-05, + "loss": 0.0091, + "step": 280930 + }, + { + "epoch": 1.42, + "learning_rate": 8.7393232464394e-05, + "loss": 0.008, + "step": 280940 + }, + { + "epoch": 1.42, + "learning_rate": 8.738566477137998e-05, + "loss": 0.0059, + "step": 280950 + }, + { + "epoch": 1.42, + "learning_rate": 8.737809707836598e-05, + "loss": 0.008, + "step": 280960 + }, + { + "epoch": 1.42, + "learning_rate": 8.737052938535197e-05, + "loss": 0.0063, + "step": 280970 + }, + { + "epoch": 1.42, + "learning_rate": 8.736296169233795e-05, + "loss": 0.0103, + "step": 280980 + }, + { + "epoch": 1.42, + "learning_rate": 8.735539399932395e-05, + "loss": 0.006, + "step": 280990 + }, + { + "epoch": 1.42, + "learning_rate": 8.734782630630993e-05, + "loss": 0.0063, + "step": 281000 + }, + { + "epoch": 1.42, + "eval_cer": 0.9144333808503969, + "eval_loss": 0.0056717172265052795, + "eval_runtime": 115.6852, + "eval_samples_per_second": 17.288, + "eval_steps_per_second": 4.322, + "step": 281000 + }, + { + "epoch": 1.42, + "learning_rate": 8.734025861329593e-05, + "loss": 0.013, + "step": 281010 + }, + { + "epoch": 1.42, + "learning_rate": 8.733269092028192e-05, + "loss": 0.0076, + "step": 281020 + }, + { + "epoch": 1.42, + "learning_rate": 8.73251232272679e-05, + "loss": 0.0083, + "step": 281030 + }, + { + "epoch": 1.42, + "learning_rate": 8.73175555342539e-05, + "loss": 0.0075, + "step": 281040 + }, + { + "epoch": 1.42, + "learning_rate": 8.730998784123989e-05, + "loss": 0.006, + "step": 281050 + }, + { + "epoch": 1.42, + "learning_rate": 8.730242014822587e-05, + "loss": 0.0078, + "step": 281060 + }, + { + "epoch": 1.42, + "learning_rate": 8.729485245521187e-05, + "loss": 0.007, + "step": 281070 + }, + { + "epoch": 1.42, + "learning_rate": 8.728728476219785e-05, + "loss": 0.008, + "step": 281080 + }, + { + "epoch": 1.42, + "learning_rate": 8.727971706918385e-05, + "loss": 0.008, + "step": 281090 + }, + { + "epoch": 1.42, + "learning_rate": 8.727214937616984e-05, + "loss": 0.0062, + "step": 281100 + }, + { + "epoch": 1.42, + "learning_rate": 8.726458168315582e-05, + "loss": 0.0086, + "step": 281110 + }, + { + "epoch": 1.42, + "learning_rate": 8.725701399014182e-05, + "loss": 0.007, + "step": 281120 + }, + { + "epoch": 1.42, + "learning_rate": 8.724944629712781e-05, + "loss": 0.0095, + "step": 281130 + }, + { + "epoch": 1.42, + "learning_rate": 8.72418786041138e-05, + "loss": 0.0093, + "step": 281140 + }, + { + "epoch": 1.42, + "learning_rate": 8.723431091109979e-05, + "loss": 0.0066, + "step": 281150 + }, + { + "epoch": 1.42, + "learning_rate": 8.722674321808577e-05, + "loss": 0.0068, + "step": 281160 + }, + { + "epoch": 1.42, + "learning_rate": 8.721917552507176e-05, + "loss": 0.0051, + "step": 281170 + }, + { + "epoch": 1.42, + "learning_rate": 8.721160783205776e-05, + "loss": 0.0067, + "step": 281180 + }, + { + "epoch": 1.42, + "learning_rate": 8.720404013904374e-05, + "loss": 0.0088, + "step": 281190 + }, + { + "epoch": 1.42, + "learning_rate": 8.719647244602974e-05, + "loss": 0.0079, + "step": 281200 + }, + { + "epoch": 1.42, + "learning_rate": 8.718890475301573e-05, + "loss": 0.0084, + "step": 281210 + }, + { + "epoch": 1.42, + "learning_rate": 8.718133706000171e-05, + "loss": 0.0057, + "step": 281220 + }, + { + "epoch": 1.42, + "learning_rate": 8.71737693669877e-05, + "loss": 0.0094, + "step": 281230 + }, + { + "epoch": 1.42, + "learning_rate": 8.716620167397368e-05, + "loss": 0.0061, + "step": 281240 + }, + { + "epoch": 1.42, + "learning_rate": 8.715863398095967e-05, + "loss": 0.0065, + "step": 281250 + }, + { + "epoch": 1.42, + "learning_rate": 8.715106628794567e-05, + "loss": 0.0065, + "step": 281260 + }, + { + "epoch": 1.42, + "learning_rate": 8.714349859493165e-05, + "loss": 0.0082, + "step": 281270 + }, + { + "epoch": 1.42, + "learning_rate": 8.713593090191764e-05, + "loss": 0.0081, + "step": 281280 + }, + { + "epoch": 1.42, + "learning_rate": 8.712836320890362e-05, + "loss": 0.0062, + "step": 281290 + }, + { + "epoch": 1.42, + "learning_rate": 8.712079551588962e-05, + "loss": 0.007, + "step": 281300 + }, + { + "epoch": 1.42, + "learning_rate": 8.711322782287561e-05, + "loss": 0.0088, + "step": 281310 + }, + { + "epoch": 1.42, + "learning_rate": 8.71056601298616e-05, + "loss": 0.0084, + "step": 281320 + }, + { + "epoch": 1.42, + "learning_rate": 8.709809243684759e-05, + "loss": 0.0091, + "step": 281330 + }, + { + "epoch": 1.42, + "learning_rate": 8.709052474383359e-05, + "loss": 0.0081, + "step": 281340 + }, + { + "epoch": 1.42, + "learning_rate": 8.708295705081957e-05, + "loss": 0.0078, + "step": 281350 + }, + { + "epoch": 1.42, + "learning_rate": 8.707538935780556e-05, + "loss": 0.0079, + "step": 281360 + }, + { + "epoch": 1.42, + "learning_rate": 8.706782166479154e-05, + "loss": 0.0084, + "step": 281370 + }, + { + "epoch": 1.42, + "learning_rate": 8.706025397177754e-05, + "loss": 0.0046, + "step": 281380 + }, + { + "epoch": 1.42, + "learning_rate": 8.705268627876353e-05, + "loss": 0.0079, + "step": 281390 + }, + { + "epoch": 1.42, + "learning_rate": 8.704511858574951e-05, + "loss": 0.0096, + "step": 281400 + }, + { + "epoch": 1.42, + "learning_rate": 8.703755089273551e-05, + "loss": 0.0068, + "step": 281410 + }, + { + "epoch": 1.42, + "learning_rate": 8.70299831997215e-05, + "loss": 0.0091, + "step": 281420 + }, + { + "epoch": 1.42, + "learning_rate": 8.702241550670749e-05, + "loss": 0.007, + "step": 281430 + }, + { + "epoch": 1.42, + "learning_rate": 8.701484781369348e-05, + "loss": 0.007, + "step": 281440 + }, + { + "epoch": 1.42, + "learning_rate": 8.700728012067946e-05, + "loss": 0.0126, + "step": 281450 + }, + { + "epoch": 1.42, + "learning_rate": 8.699971242766546e-05, + "loss": 0.008, + "step": 281460 + }, + { + "epoch": 1.42, + "learning_rate": 8.699214473465145e-05, + "loss": 0.0085, + "step": 281470 + }, + { + "epoch": 1.42, + "learning_rate": 8.698457704163743e-05, + "loss": 0.0089, + "step": 281480 + }, + { + "epoch": 1.42, + "learning_rate": 8.697700934862343e-05, + "loss": 0.0081, + "step": 281490 + }, + { + "epoch": 1.42, + "learning_rate": 8.696944165560942e-05, + "loss": 0.0075, + "step": 281500 + }, + { + "epoch": 1.42, + "learning_rate": 8.69618739625954e-05, + "loss": 0.0077, + "step": 281510 + }, + { + "epoch": 1.42, + "learning_rate": 8.69543062695814e-05, + "loss": 0.0078, + "step": 281520 + }, + { + "epoch": 1.42, + "learning_rate": 8.694673857656738e-05, + "loss": 0.0061, + "step": 281530 + }, + { + "epoch": 1.42, + "learning_rate": 8.693917088355338e-05, + "loss": 0.0076, + "step": 281540 + }, + { + "epoch": 1.42, + "learning_rate": 8.693160319053937e-05, + "loss": 0.0069, + "step": 281550 + }, + { + "epoch": 1.42, + "learning_rate": 8.692403549752535e-05, + "loss": 0.0083, + "step": 281560 + }, + { + "epoch": 1.42, + "learning_rate": 8.691646780451135e-05, + "loss": 0.0094, + "step": 281570 + }, + { + "epoch": 1.42, + "learning_rate": 8.690890011149734e-05, + "loss": 0.0055, + "step": 281580 + }, + { + "epoch": 1.42, + "learning_rate": 8.690133241848332e-05, + "loss": 0.0089, + "step": 281590 + }, + { + "epoch": 1.42, + "learning_rate": 8.689376472546932e-05, + "loss": 0.0072, + "step": 281600 + }, + { + "epoch": 1.42, + "learning_rate": 8.68861970324553e-05, + "loss": 0.0072, + "step": 281610 + }, + { + "epoch": 1.42, + "learning_rate": 8.68786293394413e-05, + "loss": 0.0119, + "step": 281620 + }, + { + "epoch": 1.42, + "learning_rate": 8.687106164642729e-05, + "loss": 0.0078, + "step": 281630 + }, + { + "epoch": 1.42, + "learning_rate": 8.686349395341327e-05, + "loss": 0.0089, + "step": 281640 + }, + { + "epoch": 1.42, + "learning_rate": 8.685592626039927e-05, + "loss": 0.0082, + "step": 281650 + }, + { + "epoch": 1.42, + "learning_rate": 8.684835856738526e-05, + "loss": 0.0086, + "step": 281660 + }, + { + "epoch": 1.42, + "learning_rate": 8.684079087437124e-05, + "loss": 0.0081, + "step": 281670 + }, + { + "epoch": 1.42, + "learning_rate": 8.683322318135724e-05, + "loss": 0.0073, + "step": 281680 + }, + { + "epoch": 1.42, + "learning_rate": 8.682565548834322e-05, + "loss": 0.0078, + "step": 281690 + }, + { + "epoch": 1.42, + "learning_rate": 8.681808779532922e-05, + "loss": 0.0077, + "step": 281700 + }, + { + "epoch": 1.42, + "learning_rate": 8.681052010231521e-05, + "loss": 0.0157, + "step": 281710 + }, + { + "epoch": 1.42, + "learning_rate": 8.680295240930119e-05, + "loss": 0.0071, + "step": 281720 + }, + { + "epoch": 1.42, + "learning_rate": 8.679538471628719e-05, + "loss": 0.0096, + "step": 281730 + }, + { + "epoch": 1.42, + "learning_rate": 8.678781702327318e-05, + "loss": 0.0093, + "step": 281740 + }, + { + "epoch": 1.42, + "learning_rate": 8.678024933025916e-05, + "loss": 0.0089, + "step": 281750 + }, + { + "epoch": 1.42, + "learning_rate": 8.677268163724516e-05, + "loss": 0.006, + "step": 281760 + }, + { + "epoch": 1.42, + "learning_rate": 8.676511394423114e-05, + "loss": 0.008, + "step": 281770 + }, + { + "epoch": 1.42, + "learning_rate": 8.675754625121713e-05, + "loss": 0.007, + "step": 281780 + }, + { + "epoch": 1.42, + "learning_rate": 8.674997855820313e-05, + "loss": 0.0085, + "step": 281790 + }, + { + "epoch": 1.42, + "learning_rate": 8.674241086518911e-05, + "loss": 0.0058, + "step": 281800 + }, + { + "epoch": 1.42, + "learning_rate": 8.67348431721751e-05, + "loss": 0.0073, + "step": 281810 + }, + { + "epoch": 1.42, + "learning_rate": 8.67272754791611e-05, + "loss": 0.0072, + "step": 281820 + }, + { + "epoch": 1.42, + "learning_rate": 8.671970778614708e-05, + "loss": 0.0065, + "step": 281830 + }, + { + "epoch": 1.42, + "learning_rate": 8.671214009313308e-05, + "loss": 0.0092, + "step": 281840 + }, + { + "epoch": 1.42, + "learning_rate": 8.670457240011907e-05, + "loss": 0.0075, + "step": 281850 + }, + { + "epoch": 1.42, + "learning_rate": 8.669700470710504e-05, + "loss": 0.0083, + "step": 281860 + }, + { + "epoch": 1.42, + "learning_rate": 8.668943701409104e-05, + "loss": 0.0101, + "step": 281870 + }, + { + "epoch": 1.42, + "learning_rate": 8.668186932107702e-05, + "loss": 0.0076, + "step": 281880 + }, + { + "epoch": 1.42, + "learning_rate": 8.667430162806301e-05, + "loss": 0.0057, + "step": 281890 + }, + { + "epoch": 1.42, + "learning_rate": 8.666673393504899e-05, + "loss": 0.0069, + "step": 281900 + }, + { + "epoch": 1.42, + "learning_rate": 8.665916624203499e-05, + "loss": 0.0071, + "step": 281910 + }, + { + "epoch": 1.42, + "learning_rate": 8.665159854902098e-05, + "loss": 0.0088, + "step": 281920 + }, + { + "epoch": 1.42, + "learning_rate": 8.664403085600696e-05, + "loss": 0.0092, + "step": 281930 + }, + { + "epoch": 1.42, + "learning_rate": 8.663646316299296e-05, + "loss": 0.0067, + "step": 281940 + }, + { + "epoch": 1.42, + "learning_rate": 8.662889546997895e-05, + "loss": 0.0076, + "step": 281950 + }, + { + "epoch": 1.42, + "learning_rate": 8.662132777696494e-05, + "loss": 0.0079, + "step": 281960 + }, + { + "epoch": 1.42, + "learning_rate": 8.661376008395093e-05, + "loss": 0.0076, + "step": 281970 + }, + { + "epoch": 1.42, + "learning_rate": 8.660619239093691e-05, + "loss": 0.0057, + "step": 281980 + }, + { + "epoch": 1.42, + "learning_rate": 8.659862469792291e-05, + "loss": 0.0067, + "step": 281990 + }, + { + "epoch": 1.42, + "learning_rate": 8.65910570049089e-05, + "loss": 0.0071, + "step": 282000 + }, + { + "epoch": 1.42, + "eval_cer": 0.9144411440194001, + "eval_loss": 0.005825493950396776, + "eval_runtime": 115.8458, + "eval_samples_per_second": 17.264, + "eval_steps_per_second": 4.316, + "step": 282000 + }, + { + "epoch": 1.42, + "learning_rate": 8.658348931189488e-05, + "loss": 0.0092, + "step": 282010 + }, + { + "epoch": 1.42, + "learning_rate": 8.657592161888088e-05, + "loss": 0.0068, + "step": 282020 + }, + { + "epoch": 1.42, + "learning_rate": 8.656835392586687e-05, + "loss": 0.0086, + "step": 282030 + }, + { + "epoch": 1.42, + "learning_rate": 8.656078623285286e-05, + "loss": 0.0094, + "step": 282040 + }, + { + "epoch": 1.42, + "learning_rate": 8.655321853983885e-05, + "loss": 0.0084, + "step": 282050 + }, + { + "epoch": 1.42, + "learning_rate": 8.654565084682483e-05, + "loss": 0.0071, + "step": 282060 + }, + { + "epoch": 1.42, + "learning_rate": 8.653808315381083e-05, + "loss": 0.008, + "step": 282070 + }, + { + "epoch": 1.42, + "learning_rate": 8.653051546079682e-05, + "loss": 0.0097, + "step": 282080 + }, + { + "epoch": 1.42, + "learning_rate": 8.65229477677828e-05, + "loss": 0.0075, + "step": 282090 + }, + { + "epoch": 1.42, + "learning_rate": 8.65153800747688e-05, + "loss": 0.0071, + "step": 282100 + }, + { + "epoch": 1.42, + "learning_rate": 8.650781238175479e-05, + "loss": 0.0071, + "step": 282110 + }, + { + "epoch": 1.42, + "learning_rate": 8.650024468874077e-05, + "loss": 0.0104, + "step": 282120 + }, + { + "epoch": 1.42, + "learning_rate": 8.649267699572677e-05, + "loss": 0.009, + "step": 282130 + }, + { + "epoch": 1.42, + "learning_rate": 8.648510930271275e-05, + "loss": 0.0076, + "step": 282140 + }, + { + "epoch": 1.42, + "learning_rate": 8.647754160969875e-05, + "loss": 0.0108, + "step": 282150 + }, + { + "epoch": 1.42, + "learning_rate": 8.646997391668474e-05, + "loss": 0.0059, + "step": 282160 + }, + { + "epoch": 1.42, + "learning_rate": 8.646240622367072e-05, + "loss": 0.0081, + "step": 282170 + }, + { + "epoch": 1.42, + "learning_rate": 8.645483853065672e-05, + "loss": 0.0078, + "step": 282180 + }, + { + "epoch": 1.42, + "learning_rate": 8.644727083764271e-05, + "loss": 0.0074, + "step": 282190 + }, + { + "epoch": 1.42, + "learning_rate": 8.64397031446287e-05, + "loss": 0.0103, + "step": 282200 + }, + { + "epoch": 1.42, + "learning_rate": 8.643213545161469e-05, + "loss": 0.0076, + "step": 282210 + }, + { + "epoch": 1.42, + "learning_rate": 8.642456775860067e-05, + "loss": 0.0071, + "step": 282220 + }, + { + "epoch": 1.42, + "learning_rate": 8.641700006558667e-05, + "loss": 0.0054, + "step": 282230 + }, + { + "epoch": 1.42, + "learning_rate": 8.640943237257266e-05, + "loss": 0.0093, + "step": 282240 + }, + { + "epoch": 1.42, + "learning_rate": 8.640186467955864e-05, + "loss": 0.0078, + "step": 282250 + }, + { + "epoch": 1.42, + "learning_rate": 8.639429698654464e-05, + "loss": 0.008, + "step": 282260 + }, + { + "epoch": 1.42, + "learning_rate": 8.638672929353063e-05, + "loss": 0.0095, + "step": 282270 + }, + { + "epoch": 1.42, + "learning_rate": 8.637916160051661e-05, + "loss": 0.0071, + "step": 282280 + }, + { + "epoch": 1.42, + "learning_rate": 8.637159390750261e-05, + "loss": 0.0089, + "step": 282290 + }, + { + "epoch": 1.42, + "learning_rate": 8.63640262144886e-05, + "loss": 0.0081, + "step": 282300 + }, + { + "epoch": 1.42, + "learning_rate": 8.635645852147458e-05, + "loss": 0.0067, + "step": 282310 + }, + { + "epoch": 1.42, + "learning_rate": 8.634889082846058e-05, + "loss": 0.0076, + "step": 282320 + }, + { + "epoch": 1.42, + "learning_rate": 8.634132313544656e-05, + "loss": 0.0069, + "step": 282330 + }, + { + "epoch": 1.42, + "learning_rate": 8.633375544243256e-05, + "loss": 0.0079, + "step": 282340 + }, + { + "epoch": 1.42, + "learning_rate": 8.632618774941855e-05, + "loss": 0.0069, + "step": 282350 + }, + { + "epoch": 1.42, + "learning_rate": 8.631862005640453e-05, + "loss": 0.0093, + "step": 282360 + }, + { + "epoch": 1.42, + "learning_rate": 8.631105236339053e-05, + "loss": 0.0074, + "step": 282370 + }, + { + "epoch": 1.42, + "learning_rate": 8.630348467037652e-05, + "loss": 0.0065, + "step": 282380 + }, + { + "epoch": 1.42, + "learning_rate": 8.62959169773625e-05, + "loss": 0.0073, + "step": 282390 + }, + { + "epoch": 1.42, + "learning_rate": 8.62883492843485e-05, + "loss": 0.0065, + "step": 282400 + }, + { + "epoch": 1.42, + "learning_rate": 8.628078159133448e-05, + "loss": 0.009, + "step": 282410 + }, + { + "epoch": 1.42, + "learning_rate": 8.627321389832048e-05, + "loss": 0.007, + "step": 282420 + }, + { + "epoch": 1.42, + "learning_rate": 8.626564620530647e-05, + "loss": 0.0077, + "step": 282430 + }, + { + "epoch": 1.42, + "learning_rate": 8.625807851229245e-05, + "loss": 0.0073, + "step": 282440 + }, + { + "epoch": 1.42, + "learning_rate": 8.625051081927845e-05, + "loss": 0.0081, + "step": 282450 + }, + { + "epoch": 1.43, + "learning_rate": 8.624294312626444e-05, + "loss": 0.0091, + "step": 282460 + }, + { + "epoch": 1.43, + "learning_rate": 8.623537543325042e-05, + "loss": 0.0093, + "step": 282470 + }, + { + "epoch": 1.43, + "learning_rate": 8.622780774023642e-05, + "loss": 0.0075, + "step": 282480 + }, + { + "epoch": 1.43, + "learning_rate": 8.622024004722239e-05, + "loss": 0.008, + "step": 282490 + }, + { + "epoch": 1.43, + "learning_rate": 8.621267235420838e-05, + "loss": 0.0081, + "step": 282500 + }, + { + "epoch": 1.43, + "learning_rate": 8.620510466119436e-05, + "loss": 0.0064, + "step": 282510 + }, + { + "epoch": 1.43, + "learning_rate": 8.619753696818036e-05, + "loss": 0.008, + "step": 282520 + }, + { + "epoch": 1.43, + "learning_rate": 8.618996927516635e-05, + "loss": 0.0079, + "step": 282530 + }, + { + "epoch": 1.43, + "learning_rate": 8.618240158215233e-05, + "loss": 0.0087, + "step": 282540 + }, + { + "epoch": 1.43, + "learning_rate": 8.617483388913833e-05, + "loss": 0.0072, + "step": 282550 + }, + { + "epoch": 1.43, + "learning_rate": 8.616726619612432e-05, + "loss": 0.0066, + "step": 282560 + }, + { + "epoch": 1.43, + "learning_rate": 8.61596985031103e-05, + "loss": 0.009, + "step": 282570 + }, + { + "epoch": 1.43, + "learning_rate": 8.61521308100963e-05, + "loss": 0.0083, + "step": 282580 + }, + { + "epoch": 1.43, + "learning_rate": 8.614456311708228e-05, + "loss": 0.0065, + "step": 282590 + }, + { + "epoch": 1.43, + "learning_rate": 8.613699542406828e-05, + "loss": 0.0079, + "step": 282600 + }, + { + "epoch": 1.43, + "learning_rate": 8.612942773105427e-05, + "loss": 0.0071, + "step": 282610 + }, + { + "epoch": 1.43, + "learning_rate": 8.612186003804025e-05, + "loss": 0.009, + "step": 282620 + }, + { + "epoch": 1.43, + "learning_rate": 8.611429234502625e-05, + "loss": 0.0072, + "step": 282630 + }, + { + "epoch": 1.43, + "learning_rate": 8.610672465201224e-05, + "loss": 0.008, + "step": 282640 + }, + { + "epoch": 1.43, + "learning_rate": 8.609915695899822e-05, + "loss": 0.0062, + "step": 282650 + }, + { + "epoch": 1.43, + "learning_rate": 8.609158926598422e-05, + "loss": 0.0074, + "step": 282660 + }, + { + "epoch": 1.43, + "learning_rate": 8.60840215729702e-05, + "loss": 0.0065, + "step": 282670 + }, + { + "epoch": 1.43, + "learning_rate": 8.60764538799562e-05, + "loss": 0.0081, + "step": 282680 + }, + { + "epoch": 1.43, + "learning_rate": 8.606888618694219e-05, + "loss": 0.0078, + "step": 282690 + }, + { + "epoch": 1.43, + "learning_rate": 8.606131849392817e-05, + "loss": 0.0062, + "step": 282700 + }, + { + "epoch": 1.43, + "learning_rate": 8.605375080091417e-05, + "loss": 0.007, + "step": 282710 + }, + { + "epoch": 1.43, + "learning_rate": 8.604618310790016e-05, + "loss": 0.0081, + "step": 282720 + }, + { + "epoch": 1.43, + "learning_rate": 8.603861541488614e-05, + "loss": 0.009, + "step": 282730 + }, + { + "epoch": 1.43, + "learning_rate": 8.603104772187214e-05, + "loss": 0.0065, + "step": 282740 + }, + { + "epoch": 1.43, + "learning_rate": 8.602348002885813e-05, + "loss": 0.007, + "step": 282750 + }, + { + "epoch": 1.43, + "learning_rate": 8.601591233584412e-05, + "loss": 0.0077, + "step": 282760 + }, + { + "epoch": 1.43, + "learning_rate": 8.600834464283011e-05, + "loss": 0.0069, + "step": 282770 + }, + { + "epoch": 1.43, + "learning_rate": 8.600077694981609e-05, + "loss": 0.0089, + "step": 282780 + }, + { + "epoch": 1.43, + "learning_rate": 8.599320925680209e-05, + "loss": 0.0071, + "step": 282790 + }, + { + "epoch": 1.43, + "learning_rate": 8.598564156378808e-05, + "loss": 0.007, + "step": 282800 + }, + { + "epoch": 1.43, + "learning_rate": 8.597807387077406e-05, + "loss": 0.0068, + "step": 282810 + }, + { + "epoch": 1.43, + "learning_rate": 8.597050617776006e-05, + "loss": 0.0091, + "step": 282820 + }, + { + "epoch": 1.43, + "learning_rate": 8.596293848474605e-05, + "loss": 0.0063, + "step": 282830 + }, + { + "epoch": 1.43, + "learning_rate": 8.595537079173203e-05, + "loss": 0.0078, + "step": 282840 + }, + { + "epoch": 1.43, + "learning_rate": 8.594780309871803e-05, + "loss": 0.0053, + "step": 282850 + }, + { + "epoch": 1.43, + "learning_rate": 8.594023540570401e-05, + "loss": 0.0067, + "step": 282860 + }, + { + "epoch": 1.43, + "learning_rate": 8.593266771269e-05, + "loss": 0.0078, + "step": 282870 + }, + { + "epoch": 1.43, + "learning_rate": 8.5925100019676e-05, + "loss": 0.0084, + "step": 282880 + }, + { + "epoch": 1.43, + "learning_rate": 8.591753232666198e-05, + "loss": 0.0067, + "step": 282890 + }, + { + "epoch": 1.43, + "learning_rate": 8.590996463364798e-05, + "loss": 0.0077, + "step": 282900 + }, + { + "epoch": 1.43, + "learning_rate": 8.590239694063397e-05, + "loss": 0.0089, + "step": 282910 + }, + { + "epoch": 1.43, + "learning_rate": 8.589482924761995e-05, + "loss": 0.0068, + "step": 282920 + }, + { + "epoch": 1.43, + "learning_rate": 8.588726155460595e-05, + "loss": 0.0072, + "step": 282930 + }, + { + "epoch": 1.43, + "learning_rate": 8.587969386159193e-05, + "loss": 0.0078, + "step": 282940 + }, + { + "epoch": 1.43, + "learning_rate": 8.587212616857793e-05, + "loss": 0.0083, + "step": 282950 + }, + { + "epoch": 1.43, + "learning_rate": 8.586455847556392e-05, + "loss": 0.0083, + "step": 282960 + }, + { + "epoch": 1.43, + "learning_rate": 8.58569907825499e-05, + "loss": 0.0081, + "step": 282970 + }, + { + "epoch": 1.43, + "learning_rate": 8.58494230895359e-05, + "loss": 0.0056, + "step": 282980 + }, + { + "epoch": 1.43, + "learning_rate": 8.584185539652189e-05, + "loss": 0.0069, + "step": 282990 + }, + { + "epoch": 1.43, + "learning_rate": 8.583428770350787e-05, + "loss": 0.0087, + "step": 283000 + }, + { + "epoch": 1.43, + "eval_cer": 0.9144392032271493, + "eval_loss": 0.005669817794114351, + "eval_runtime": 115.6754, + "eval_samples_per_second": 17.29, + "eval_steps_per_second": 4.322, + "step": 283000 + }, + { + "epoch": 1.43, + "learning_rate": 8.582672001049387e-05, + "loss": 0.01, + "step": 283010 + }, + { + "epoch": 1.43, + "learning_rate": 8.581915231747985e-05, + "loss": 0.007, + "step": 283020 + }, + { + "epoch": 1.43, + "learning_rate": 8.581158462446584e-05, + "loss": 0.0089, + "step": 283030 + }, + { + "epoch": 1.43, + "learning_rate": 8.580401693145184e-05, + "loss": 0.007, + "step": 283040 + }, + { + "epoch": 1.43, + "learning_rate": 8.579644923843782e-05, + "loss": 0.0098, + "step": 283050 + }, + { + "epoch": 1.43, + "learning_rate": 8.578888154542382e-05, + "loss": 0.0071, + "step": 283060 + }, + { + "epoch": 1.43, + "learning_rate": 8.578131385240981e-05, + "loss": 0.0091, + "step": 283070 + }, + { + "epoch": 1.43, + "learning_rate": 8.577374615939579e-05, + "loss": 0.0081, + "step": 283080 + }, + { + "epoch": 1.43, + "learning_rate": 8.576617846638179e-05, + "loss": 0.008, + "step": 283090 + }, + { + "epoch": 1.43, + "learning_rate": 8.575861077336777e-05, + "loss": 0.0062, + "step": 283100 + }, + { + "epoch": 1.43, + "learning_rate": 8.575104308035376e-05, + "loss": 0.008, + "step": 283110 + }, + { + "epoch": 1.43, + "learning_rate": 8.574347538733973e-05, + "loss": 0.0079, + "step": 283120 + }, + { + "epoch": 1.43, + "learning_rate": 8.573590769432573e-05, + "loss": 0.0073, + "step": 283130 + }, + { + "epoch": 1.43, + "learning_rate": 8.572834000131172e-05, + "loss": 0.0102, + "step": 283140 + }, + { + "epoch": 1.43, + "learning_rate": 8.57207723082977e-05, + "loss": 0.0078, + "step": 283150 + }, + { + "epoch": 1.43, + "learning_rate": 8.57132046152837e-05, + "loss": 0.008, + "step": 283160 + }, + { + "epoch": 1.43, + "learning_rate": 8.57056369222697e-05, + "loss": 0.0056, + "step": 283170 + }, + { + "epoch": 1.43, + "learning_rate": 8.569806922925567e-05, + "loss": 0.0093, + "step": 283180 + }, + { + "epoch": 1.43, + "learning_rate": 8.569050153624167e-05, + "loss": 0.0057, + "step": 283190 + }, + { + "epoch": 1.43, + "learning_rate": 8.568293384322766e-05, + "loss": 0.0064, + "step": 283200 + }, + { + "epoch": 1.43, + "learning_rate": 8.567536615021365e-05, + "loss": 0.0068, + "step": 283210 + }, + { + "epoch": 1.43, + "learning_rate": 8.566779845719964e-05, + "loss": 0.0078, + "step": 283220 + }, + { + "epoch": 1.43, + "learning_rate": 8.566023076418562e-05, + "loss": 0.0071, + "step": 283230 + }, + { + "epoch": 1.43, + "learning_rate": 8.565266307117162e-05, + "loss": 0.0067, + "step": 283240 + }, + { + "epoch": 1.43, + "learning_rate": 8.564509537815761e-05, + "loss": 0.0101, + "step": 283250 + }, + { + "epoch": 1.43, + "learning_rate": 8.56375276851436e-05, + "loss": 0.0059, + "step": 283260 + }, + { + "epoch": 1.43, + "learning_rate": 8.562995999212959e-05, + "loss": 0.0079, + "step": 283270 + }, + { + "epoch": 1.43, + "learning_rate": 8.562239229911558e-05, + "loss": 0.0073, + "step": 283280 + }, + { + "epoch": 1.43, + "learning_rate": 8.561482460610157e-05, + "loss": 0.0074, + "step": 283290 + }, + { + "epoch": 1.43, + "learning_rate": 8.560725691308756e-05, + "loss": 0.0044, + "step": 283300 + }, + { + "epoch": 1.43, + "learning_rate": 8.559968922007354e-05, + "loss": 0.0089, + "step": 283310 + }, + { + "epoch": 1.43, + "learning_rate": 8.559212152705954e-05, + "loss": 0.0085, + "step": 283320 + }, + { + "epoch": 1.43, + "learning_rate": 8.558455383404553e-05, + "loss": 0.0079, + "step": 283330 + }, + { + "epoch": 1.43, + "learning_rate": 8.557698614103151e-05, + "loss": 0.0064, + "step": 283340 + }, + { + "epoch": 1.43, + "learning_rate": 8.556941844801751e-05, + "loss": 0.0078, + "step": 283350 + }, + { + "epoch": 1.43, + "learning_rate": 8.55618507550035e-05, + "loss": 0.0079, + "step": 283360 + }, + { + "epoch": 1.43, + "learning_rate": 8.555428306198948e-05, + "loss": 0.0071, + "step": 283370 + }, + { + "epoch": 1.43, + "learning_rate": 8.554671536897548e-05, + "loss": 0.0076, + "step": 283380 + }, + { + "epoch": 1.43, + "learning_rate": 8.553914767596146e-05, + "loss": 0.0082, + "step": 283390 + }, + { + "epoch": 1.43, + "learning_rate": 8.553157998294746e-05, + "loss": 0.0068, + "step": 283400 + }, + { + "epoch": 1.43, + "learning_rate": 8.552401228993345e-05, + "loss": 0.0062, + "step": 283410 + }, + { + "epoch": 1.43, + "learning_rate": 8.551644459691943e-05, + "loss": 0.0094, + "step": 283420 + }, + { + "epoch": 1.43, + "learning_rate": 8.550887690390543e-05, + "loss": 0.0075, + "step": 283430 + }, + { + "epoch": 1.43, + "learning_rate": 8.550130921089142e-05, + "loss": 0.0068, + "step": 283440 + }, + { + "epoch": 1.43, + "learning_rate": 8.54937415178774e-05, + "loss": 0.0063, + "step": 283450 + }, + { + "epoch": 1.43, + "learning_rate": 8.54861738248634e-05, + "loss": 0.0087, + "step": 283460 + }, + { + "epoch": 1.43, + "learning_rate": 8.547860613184938e-05, + "loss": 0.0081, + "step": 283470 + }, + { + "epoch": 1.43, + "learning_rate": 8.547103843883538e-05, + "loss": 0.0083, + "step": 283480 + }, + { + "epoch": 1.43, + "learning_rate": 8.546347074582137e-05, + "loss": 0.0088, + "step": 283490 + }, + { + "epoch": 1.43, + "learning_rate": 8.545590305280735e-05, + "loss": 0.0065, + "step": 283500 + }, + { + "epoch": 1.43, + "learning_rate": 8.544833535979335e-05, + "loss": 0.0096, + "step": 283510 + }, + { + "epoch": 1.43, + "learning_rate": 8.544076766677934e-05, + "loss": 0.0085, + "step": 283520 + }, + { + "epoch": 1.43, + "learning_rate": 8.543319997376532e-05, + "loss": 0.0063, + "step": 283530 + }, + { + "epoch": 1.43, + "learning_rate": 8.542563228075132e-05, + "loss": 0.006, + "step": 283540 + }, + { + "epoch": 1.43, + "learning_rate": 8.54180645877373e-05, + "loss": 0.005, + "step": 283550 + }, + { + "epoch": 1.43, + "learning_rate": 8.54104968947233e-05, + "loss": 0.0066, + "step": 283560 + }, + { + "epoch": 1.43, + "learning_rate": 8.540292920170929e-05, + "loss": 0.0073, + "step": 283570 + }, + { + "epoch": 1.43, + "learning_rate": 8.539536150869527e-05, + "loss": 0.0068, + "step": 283580 + }, + { + "epoch": 1.43, + "learning_rate": 8.538779381568127e-05, + "loss": 0.0055, + "step": 283590 + }, + { + "epoch": 1.43, + "learning_rate": 8.538022612266726e-05, + "loss": 0.0061, + "step": 283600 + }, + { + "epoch": 1.43, + "learning_rate": 8.537265842965324e-05, + "loss": 0.0077, + "step": 283610 + }, + { + "epoch": 1.43, + "learning_rate": 8.536509073663924e-05, + "loss": 0.0086, + "step": 283620 + }, + { + "epoch": 1.43, + "learning_rate": 8.535752304362522e-05, + "loss": 0.0076, + "step": 283630 + }, + { + "epoch": 1.43, + "learning_rate": 8.534995535061121e-05, + "loss": 0.0093, + "step": 283640 + }, + { + "epoch": 1.43, + "learning_rate": 8.534238765759721e-05, + "loss": 0.0096, + "step": 283650 + }, + { + "epoch": 1.43, + "learning_rate": 8.533481996458319e-05, + "loss": 0.0069, + "step": 283660 + }, + { + "epoch": 1.43, + "learning_rate": 8.532725227156919e-05, + "loss": 0.0069, + "step": 283670 + }, + { + "epoch": 1.43, + "learning_rate": 8.531968457855518e-05, + "loss": 0.0083, + "step": 283680 + }, + { + "epoch": 1.43, + "learning_rate": 8.531211688554116e-05, + "loss": 0.0062, + "step": 283690 + }, + { + "epoch": 1.43, + "learning_rate": 8.530454919252716e-05, + "loss": 0.0092, + "step": 283700 + }, + { + "epoch": 1.43, + "learning_rate": 8.529698149951314e-05, + "loss": 0.0081, + "step": 283710 + }, + { + "epoch": 1.43, + "learning_rate": 8.528941380649913e-05, + "loss": 0.0065, + "step": 283720 + }, + { + "epoch": 1.43, + "learning_rate": 8.528184611348513e-05, + "loss": 0.0071, + "step": 283730 + }, + { + "epoch": 1.43, + "learning_rate": 8.527427842047111e-05, + "loss": 0.0082, + "step": 283740 + }, + { + "epoch": 1.43, + "learning_rate": 8.526671072745709e-05, + "loss": 0.0076, + "step": 283750 + }, + { + "epoch": 1.43, + "learning_rate": 8.525914303444307e-05, + "loss": 0.0057, + "step": 283760 + }, + { + "epoch": 1.43, + "learning_rate": 8.525157534142907e-05, + "loss": 0.0081, + "step": 283770 + }, + { + "epoch": 1.43, + "learning_rate": 8.524400764841506e-05, + "loss": 0.0063, + "step": 283780 + }, + { + "epoch": 1.43, + "learning_rate": 8.523643995540104e-05, + "loss": 0.0081, + "step": 283790 + }, + { + "epoch": 1.43, + "learning_rate": 8.522887226238704e-05, + "loss": 0.0073, + "step": 283800 + }, + { + "epoch": 1.43, + "learning_rate": 8.522130456937303e-05, + "loss": 0.0091, + "step": 283810 + }, + { + "epoch": 1.43, + "learning_rate": 8.521373687635902e-05, + "loss": 0.0066, + "step": 283820 + }, + { + "epoch": 1.43, + "learning_rate": 8.520616918334501e-05, + "loss": 0.0067, + "step": 283830 + }, + { + "epoch": 1.43, + "learning_rate": 8.519860149033099e-05, + "loss": 0.0079, + "step": 283840 + }, + { + "epoch": 1.43, + "learning_rate": 8.519103379731699e-05, + "loss": 0.0055, + "step": 283850 + }, + { + "epoch": 1.43, + "learning_rate": 8.518346610430298e-05, + "loss": 0.0081, + "step": 283860 + }, + { + "epoch": 1.43, + "learning_rate": 8.517589841128896e-05, + "loss": 0.0089, + "step": 283870 + }, + { + "epoch": 1.43, + "learning_rate": 8.516833071827496e-05, + "loss": 0.0066, + "step": 283880 + }, + { + "epoch": 1.43, + "learning_rate": 8.516076302526095e-05, + "loss": 0.0077, + "step": 283890 + }, + { + "epoch": 1.43, + "learning_rate": 8.515319533224693e-05, + "loss": 0.0061, + "step": 283900 + }, + { + "epoch": 1.43, + "learning_rate": 8.514562763923293e-05, + "loss": 0.0061, + "step": 283910 + }, + { + "epoch": 1.43, + "learning_rate": 8.513805994621891e-05, + "loss": 0.0083, + "step": 283920 + }, + { + "epoch": 1.43, + "learning_rate": 8.51304922532049e-05, + "loss": 0.0089, + "step": 283930 + }, + { + "epoch": 1.43, + "learning_rate": 8.51229245601909e-05, + "loss": 0.0094, + "step": 283940 + }, + { + "epoch": 1.43, + "learning_rate": 8.511535686717688e-05, + "loss": 0.0072, + "step": 283950 + }, + { + "epoch": 1.43, + "learning_rate": 8.510778917416288e-05, + "loss": 0.0075, + "step": 283960 + }, + { + "epoch": 1.43, + "learning_rate": 8.510022148114887e-05, + "loss": 0.0089, + "step": 283970 + }, + { + "epoch": 1.43, + "learning_rate": 8.509265378813485e-05, + "loss": 0.0087, + "step": 283980 + }, + { + "epoch": 1.43, + "learning_rate": 8.508508609512085e-05, + "loss": 0.0085, + "step": 283990 + }, + { + "epoch": 1.43, + "learning_rate": 8.507751840210683e-05, + "loss": 0.0077, + "step": 284000 + }, + { + "epoch": 1.43, + "eval_cer": 0.914452788772905, + "eval_loss": 0.005701255518943071, + "eval_runtime": 115.7531, + "eval_samples_per_second": 17.278, + "eval_steps_per_second": 4.32, + "step": 284000 + }, + { + "epoch": 1.43, + "learning_rate": 8.506995070909283e-05, + "loss": 0.0066, + "step": 284010 + }, + { + "epoch": 1.43, + "learning_rate": 8.506238301607882e-05, + "loss": 0.0096, + "step": 284020 + }, + { + "epoch": 1.43, + "learning_rate": 8.50548153230648e-05, + "loss": 0.0078, + "step": 284030 + }, + { + "epoch": 1.43, + "learning_rate": 8.50472476300508e-05, + "loss": 0.0065, + "step": 284040 + }, + { + "epoch": 1.43, + "learning_rate": 8.503967993703679e-05, + "loss": 0.0051, + "step": 284050 + }, + { + "epoch": 1.43, + "learning_rate": 8.503211224402277e-05, + "loss": 0.0086, + "step": 284060 + }, + { + "epoch": 1.43, + "learning_rate": 8.502454455100877e-05, + "loss": 0.0053, + "step": 284070 + }, + { + "epoch": 1.43, + "learning_rate": 8.501697685799475e-05, + "loss": 0.006, + "step": 284080 + }, + { + "epoch": 1.43, + "learning_rate": 8.500940916498074e-05, + "loss": 0.0067, + "step": 284090 + }, + { + "epoch": 1.43, + "learning_rate": 8.500184147196674e-05, + "loss": 0.0077, + "step": 284100 + }, + { + "epoch": 1.43, + "learning_rate": 8.499427377895272e-05, + "loss": 0.0056, + "step": 284110 + }, + { + "epoch": 1.43, + "learning_rate": 8.498670608593872e-05, + "loss": 0.0081, + "step": 284120 + }, + { + "epoch": 1.43, + "learning_rate": 8.497913839292471e-05, + "loss": 0.0057, + "step": 284130 + }, + { + "epoch": 1.43, + "learning_rate": 8.497157069991069e-05, + "loss": 0.0098, + "step": 284140 + }, + { + "epoch": 1.43, + "learning_rate": 8.496400300689669e-05, + "loss": 0.008, + "step": 284150 + }, + { + "epoch": 1.43, + "learning_rate": 8.495643531388267e-05, + "loss": 0.01, + "step": 284160 + }, + { + "epoch": 1.43, + "learning_rate": 8.494886762086866e-05, + "loss": 0.0076, + "step": 284170 + }, + { + "epoch": 1.43, + "learning_rate": 8.494129992785466e-05, + "loss": 0.01, + "step": 284180 + }, + { + "epoch": 1.43, + "learning_rate": 8.493373223484064e-05, + "loss": 0.0084, + "step": 284190 + }, + { + "epoch": 1.43, + "learning_rate": 8.492616454182664e-05, + "loss": 0.0087, + "step": 284200 + }, + { + "epoch": 1.43, + "learning_rate": 8.491859684881263e-05, + "loss": 0.006, + "step": 284210 + }, + { + "epoch": 1.43, + "learning_rate": 8.491102915579861e-05, + "loss": 0.0073, + "step": 284220 + }, + { + "epoch": 1.43, + "learning_rate": 8.490346146278461e-05, + "loss": 0.0068, + "step": 284230 + }, + { + "epoch": 1.43, + "learning_rate": 8.48958937697706e-05, + "loss": 0.0079, + "step": 284240 + }, + { + "epoch": 1.43, + "learning_rate": 8.488832607675658e-05, + "loss": 0.0072, + "step": 284250 + }, + { + "epoch": 1.43, + "learning_rate": 8.488075838374258e-05, + "loss": 0.0069, + "step": 284260 + }, + { + "epoch": 1.43, + "learning_rate": 8.487319069072856e-05, + "loss": 0.0062, + "step": 284270 + }, + { + "epoch": 1.43, + "learning_rate": 8.486562299771456e-05, + "loss": 0.0072, + "step": 284280 + }, + { + "epoch": 1.43, + "learning_rate": 8.485805530470055e-05, + "loss": 0.0076, + "step": 284290 + }, + { + "epoch": 1.43, + "learning_rate": 8.485048761168653e-05, + "loss": 0.0089, + "step": 284300 + }, + { + "epoch": 1.43, + "learning_rate": 8.484291991867253e-05, + "loss": 0.0068, + "step": 284310 + }, + { + "epoch": 1.43, + "learning_rate": 8.483535222565852e-05, + "loss": 0.0049, + "step": 284320 + }, + { + "epoch": 1.43, + "learning_rate": 8.48277845326445e-05, + "loss": 0.0096, + "step": 284330 + }, + { + "epoch": 1.43, + "learning_rate": 8.48202168396305e-05, + "loss": 0.0077, + "step": 284340 + }, + { + "epoch": 1.43, + "learning_rate": 8.481264914661648e-05, + "loss": 0.0072, + "step": 284350 + }, + { + "epoch": 1.43, + "learning_rate": 8.480508145360247e-05, + "loss": 0.0078, + "step": 284360 + }, + { + "epoch": 1.43, + "learning_rate": 8.479751376058847e-05, + "loss": 0.0076, + "step": 284370 + }, + { + "epoch": 1.43, + "learning_rate": 8.478994606757444e-05, + "loss": 0.0071, + "step": 284380 + }, + { + "epoch": 1.43, + "learning_rate": 8.478237837456043e-05, + "loss": 0.0093, + "step": 284390 + }, + { + "epoch": 1.43, + "learning_rate": 8.477481068154641e-05, + "loss": 0.0096, + "step": 284400 + }, + { + "epoch": 1.43, + "learning_rate": 8.476724298853241e-05, + "loss": 0.01, + "step": 284410 + }, + { + "epoch": 1.43, + "learning_rate": 8.47596752955184e-05, + "loss": 0.0071, + "step": 284420 + }, + { + "epoch": 1.43, + "learning_rate": 8.475210760250439e-05, + "loss": 0.0073, + "step": 284430 + }, + { + "epoch": 1.44, + "learning_rate": 8.474453990949038e-05, + "loss": 0.0099, + "step": 284440 + }, + { + "epoch": 1.44, + "learning_rate": 8.473697221647636e-05, + "loss": 0.0073, + "step": 284450 + }, + { + "epoch": 1.44, + "learning_rate": 8.472940452346236e-05, + "loss": 0.0069, + "step": 284460 + }, + { + "epoch": 1.44, + "learning_rate": 8.472183683044835e-05, + "loss": 0.008, + "step": 284470 + }, + { + "epoch": 1.44, + "learning_rate": 8.471426913743433e-05, + "loss": 0.0087, + "step": 284480 + }, + { + "epoch": 1.44, + "learning_rate": 8.470670144442033e-05, + "loss": 0.007, + "step": 284490 + }, + { + "epoch": 1.44, + "learning_rate": 8.469913375140632e-05, + "loss": 0.0105, + "step": 284500 + }, + { + "epoch": 1.44, + "learning_rate": 8.46915660583923e-05, + "loss": 0.0077, + "step": 284510 + }, + { + "epoch": 1.44, + "learning_rate": 8.46839983653783e-05, + "loss": 0.0064, + "step": 284520 + }, + { + "epoch": 1.44, + "learning_rate": 8.467643067236428e-05, + "loss": 0.0085, + "step": 284530 + }, + { + "epoch": 1.44, + "learning_rate": 8.466886297935028e-05, + "loss": 0.0079, + "step": 284540 + }, + { + "epoch": 1.44, + "learning_rate": 8.466129528633627e-05, + "loss": 0.0076, + "step": 284550 + }, + { + "epoch": 1.44, + "learning_rate": 8.465372759332225e-05, + "loss": 0.0068, + "step": 284560 + }, + { + "epoch": 1.44, + "learning_rate": 8.464615990030825e-05, + "loss": 0.007, + "step": 284570 + }, + { + "epoch": 1.44, + "learning_rate": 8.463859220729424e-05, + "loss": 0.0094, + "step": 284580 + }, + { + "epoch": 1.44, + "learning_rate": 8.463102451428022e-05, + "loss": 0.0068, + "step": 284590 + }, + { + "epoch": 1.44, + "learning_rate": 8.462345682126622e-05, + "loss": 0.0078, + "step": 284600 + }, + { + "epoch": 1.44, + "learning_rate": 8.46158891282522e-05, + "loss": 0.0079, + "step": 284610 + }, + { + "epoch": 1.44, + "learning_rate": 8.46083214352382e-05, + "loss": 0.0067, + "step": 284620 + }, + { + "epoch": 1.44, + "learning_rate": 8.460075374222419e-05, + "loss": 0.0085, + "step": 284630 + }, + { + "epoch": 1.44, + "learning_rate": 8.459318604921017e-05, + "loss": 0.0082, + "step": 284640 + }, + { + "epoch": 1.44, + "learning_rate": 8.458561835619617e-05, + "loss": 0.007, + "step": 284650 + }, + { + "epoch": 1.44, + "learning_rate": 8.457805066318216e-05, + "loss": 0.0091, + "step": 284660 + }, + { + "epoch": 1.44, + "learning_rate": 8.457048297016814e-05, + "loss": 0.0082, + "step": 284670 + }, + { + "epoch": 1.44, + "learning_rate": 8.456291527715414e-05, + "loss": 0.0076, + "step": 284680 + }, + { + "epoch": 1.44, + "learning_rate": 8.455534758414013e-05, + "loss": 0.0086, + "step": 284690 + }, + { + "epoch": 1.44, + "learning_rate": 8.454777989112611e-05, + "loss": 0.0091, + "step": 284700 + }, + { + "epoch": 1.44, + "learning_rate": 8.454021219811211e-05, + "loss": 0.0089, + "step": 284710 + }, + { + "epoch": 1.44, + "learning_rate": 8.453264450509809e-05, + "loss": 0.007, + "step": 284720 + }, + { + "epoch": 1.44, + "learning_rate": 8.452507681208409e-05, + "loss": 0.0068, + "step": 284730 + }, + { + "epoch": 1.44, + "learning_rate": 8.451750911907008e-05, + "loss": 0.0073, + "step": 284740 + }, + { + "epoch": 1.44, + "learning_rate": 8.450994142605606e-05, + "loss": 0.0058, + "step": 284750 + }, + { + "epoch": 1.44, + "learning_rate": 8.450237373304206e-05, + "loss": 0.0079, + "step": 284760 + }, + { + "epoch": 1.44, + "learning_rate": 8.449480604002805e-05, + "loss": 0.0071, + "step": 284770 + }, + { + "epoch": 1.44, + "learning_rate": 8.448723834701403e-05, + "loss": 0.0085, + "step": 284780 + }, + { + "epoch": 1.44, + "learning_rate": 8.447967065400003e-05, + "loss": 0.0089, + "step": 284790 + }, + { + "epoch": 1.44, + "learning_rate": 8.447210296098601e-05, + "loss": 0.0075, + "step": 284800 + }, + { + "epoch": 1.44, + "learning_rate": 8.4464535267972e-05, + "loss": 0.0082, + "step": 284810 + }, + { + "epoch": 1.44, + "learning_rate": 8.4456967574958e-05, + "loss": 0.0078, + "step": 284820 + }, + { + "epoch": 1.44, + "learning_rate": 8.444939988194398e-05, + "loss": 0.0079, + "step": 284830 + }, + { + "epoch": 1.44, + "learning_rate": 8.444183218892998e-05, + "loss": 0.0099, + "step": 284840 + }, + { + "epoch": 1.44, + "learning_rate": 8.443426449591597e-05, + "loss": 0.0078, + "step": 284850 + }, + { + "epoch": 1.44, + "learning_rate": 8.442669680290195e-05, + "loss": 0.0056, + "step": 284860 + }, + { + "epoch": 1.44, + "learning_rate": 8.441912910988795e-05, + "loss": 0.0116, + "step": 284870 + }, + { + "epoch": 1.44, + "learning_rate": 8.441156141687393e-05, + "loss": 0.0071, + "step": 284880 + }, + { + "epoch": 1.44, + "learning_rate": 8.440399372385992e-05, + "loss": 0.0066, + "step": 284890 + }, + { + "epoch": 1.44, + "learning_rate": 8.439642603084592e-05, + "loss": 0.0103, + "step": 284900 + }, + { + "epoch": 1.44, + "learning_rate": 8.43888583378319e-05, + "loss": 0.0084, + "step": 284910 + }, + { + "epoch": 1.44, + "learning_rate": 8.43812906448179e-05, + "loss": 0.0082, + "step": 284920 + }, + { + "epoch": 1.44, + "learning_rate": 8.437372295180389e-05, + "loss": 0.0093, + "step": 284930 + }, + { + "epoch": 1.44, + "learning_rate": 8.436615525878987e-05, + "loss": 0.0093, + "step": 284940 + }, + { + "epoch": 1.44, + "learning_rate": 8.435858756577587e-05, + "loss": 0.0086, + "step": 284950 + }, + { + "epoch": 1.44, + "learning_rate": 8.435101987276185e-05, + "loss": 0.0077, + "step": 284960 + }, + { + "epoch": 1.44, + "learning_rate": 8.434345217974784e-05, + "loss": 0.0071, + "step": 284970 + }, + { + "epoch": 1.44, + "learning_rate": 8.433588448673384e-05, + "loss": 0.0079, + "step": 284980 + }, + { + "epoch": 1.44, + "learning_rate": 8.432831679371982e-05, + "loss": 0.0074, + "step": 284990 + }, + { + "epoch": 1.44, + "learning_rate": 8.43207491007058e-05, + "loss": 0.0069, + "step": 285000 + }, + { + "epoch": 1.44, + "eval_cer": 0.9144430848116509, + "eval_loss": 0.00582539290189743, + "eval_runtime": 115.8203, + "eval_samples_per_second": 17.268, + "eval_steps_per_second": 4.317, + "step": 285000 + }, + { + "epoch": 1.44, + "learning_rate": 8.431318140769178e-05, + "loss": 0.0072, + "step": 285010 + }, + { + "epoch": 1.44, + "learning_rate": 8.430561371467778e-05, + "loss": 0.0062, + "step": 285020 + }, + { + "epoch": 1.44, + "learning_rate": 8.429804602166377e-05, + "loss": 0.0053, + "step": 285030 + }, + { + "epoch": 1.44, + "learning_rate": 8.429047832864975e-05, + "loss": 0.0096, + "step": 285040 + }, + { + "epoch": 1.44, + "learning_rate": 8.428291063563575e-05, + "loss": 0.0096, + "step": 285050 + }, + { + "epoch": 1.44, + "learning_rate": 8.427534294262173e-05, + "loss": 0.0098, + "step": 285060 + }, + { + "epoch": 1.44, + "learning_rate": 8.426777524960773e-05, + "loss": 0.0075, + "step": 285070 + }, + { + "epoch": 1.44, + "learning_rate": 8.426020755659372e-05, + "loss": 0.0077, + "step": 285080 + }, + { + "epoch": 1.44, + "learning_rate": 8.42526398635797e-05, + "loss": 0.0084, + "step": 285090 + }, + { + "epoch": 1.44, + "learning_rate": 8.42450721705657e-05, + "loss": 0.0072, + "step": 285100 + }, + { + "epoch": 1.44, + "learning_rate": 8.423750447755169e-05, + "loss": 0.0072, + "step": 285110 + }, + { + "epoch": 1.44, + "learning_rate": 8.422993678453767e-05, + "loss": 0.0112, + "step": 285120 + }, + { + "epoch": 1.44, + "learning_rate": 8.422236909152367e-05, + "loss": 0.0082, + "step": 285130 + }, + { + "epoch": 1.44, + "learning_rate": 8.421480139850966e-05, + "loss": 0.0075, + "step": 285140 + }, + { + "epoch": 1.44, + "learning_rate": 8.420723370549565e-05, + "loss": 0.0069, + "step": 285150 + }, + { + "epoch": 1.44, + "learning_rate": 8.419966601248164e-05, + "loss": 0.0072, + "step": 285160 + }, + { + "epoch": 1.44, + "learning_rate": 8.419209831946762e-05, + "loss": 0.006, + "step": 285170 + }, + { + "epoch": 1.44, + "learning_rate": 8.418453062645362e-05, + "loss": 0.0121, + "step": 285180 + }, + { + "epoch": 1.44, + "learning_rate": 8.417696293343961e-05, + "loss": 0.0046, + "step": 285190 + }, + { + "epoch": 1.44, + "learning_rate": 8.416939524042559e-05, + "loss": 0.0088, + "step": 285200 + }, + { + "epoch": 1.44, + "learning_rate": 8.416182754741159e-05, + "loss": 0.0075, + "step": 285210 + }, + { + "epoch": 1.44, + "learning_rate": 8.415425985439758e-05, + "loss": 0.0096, + "step": 285220 + }, + { + "epoch": 1.44, + "learning_rate": 8.414669216138356e-05, + "loss": 0.0079, + "step": 285230 + }, + { + "epoch": 1.44, + "learning_rate": 8.413912446836956e-05, + "loss": 0.0079, + "step": 285240 + }, + { + "epoch": 1.44, + "learning_rate": 8.413155677535554e-05, + "loss": 0.0082, + "step": 285250 + }, + { + "epoch": 1.44, + "learning_rate": 8.412398908234154e-05, + "loss": 0.0096, + "step": 285260 + }, + { + "epoch": 1.44, + "learning_rate": 8.411642138932753e-05, + "loss": 0.0075, + "step": 285270 + }, + { + "epoch": 1.44, + "learning_rate": 8.410885369631351e-05, + "loss": 0.0075, + "step": 285280 + }, + { + "epoch": 1.44, + "learning_rate": 8.410128600329951e-05, + "loss": 0.0081, + "step": 285290 + }, + { + "epoch": 1.44, + "learning_rate": 8.40937183102855e-05, + "loss": 0.0085, + "step": 285300 + }, + { + "epoch": 1.44, + "learning_rate": 8.408615061727148e-05, + "loss": 0.0069, + "step": 285310 + }, + { + "epoch": 1.44, + "learning_rate": 8.407858292425748e-05, + "loss": 0.0073, + "step": 285320 + }, + { + "epoch": 1.44, + "learning_rate": 8.407101523124346e-05, + "loss": 0.009, + "step": 285330 + }, + { + "epoch": 1.44, + "learning_rate": 8.406344753822946e-05, + "loss": 0.0086, + "step": 285340 + }, + { + "epoch": 1.44, + "learning_rate": 8.405587984521545e-05, + "loss": 0.0069, + "step": 285350 + }, + { + "epoch": 1.44, + "learning_rate": 8.404831215220143e-05, + "loss": 0.0053, + "step": 285360 + }, + { + "epoch": 1.44, + "learning_rate": 8.404074445918743e-05, + "loss": 0.0094, + "step": 285370 + }, + { + "epoch": 1.44, + "learning_rate": 8.403317676617342e-05, + "loss": 0.0088, + "step": 285380 + }, + { + "epoch": 1.44, + "learning_rate": 8.40256090731594e-05, + "loss": 0.0063, + "step": 285390 + }, + { + "epoch": 1.44, + "learning_rate": 8.40180413801454e-05, + "loss": 0.008, + "step": 285400 + }, + { + "epoch": 1.44, + "learning_rate": 8.401047368713138e-05, + "loss": 0.0075, + "step": 285410 + }, + { + "epoch": 1.44, + "learning_rate": 8.400290599411737e-05, + "loss": 0.0062, + "step": 285420 + }, + { + "epoch": 1.44, + "learning_rate": 8.399533830110337e-05, + "loss": 0.0058, + "step": 285430 + }, + { + "epoch": 1.44, + "learning_rate": 8.398777060808935e-05, + "loss": 0.0072, + "step": 285440 + }, + { + "epoch": 1.44, + "learning_rate": 8.398020291507535e-05, + "loss": 0.0067, + "step": 285450 + }, + { + "epoch": 1.44, + "learning_rate": 8.397263522206134e-05, + "loss": 0.0121, + "step": 285460 + }, + { + "epoch": 1.44, + "learning_rate": 8.396506752904732e-05, + "loss": 0.0099, + "step": 285470 + }, + { + "epoch": 1.44, + "learning_rate": 8.395749983603332e-05, + "loss": 0.0088, + "step": 285480 + }, + { + "epoch": 1.44, + "learning_rate": 8.39499321430193e-05, + "loss": 0.005, + "step": 285490 + }, + { + "epoch": 1.44, + "learning_rate": 8.39423644500053e-05, + "loss": 0.0078, + "step": 285500 + }, + { + "epoch": 1.44, + "learning_rate": 8.393479675699129e-05, + "loss": 0.0066, + "step": 285510 + }, + { + "epoch": 1.44, + "learning_rate": 8.392722906397727e-05, + "loss": 0.0066, + "step": 285520 + }, + { + "epoch": 1.44, + "learning_rate": 8.391966137096327e-05, + "loss": 0.0087, + "step": 285530 + }, + { + "epoch": 1.44, + "learning_rate": 8.391209367794926e-05, + "loss": 0.0092, + "step": 285540 + }, + { + "epoch": 1.44, + "learning_rate": 8.390452598493524e-05, + "loss": 0.0069, + "step": 285550 + }, + { + "epoch": 1.44, + "learning_rate": 8.389695829192124e-05, + "loss": 0.0083, + "step": 285560 + }, + { + "epoch": 1.44, + "learning_rate": 8.388939059890722e-05, + "loss": 0.0083, + "step": 285570 + }, + { + "epoch": 1.44, + "learning_rate": 8.388182290589321e-05, + "loss": 0.0066, + "step": 285580 + }, + { + "epoch": 1.44, + "learning_rate": 8.387425521287921e-05, + "loss": 0.0094, + "step": 285590 + }, + { + "epoch": 1.44, + "learning_rate": 8.386668751986519e-05, + "loss": 0.0083, + "step": 285600 + }, + { + "epoch": 1.44, + "learning_rate": 8.385911982685118e-05, + "loss": 0.0064, + "step": 285610 + }, + { + "epoch": 1.44, + "learning_rate": 8.385155213383718e-05, + "loss": 0.0074, + "step": 285620 + }, + { + "epoch": 1.44, + "learning_rate": 8.384398444082315e-05, + "loss": 0.0057, + "step": 285630 + }, + { + "epoch": 1.44, + "learning_rate": 8.383641674780914e-05, + "loss": 0.0077, + "step": 285640 + }, + { + "epoch": 1.44, + "learning_rate": 8.382884905479512e-05, + "loss": 0.0083, + "step": 285650 + }, + { + "epoch": 1.44, + "learning_rate": 8.382128136178112e-05, + "loss": 0.0095, + "step": 285660 + }, + { + "epoch": 1.44, + "learning_rate": 8.381371366876711e-05, + "loss": 0.0059, + "step": 285670 + }, + { + "epoch": 1.44, + "learning_rate": 8.38061459757531e-05, + "loss": 0.0081, + "step": 285680 + }, + { + "epoch": 1.44, + "learning_rate": 8.379857828273909e-05, + "loss": 0.0065, + "step": 285690 + }, + { + "epoch": 1.44, + "learning_rate": 8.379101058972507e-05, + "loss": 0.0093, + "step": 285700 + }, + { + "epoch": 1.44, + "learning_rate": 8.378344289671107e-05, + "loss": 0.0081, + "step": 285710 + }, + { + "epoch": 1.44, + "learning_rate": 8.377587520369706e-05, + "loss": 0.0121, + "step": 285720 + }, + { + "epoch": 1.44, + "learning_rate": 8.376830751068304e-05, + "loss": 0.0085, + "step": 285730 + }, + { + "epoch": 1.44, + "learning_rate": 8.376073981766904e-05, + "loss": 0.0073, + "step": 285740 + }, + { + "epoch": 1.44, + "learning_rate": 8.375317212465503e-05, + "loss": 0.0074, + "step": 285750 + }, + { + "epoch": 1.44, + "learning_rate": 8.374560443164101e-05, + "loss": 0.0077, + "step": 285760 + }, + { + "epoch": 1.44, + "learning_rate": 8.373803673862701e-05, + "loss": 0.0059, + "step": 285770 + }, + { + "epoch": 1.44, + "learning_rate": 8.373046904561299e-05, + "loss": 0.0068, + "step": 285780 + }, + { + "epoch": 1.44, + "learning_rate": 8.372290135259899e-05, + "loss": 0.0084, + "step": 285790 + }, + { + "epoch": 1.44, + "learning_rate": 8.371533365958498e-05, + "loss": 0.0058, + "step": 285800 + }, + { + "epoch": 1.44, + "learning_rate": 8.370776596657096e-05, + "loss": 0.0072, + "step": 285810 + }, + { + "epoch": 1.44, + "learning_rate": 8.370019827355696e-05, + "loss": 0.0074, + "step": 285820 + }, + { + "epoch": 1.44, + "learning_rate": 8.369263058054295e-05, + "loss": 0.0063, + "step": 285830 + }, + { + "epoch": 1.44, + "learning_rate": 8.368506288752893e-05, + "loss": 0.0089, + "step": 285840 + }, + { + "epoch": 1.44, + "learning_rate": 8.367749519451493e-05, + "loss": 0.0083, + "step": 285850 + }, + { + "epoch": 1.44, + "learning_rate": 8.366992750150091e-05, + "loss": 0.0087, + "step": 285860 + }, + { + "epoch": 1.44, + "learning_rate": 8.36623598084869e-05, + "loss": 0.0074, + "step": 285870 + }, + { + "epoch": 1.44, + "learning_rate": 8.36547921154729e-05, + "loss": 0.0094, + "step": 285880 + }, + { + "epoch": 1.44, + "learning_rate": 8.364722442245888e-05, + "loss": 0.0077, + "step": 285890 + }, + { + "epoch": 1.44, + "learning_rate": 8.363965672944488e-05, + "loss": 0.007, + "step": 285900 + }, + { + "epoch": 1.44, + "learning_rate": 8.363208903643087e-05, + "loss": 0.0097, + "step": 285910 + }, + { + "epoch": 1.44, + "learning_rate": 8.362452134341685e-05, + "loss": 0.007, + "step": 285920 + }, + { + "epoch": 1.44, + "learning_rate": 8.361695365040285e-05, + "loss": 0.0078, + "step": 285930 + }, + { + "epoch": 1.44, + "learning_rate": 8.360938595738883e-05, + "loss": 0.0073, + "step": 285940 + }, + { + "epoch": 1.44, + "learning_rate": 8.360181826437482e-05, + "loss": 0.0112, + "step": 285950 + }, + { + "epoch": 1.44, + "learning_rate": 8.359425057136082e-05, + "loss": 0.0101, + "step": 285960 + }, + { + "epoch": 1.44, + "learning_rate": 8.35866828783468e-05, + "loss": 0.0092, + "step": 285970 + }, + { + "epoch": 1.44, + "learning_rate": 8.35791151853328e-05, + "loss": 0.0067, + "step": 285980 + }, + { + "epoch": 1.44, + "learning_rate": 8.357154749231879e-05, + "loss": 0.011, + "step": 285990 + }, + { + "epoch": 1.44, + "learning_rate": 8.356397979930477e-05, + "loss": 0.0077, + "step": 286000 + }, + { + "epoch": 1.44, + "eval_cer": 0.914438232831024, + "eval_loss": 0.005684024654328823, + "eval_runtime": 115.553, + "eval_samples_per_second": 17.308, + "eval_steps_per_second": 4.327, + "step": 286000 + }, + { + "epoch": 1.44, + "learning_rate": 8.355641210629077e-05, + "loss": 0.0067, + "step": 286010 + }, + { + "epoch": 1.44, + "learning_rate": 8.354884441327675e-05, + "loss": 0.0081, + "step": 286020 + }, + { + "epoch": 1.44, + "learning_rate": 8.354127672026274e-05, + "loss": 0.0082, + "step": 286030 + }, + { + "epoch": 1.44, + "learning_rate": 8.353370902724874e-05, + "loss": 0.0087, + "step": 286040 + }, + { + "epoch": 1.44, + "learning_rate": 8.352614133423472e-05, + "loss": 0.0059, + "step": 286050 + }, + { + "epoch": 1.44, + "learning_rate": 8.351857364122072e-05, + "loss": 0.0076, + "step": 286060 + }, + { + "epoch": 1.44, + "learning_rate": 8.351100594820671e-05, + "loss": 0.0074, + "step": 286070 + }, + { + "epoch": 1.44, + "learning_rate": 8.350343825519269e-05, + "loss": 0.0069, + "step": 286080 + }, + { + "epoch": 1.44, + "learning_rate": 8.349587056217869e-05, + "loss": 0.0068, + "step": 286090 + }, + { + "epoch": 1.44, + "learning_rate": 8.348830286916467e-05, + "loss": 0.0076, + "step": 286100 + }, + { + "epoch": 1.44, + "learning_rate": 8.348073517615066e-05, + "loss": 0.0074, + "step": 286110 + }, + { + "epoch": 1.44, + "learning_rate": 8.347316748313666e-05, + "loss": 0.0092, + "step": 286120 + }, + { + "epoch": 1.44, + "learning_rate": 8.346559979012264e-05, + "loss": 0.0099, + "step": 286130 + }, + { + "epoch": 1.44, + "learning_rate": 8.345803209710863e-05, + "loss": 0.0066, + "step": 286140 + }, + { + "epoch": 1.44, + "learning_rate": 8.345046440409463e-05, + "loss": 0.0075, + "step": 286150 + }, + { + "epoch": 1.44, + "learning_rate": 8.344289671108061e-05, + "loss": 0.0094, + "step": 286160 + }, + { + "epoch": 1.44, + "learning_rate": 8.34353290180666e-05, + "loss": 0.0064, + "step": 286170 + }, + { + "epoch": 1.44, + "learning_rate": 8.34277613250526e-05, + "loss": 0.0122, + "step": 286180 + }, + { + "epoch": 1.44, + "learning_rate": 8.342019363203858e-05, + "loss": 0.0086, + "step": 286190 + }, + { + "epoch": 1.44, + "learning_rate": 8.341262593902458e-05, + "loss": 0.0059, + "step": 286200 + }, + { + "epoch": 1.44, + "learning_rate": 8.340505824601056e-05, + "loss": 0.0048, + "step": 286210 + }, + { + "epoch": 1.44, + "learning_rate": 8.339749055299655e-05, + "loss": 0.0088, + "step": 286220 + }, + { + "epoch": 1.44, + "learning_rate": 8.338992285998255e-05, + "loss": 0.0069, + "step": 286230 + }, + { + "epoch": 1.44, + "learning_rate": 8.338235516696853e-05, + "loss": 0.0074, + "step": 286240 + }, + { + "epoch": 1.44, + "learning_rate": 8.337478747395453e-05, + "loss": 0.0069, + "step": 286250 + }, + { + "epoch": 1.44, + "learning_rate": 8.33672197809405e-05, + "loss": 0.0075, + "step": 286260 + }, + { + "epoch": 1.44, + "learning_rate": 8.335965208792649e-05, + "loss": 0.007, + "step": 286270 + }, + { + "epoch": 1.44, + "learning_rate": 8.335208439491248e-05, + "loss": 0.0057, + "step": 286280 + }, + { + "epoch": 1.44, + "learning_rate": 8.334451670189846e-05, + "loss": 0.0098, + "step": 286290 + }, + { + "epoch": 1.44, + "learning_rate": 8.333694900888446e-05, + "loss": 0.008, + "step": 286300 + }, + { + "epoch": 1.44, + "learning_rate": 8.332938131587044e-05, + "loss": 0.0071, + "step": 286310 + }, + { + "epoch": 1.44, + "learning_rate": 8.332181362285644e-05, + "loss": 0.0106, + "step": 286320 + }, + { + "epoch": 1.44, + "learning_rate": 8.331424592984243e-05, + "loss": 0.0068, + "step": 286330 + }, + { + "epoch": 1.44, + "learning_rate": 8.330667823682841e-05, + "loss": 0.005, + "step": 286340 + }, + { + "epoch": 1.44, + "learning_rate": 8.329911054381441e-05, + "loss": 0.0091, + "step": 286350 + }, + { + "epoch": 1.44, + "learning_rate": 8.32915428508004e-05, + "loss": 0.0077, + "step": 286360 + }, + { + "epoch": 1.44, + "learning_rate": 8.328397515778638e-05, + "loss": 0.0069, + "step": 286370 + }, + { + "epoch": 1.44, + "learning_rate": 8.327640746477238e-05, + "loss": 0.0062, + "step": 286380 + }, + { + "epoch": 1.44, + "learning_rate": 8.326883977175836e-05, + "loss": 0.0083, + "step": 286390 + }, + { + "epoch": 1.44, + "learning_rate": 8.326127207874436e-05, + "loss": 0.0083, + "step": 286400 + }, + { + "epoch": 1.44, + "learning_rate": 8.325370438573035e-05, + "loss": 0.0081, + "step": 286410 + }, + { + "epoch": 1.45, + "learning_rate": 8.324613669271633e-05, + "loss": 0.0066, + "step": 286420 + }, + { + "epoch": 1.45, + "learning_rate": 8.323856899970233e-05, + "loss": 0.0073, + "step": 286430 + }, + { + "epoch": 1.45, + "learning_rate": 8.323100130668832e-05, + "loss": 0.0081, + "step": 286440 + }, + { + "epoch": 1.45, + "learning_rate": 8.32234336136743e-05, + "loss": 0.0085, + "step": 286450 + }, + { + "epoch": 1.45, + "learning_rate": 8.32158659206603e-05, + "loss": 0.0059, + "step": 286460 + }, + { + "epoch": 1.45, + "learning_rate": 8.320829822764628e-05, + "loss": 0.0065, + "step": 286470 + }, + { + "epoch": 1.45, + "learning_rate": 8.320073053463227e-05, + "loss": 0.0085, + "step": 286480 + }, + { + "epoch": 1.45, + "learning_rate": 8.319316284161827e-05, + "loss": 0.0083, + "step": 286490 + }, + { + "epoch": 1.45, + "learning_rate": 8.318559514860425e-05, + "loss": 0.0062, + "step": 286500 + }, + { + "epoch": 1.45, + "learning_rate": 8.317802745559025e-05, + "loss": 0.0094, + "step": 286510 + }, + { + "epoch": 1.45, + "learning_rate": 8.317045976257624e-05, + "loss": 0.0103, + "step": 286520 + }, + { + "epoch": 1.45, + "learning_rate": 8.316289206956222e-05, + "loss": 0.0066, + "step": 286530 + }, + { + "epoch": 1.45, + "learning_rate": 8.315532437654822e-05, + "loss": 0.0091, + "step": 286540 + }, + { + "epoch": 1.45, + "learning_rate": 8.31477566835342e-05, + "loss": 0.0075, + "step": 286550 + }, + { + "epoch": 1.45, + "learning_rate": 8.31401889905202e-05, + "loss": 0.0103, + "step": 286560 + }, + { + "epoch": 1.45, + "learning_rate": 8.313262129750619e-05, + "loss": 0.009, + "step": 286570 + }, + { + "epoch": 1.45, + "learning_rate": 8.312505360449217e-05, + "loss": 0.0069, + "step": 286580 + }, + { + "epoch": 1.45, + "learning_rate": 8.311748591147817e-05, + "loss": 0.0085, + "step": 286590 + }, + { + "epoch": 1.45, + "learning_rate": 8.310991821846416e-05, + "loss": 0.007, + "step": 286600 + }, + { + "epoch": 1.45, + "learning_rate": 8.310235052545014e-05, + "loss": 0.0095, + "step": 286610 + }, + { + "epoch": 1.45, + "learning_rate": 8.309478283243614e-05, + "loss": 0.0085, + "step": 286620 + }, + { + "epoch": 1.45, + "learning_rate": 8.308721513942213e-05, + "loss": 0.0069, + "step": 286630 + }, + { + "epoch": 1.45, + "learning_rate": 8.307964744640811e-05, + "loss": 0.0085, + "step": 286640 + }, + { + "epoch": 1.45, + "learning_rate": 8.307207975339411e-05, + "loss": 0.006, + "step": 286650 + }, + { + "epoch": 1.45, + "learning_rate": 8.306451206038009e-05, + "loss": 0.0092, + "step": 286660 + }, + { + "epoch": 1.45, + "learning_rate": 8.305694436736608e-05, + "loss": 0.0094, + "step": 286670 + }, + { + "epoch": 1.45, + "learning_rate": 8.304937667435208e-05, + "loss": 0.0084, + "step": 286680 + }, + { + "epoch": 1.45, + "learning_rate": 8.304180898133806e-05, + "loss": 0.0062, + "step": 286690 + }, + { + "epoch": 1.45, + "learning_rate": 8.303424128832406e-05, + "loss": 0.0086, + "step": 286700 + }, + { + "epoch": 1.45, + "learning_rate": 8.302667359531005e-05, + "loss": 0.0084, + "step": 286710 + }, + { + "epoch": 1.45, + "learning_rate": 8.301910590229603e-05, + "loss": 0.0065, + "step": 286720 + }, + { + "epoch": 1.45, + "learning_rate": 8.301153820928203e-05, + "loss": 0.0085, + "step": 286730 + }, + { + "epoch": 1.45, + "learning_rate": 8.300397051626801e-05, + "loss": 0.0074, + "step": 286740 + }, + { + "epoch": 1.45, + "learning_rate": 8.2996402823254e-05, + "loss": 0.0068, + "step": 286750 + }, + { + "epoch": 1.45, + "learning_rate": 8.298883513024e-05, + "loss": 0.0093, + "step": 286760 + }, + { + "epoch": 1.45, + "learning_rate": 8.298126743722598e-05, + "loss": 0.0072, + "step": 286770 + }, + { + "epoch": 1.45, + "learning_rate": 8.297369974421198e-05, + "loss": 0.0082, + "step": 286780 + }, + { + "epoch": 1.45, + "learning_rate": 8.296613205119797e-05, + "loss": 0.0086, + "step": 286790 + }, + { + "epoch": 1.45, + "learning_rate": 8.295856435818395e-05, + "loss": 0.0083, + "step": 286800 + }, + { + "epoch": 1.45, + "learning_rate": 8.295099666516995e-05, + "loss": 0.0081, + "step": 286810 + }, + { + "epoch": 1.45, + "learning_rate": 8.294342897215593e-05, + "loss": 0.0102, + "step": 286820 + }, + { + "epoch": 1.45, + "learning_rate": 8.293586127914192e-05, + "loss": 0.009, + "step": 286830 + }, + { + "epoch": 1.45, + "learning_rate": 8.292829358612792e-05, + "loss": 0.0077, + "step": 286840 + }, + { + "epoch": 1.45, + "learning_rate": 8.29207258931139e-05, + "loss": 0.0085, + "step": 286850 + }, + { + "epoch": 1.45, + "learning_rate": 8.29131582000999e-05, + "loss": 0.0074, + "step": 286860 + }, + { + "epoch": 1.45, + "learning_rate": 8.290559050708589e-05, + "loss": 0.008, + "step": 286870 + }, + { + "epoch": 1.45, + "learning_rate": 8.289802281407187e-05, + "loss": 0.0063, + "step": 286880 + }, + { + "epoch": 1.45, + "learning_rate": 8.289045512105785e-05, + "loss": 0.0078, + "step": 286890 + }, + { + "epoch": 1.45, + "learning_rate": 8.288288742804383e-05, + "loss": 0.0095, + "step": 286900 + }, + { + "epoch": 1.45, + "learning_rate": 8.287531973502983e-05, + "loss": 0.0081, + "step": 286910 + }, + { + "epoch": 1.45, + "learning_rate": 8.286775204201581e-05, + "loss": 0.0069, + "step": 286920 + }, + { + "epoch": 1.45, + "learning_rate": 8.28601843490018e-05, + "loss": 0.0092, + "step": 286930 + }, + { + "epoch": 1.45, + "learning_rate": 8.28526166559878e-05, + "loss": 0.0095, + "step": 286940 + }, + { + "epoch": 1.45, + "learning_rate": 8.284504896297378e-05, + "loss": 0.0075, + "step": 286950 + }, + { + "epoch": 1.45, + "learning_rate": 8.283748126995978e-05, + "loss": 0.0052, + "step": 286960 + }, + { + "epoch": 1.45, + "learning_rate": 8.282991357694577e-05, + "loss": 0.0072, + "step": 286970 + }, + { + "epoch": 1.45, + "learning_rate": 8.282234588393175e-05, + "loss": 0.0081, + "step": 286980 + }, + { + "epoch": 1.45, + "learning_rate": 8.281477819091775e-05, + "loss": 0.0067, + "step": 286990 + }, + { + "epoch": 1.45, + "learning_rate": 8.280721049790373e-05, + "loss": 0.0068, + "step": 287000 + }, + { + "epoch": 1.45, + "eval_cer": 0.9144333808503969, + "eval_loss": 0.0057329838164150715, + "eval_runtime": 115.5304, + "eval_samples_per_second": 17.311, + "eval_steps_per_second": 4.328, + "step": 287000 + }, + { + "epoch": 1.45, + "learning_rate": 8.279964280488972e-05, + "loss": 0.007, + "step": 287010 + }, + { + "epoch": 1.45, + "learning_rate": 8.279207511187572e-05, + "loss": 0.007, + "step": 287020 + }, + { + "epoch": 1.45, + "learning_rate": 8.27845074188617e-05, + "loss": 0.0062, + "step": 287030 + }, + { + "epoch": 1.45, + "learning_rate": 8.27769397258477e-05, + "loss": 0.0058, + "step": 287040 + }, + { + "epoch": 1.45, + "learning_rate": 8.276937203283369e-05, + "loss": 0.0082, + "step": 287050 + }, + { + "epoch": 1.45, + "learning_rate": 8.276180433981967e-05, + "loss": 0.0064, + "step": 287060 + }, + { + "epoch": 1.45, + "learning_rate": 8.275423664680567e-05, + "loss": 0.0075, + "step": 287070 + }, + { + "epoch": 1.45, + "learning_rate": 8.274666895379166e-05, + "loss": 0.0094, + "step": 287080 + }, + { + "epoch": 1.45, + "learning_rate": 8.273910126077764e-05, + "loss": 0.0068, + "step": 287090 + }, + { + "epoch": 1.45, + "learning_rate": 8.273153356776364e-05, + "loss": 0.0068, + "step": 287100 + }, + { + "epoch": 1.45, + "learning_rate": 8.272396587474962e-05, + "loss": 0.0054, + "step": 287110 + }, + { + "epoch": 1.45, + "learning_rate": 8.271639818173562e-05, + "loss": 0.0068, + "step": 287120 + }, + { + "epoch": 1.45, + "learning_rate": 8.270883048872161e-05, + "loss": 0.0065, + "step": 287130 + }, + { + "epoch": 1.45, + "learning_rate": 8.270126279570759e-05, + "loss": 0.0097, + "step": 287140 + }, + { + "epoch": 1.45, + "learning_rate": 8.269369510269359e-05, + "loss": 0.0064, + "step": 287150 + }, + { + "epoch": 1.45, + "learning_rate": 8.268612740967958e-05, + "loss": 0.0076, + "step": 287160 + }, + { + "epoch": 1.45, + "learning_rate": 8.267855971666556e-05, + "loss": 0.009, + "step": 287170 + }, + { + "epoch": 1.45, + "learning_rate": 8.267099202365156e-05, + "loss": 0.0066, + "step": 287180 + }, + { + "epoch": 1.45, + "learning_rate": 8.266342433063754e-05, + "loss": 0.0058, + "step": 287190 + }, + { + "epoch": 1.45, + "learning_rate": 8.265585663762354e-05, + "loss": 0.0064, + "step": 287200 + }, + { + "epoch": 1.45, + "learning_rate": 8.264828894460953e-05, + "loss": 0.0075, + "step": 287210 + }, + { + "epoch": 1.45, + "learning_rate": 8.264072125159551e-05, + "loss": 0.0097, + "step": 287220 + }, + { + "epoch": 1.45, + "learning_rate": 8.26331535585815e-05, + "loss": 0.0065, + "step": 287230 + }, + { + "epoch": 1.45, + "learning_rate": 8.26255858655675e-05, + "loss": 0.0105, + "step": 287240 + }, + { + "epoch": 1.45, + "learning_rate": 8.261801817255348e-05, + "loss": 0.0059, + "step": 287250 + }, + { + "epoch": 1.45, + "learning_rate": 8.261045047953948e-05, + "loss": 0.0071, + "step": 287260 + }, + { + "epoch": 1.45, + "learning_rate": 8.260288278652546e-05, + "loss": 0.0064, + "step": 287270 + }, + { + "epoch": 1.45, + "learning_rate": 8.259531509351145e-05, + "loss": 0.0086, + "step": 287280 + }, + { + "epoch": 1.45, + "learning_rate": 8.258774740049745e-05, + "loss": 0.0094, + "step": 287290 + }, + { + "epoch": 1.45, + "learning_rate": 8.258017970748343e-05, + "loss": 0.0055, + "step": 287300 + }, + { + "epoch": 1.45, + "learning_rate": 8.257261201446943e-05, + "loss": 0.0072, + "step": 287310 + }, + { + "epoch": 1.45, + "learning_rate": 8.256504432145542e-05, + "loss": 0.008, + "step": 287320 + }, + { + "epoch": 1.45, + "learning_rate": 8.25574766284414e-05, + "loss": 0.0085, + "step": 287330 + }, + { + "epoch": 1.45, + "learning_rate": 8.25499089354274e-05, + "loss": 0.009, + "step": 287340 + }, + { + "epoch": 1.45, + "learning_rate": 8.254234124241338e-05, + "loss": 0.0091, + "step": 287350 + }, + { + "epoch": 1.45, + "learning_rate": 8.253477354939937e-05, + "loss": 0.0068, + "step": 287360 + }, + { + "epoch": 1.45, + "learning_rate": 8.252720585638537e-05, + "loss": 0.0078, + "step": 287370 + }, + { + "epoch": 1.45, + "learning_rate": 8.251963816337135e-05, + "loss": 0.0068, + "step": 287380 + }, + { + "epoch": 1.45, + "learning_rate": 8.251207047035735e-05, + "loss": 0.0066, + "step": 287390 + }, + { + "epoch": 1.45, + "learning_rate": 8.250450277734334e-05, + "loss": 0.0074, + "step": 287400 + }, + { + "epoch": 1.45, + "learning_rate": 8.249693508432932e-05, + "loss": 0.0062, + "step": 287410 + }, + { + "epoch": 1.45, + "learning_rate": 8.248936739131532e-05, + "loss": 0.0079, + "step": 287420 + }, + { + "epoch": 1.45, + "learning_rate": 8.24817996983013e-05, + "loss": 0.0056, + "step": 287430 + }, + { + "epoch": 1.45, + "learning_rate": 8.247423200528729e-05, + "loss": 0.0096, + "step": 287440 + }, + { + "epoch": 1.45, + "learning_rate": 8.246666431227329e-05, + "loss": 0.0087, + "step": 287450 + }, + { + "epoch": 1.45, + "learning_rate": 8.245909661925927e-05, + "loss": 0.0084, + "step": 287460 + }, + { + "epoch": 1.45, + "learning_rate": 8.245152892624526e-05, + "loss": 0.0082, + "step": 287470 + }, + { + "epoch": 1.45, + "learning_rate": 8.244396123323126e-05, + "loss": 0.0084, + "step": 287480 + }, + { + "epoch": 1.45, + "learning_rate": 8.243639354021724e-05, + "loss": 0.0068, + "step": 287490 + }, + { + "epoch": 1.45, + "learning_rate": 8.242882584720324e-05, + "loss": 0.0081, + "step": 287500 + }, + { + "epoch": 1.45, + "learning_rate": 8.242125815418922e-05, + "loss": 0.0074, + "step": 287510 + }, + { + "epoch": 1.45, + "learning_rate": 8.24136904611752e-05, + "loss": 0.0046, + "step": 287520 + }, + { + "epoch": 1.45, + "learning_rate": 8.240612276816118e-05, + "loss": 0.0074, + "step": 287530 + }, + { + "epoch": 1.45, + "learning_rate": 8.239855507514718e-05, + "loss": 0.0061, + "step": 287540 + }, + { + "epoch": 1.45, + "learning_rate": 8.239098738213317e-05, + "loss": 0.0058, + "step": 287550 + }, + { + "epoch": 1.45, + "learning_rate": 8.238341968911915e-05, + "loss": 0.0062, + "step": 287560 + }, + { + "epoch": 1.45, + "learning_rate": 8.237585199610515e-05, + "loss": 0.0066, + "step": 287570 + }, + { + "epoch": 1.45, + "learning_rate": 8.236828430309114e-05, + "loss": 0.007, + "step": 287580 + }, + { + "epoch": 1.45, + "learning_rate": 8.236071661007712e-05, + "loss": 0.0066, + "step": 287590 + }, + { + "epoch": 1.45, + "learning_rate": 8.235314891706312e-05, + "loss": 0.0054, + "step": 287600 + }, + { + "epoch": 1.45, + "learning_rate": 8.234558122404911e-05, + "loss": 0.0071, + "step": 287610 + }, + { + "epoch": 1.45, + "learning_rate": 8.23380135310351e-05, + "loss": 0.0067, + "step": 287620 + }, + { + "epoch": 1.45, + "learning_rate": 8.233044583802109e-05, + "loss": 0.0093, + "step": 287630 + }, + { + "epoch": 1.45, + "learning_rate": 8.232287814500707e-05, + "loss": 0.0099, + "step": 287640 + }, + { + "epoch": 1.45, + "learning_rate": 8.231531045199307e-05, + "loss": 0.0072, + "step": 287650 + }, + { + "epoch": 1.45, + "learning_rate": 8.230774275897906e-05, + "loss": 0.007, + "step": 287660 + }, + { + "epoch": 1.45, + "learning_rate": 8.230017506596504e-05, + "loss": 0.0058, + "step": 287670 + }, + { + "epoch": 1.45, + "learning_rate": 8.229260737295104e-05, + "loss": 0.0081, + "step": 287680 + }, + { + "epoch": 1.45, + "learning_rate": 8.228503967993703e-05, + "loss": 0.0074, + "step": 287690 + }, + { + "epoch": 1.45, + "learning_rate": 8.227747198692301e-05, + "loss": 0.0076, + "step": 287700 + }, + { + "epoch": 1.45, + "learning_rate": 8.226990429390901e-05, + "loss": 0.008, + "step": 287710 + }, + { + "epoch": 1.45, + "learning_rate": 8.226233660089499e-05, + "loss": 0.0089, + "step": 287720 + }, + { + "epoch": 1.45, + "learning_rate": 8.225476890788099e-05, + "loss": 0.0065, + "step": 287730 + }, + { + "epoch": 1.45, + "learning_rate": 8.224720121486698e-05, + "loss": 0.0086, + "step": 287740 + }, + { + "epoch": 1.45, + "learning_rate": 8.223963352185296e-05, + "loss": 0.0077, + "step": 287750 + }, + { + "epoch": 1.45, + "learning_rate": 8.223206582883896e-05, + "loss": 0.0065, + "step": 287760 + }, + { + "epoch": 1.45, + "learning_rate": 8.222449813582495e-05, + "loss": 0.0069, + "step": 287770 + }, + { + "epoch": 1.45, + "learning_rate": 8.221693044281093e-05, + "loss": 0.0077, + "step": 287780 + }, + { + "epoch": 1.45, + "learning_rate": 8.220936274979693e-05, + "loss": 0.0054, + "step": 287790 + }, + { + "epoch": 1.45, + "learning_rate": 8.220179505678291e-05, + "loss": 0.0068, + "step": 287800 + }, + { + "epoch": 1.45, + "learning_rate": 8.21942273637689e-05, + "loss": 0.0057, + "step": 287810 + }, + { + "epoch": 1.45, + "learning_rate": 8.21866596707549e-05, + "loss": 0.007, + "step": 287820 + }, + { + "epoch": 1.45, + "learning_rate": 8.217909197774088e-05, + "loss": 0.0058, + "step": 287830 + }, + { + "epoch": 1.45, + "learning_rate": 8.217152428472688e-05, + "loss": 0.0104, + "step": 287840 + }, + { + "epoch": 1.45, + "learning_rate": 8.216395659171287e-05, + "loss": 0.005, + "step": 287850 + }, + { + "epoch": 1.45, + "learning_rate": 8.215638889869885e-05, + "loss": 0.0082, + "step": 287860 + }, + { + "epoch": 1.45, + "learning_rate": 8.214882120568485e-05, + "loss": 0.0084, + "step": 287870 + }, + { + "epoch": 1.45, + "learning_rate": 8.214125351267083e-05, + "loss": 0.0087, + "step": 287880 + }, + { + "epoch": 1.45, + "learning_rate": 8.213368581965682e-05, + "loss": 0.0069, + "step": 287890 + }, + { + "epoch": 1.45, + "learning_rate": 8.212611812664282e-05, + "loss": 0.0068, + "step": 287900 + }, + { + "epoch": 1.45, + "learning_rate": 8.21185504336288e-05, + "loss": 0.0085, + "step": 287910 + }, + { + "epoch": 1.45, + "learning_rate": 8.21109827406148e-05, + "loss": 0.0092, + "step": 287920 + }, + { + "epoch": 1.45, + "learning_rate": 8.210341504760079e-05, + "loss": 0.0063, + "step": 287930 + }, + { + "epoch": 1.45, + "learning_rate": 8.209584735458677e-05, + "loss": 0.0071, + "step": 287940 + }, + { + "epoch": 1.45, + "learning_rate": 8.208827966157277e-05, + "loss": 0.0086, + "step": 287950 + }, + { + "epoch": 1.45, + "learning_rate": 8.208071196855875e-05, + "loss": 0.0058, + "step": 287960 + }, + { + "epoch": 1.45, + "learning_rate": 8.207314427554474e-05, + "loss": 0.0076, + "step": 287970 + }, + { + "epoch": 1.45, + "learning_rate": 8.206557658253074e-05, + "loss": 0.0079, + "step": 287980 + }, + { + "epoch": 1.45, + "learning_rate": 8.205800888951672e-05, + "loss": 0.0071, + "step": 287990 + }, + { + "epoch": 1.45, + "learning_rate": 8.205044119650271e-05, + "loss": 0.0098, + "step": 288000 + }, + { + "epoch": 1.45, + "eval_cer": 0.9144294992658953, + "eval_loss": 0.005808565299957991, + "eval_runtime": 115.5954, + "eval_samples_per_second": 17.302, + "eval_steps_per_second": 4.325, + "step": 288000 + }, + { + "epoch": 1.45, + "learning_rate": 8.204287350348871e-05, + "loss": 0.0074, + "step": 288010 + }, + { + "epoch": 1.45, + "learning_rate": 8.203530581047469e-05, + "loss": 0.005, + "step": 288020 + }, + { + "epoch": 1.45, + "learning_rate": 8.202773811746069e-05, + "loss": 0.0085, + "step": 288030 + }, + { + "epoch": 1.45, + "learning_rate": 8.202017042444667e-05, + "loss": 0.0083, + "step": 288040 + }, + { + "epoch": 1.45, + "learning_rate": 8.201260273143266e-05, + "loss": 0.0062, + "step": 288050 + }, + { + "epoch": 1.45, + "learning_rate": 8.200503503841866e-05, + "loss": 0.0086, + "step": 288060 + }, + { + "epoch": 1.45, + "learning_rate": 8.199746734540464e-05, + "loss": 0.0069, + "step": 288070 + }, + { + "epoch": 1.45, + "learning_rate": 8.198989965239063e-05, + "loss": 0.0068, + "step": 288080 + }, + { + "epoch": 1.45, + "learning_rate": 8.198233195937663e-05, + "loss": 0.0066, + "step": 288090 + }, + { + "epoch": 1.45, + "learning_rate": 8.197476426636261e-05, + "loss": 0.0067, + "step": 288100 + }, + { + "epoch": 1.45, + "learning_rate": 8.19671965733486e-05, + "loss": 0.007, + "step": 288110 + }, + { + "epoch": 1.45, + "learning_rate": 8.19596288803346e-05, + "loss": 0.0069, + "step": 288120 + }, + { + "epoch": 1.45, + "learning_rate": 8.195206118732058e-05, + "loss": 0.0069, + "step": 288130 + }, + { + "epoch": 1.45, + "learning_rate": 8.194449349430658e-05, + "loss": 0.0068, + "step": 288140 + }, + { + "epoch": 1.45, + "learning_rate": 8.193692580129254e-05, + "loss": 0.0056, + "step": 288150 + }, + { + "epoch": 1.45, + "learning_rate": 8.192935810827854e-05, + "loss": 0.0062, + "step": 288160 + }, + { + "epoch": 1.45, + "learning_rate": 8.192179041526452e-05, + "loss": 0.0079, + "step": 288170 + }, + { + "epoch": 1.45, + "learning_rate": 8.191422272225052e-05, + "loss": 0.008, + "step": 288180 + }, + { + "epoch": 1.45, + "learning_rate": 8.190665502923651e-05, + "loss": 0.0058, + "step": 288190 + }, + { + "epoch": 1.45, + "learning_rate": 8.189908733622249e-05, + "loss": 0.0078, + "step": 288200 + }, + { + "epoch": 1.45, + "learning_rate": 8.189151964320849e-05, + "loss": 0.0065, + "step": 288210 + }, + { + "epoch": 1.45, + "learning_rate": 8.188395195019448e-05, + "loss": 0.0079, + "step": 288220 + }, + { + "epoch": 1.45, + "learning_rate": 8.187638425718046e-05, + "loss": 0.0089, + "step": 288230 + }, + { + "epoch": 1.45, + "learning_rate": 8.186881656416646e-05, + "loss": 0.0086, + "step": 288240 + }, + { + "epoch": 1.45, + "learning_rate": 8.186124887115244e-05, + "loss": 0.0064, + "step": 288250 + }, + { + "epoch": 1.45, + "learning_rate": 8.185368117813844e-05, + "loss": 0.0069, + "step": 288260 + }, + { + "epoch": 1.45, + "learning_rate": 8.184611348512443e-05, + "loss": 0.0079, + "step": 288270 + }, + { + "epoch": 1.45, + "learning_rate": 8.183854579211041e-05, + "loss": 0.0076, + "step": 288280 + }, + { + "epoch": 1.45, + "learning_rate": 8.18309780990964e-05, + "loss": 0.0061, + "step": 288290 + }, + { + "epoch": 1.45, + "learning_rate": 8.18234104060824e-05, + "loss": 0.0063, + "step": 288300 + }, + { + "epoch": 1.45, + "learning_rate": 8.181584271306838e-05, + "loss": 0.0061, + "step": 288310 + }, + { + "epoch": 1.45, + "learning_rate": 8.180827502005438e-05, + "loss": 0.0076, + "step": 288320 + }, + { + "epoch": 1.45, + "learning_rate": 8.180070732704036e-05, + "loss": 0.0059, + "step": 288330 + }, + { + "epoch": 1.45, + "learning_rate": 8.179313963402635e-05, + "loss": 0.0086, + "step": 288340 + }, + { + "epoch": 1.45, + "learning_rate": 8.178557194101235e-05, + "loss": 0.0069, + "step": 288350 + }, + { + "epoch": 1.45, + "learning_rate": 8.177800424799833e-05, + "loss": 0.0077, + "step": 288360 + }, + { + "epoch": 1.45, + "learning_rate": 8.177043655498433e-05, + "loss": 0.0094, + "step": 288370 + }, + { + "epoch": 1.45, + "learning_rate": 8.176286886197032e-05, + "loss": 0.0085, + "step": 288380 + }, + { + "epoch": 1.45, + "learning_rate": 8.17553011689563e-05, + "loss": 0.0101, + "step": 288390 + }, + { + "epoch": 1.46, + "learning_rate": 8.17477334759423e-05, + "loss": 0.0065, + "step": 288400 + }, + { + "epoch": 1.46, + "learning_rate": 8.174016578292828e-05, + "loss": 0.0088, + "step": 288410 + }, + { + "epoch": 1.46, + "learning_rate": 8.173259808991427e-05, + "loss": 0.0083, + "step": 288420 + }, + { + "epoch": 1.46, + "learning_rate": 8.172503039690027e-05, + "loss": 0.0097, + "step": 288430 + }, + { + "epoch": 1.46, + "learning_rate": 8.171746270388625e-05, + "loss": 0.0067, + "step": 288440 + }, + { + "epoch": 1.46, + "learning_rate": 8.170989501087225e-05, + "loss": 0.0082, + "step": 288450 + }, + { + "epoch": 1.46, + "learning_rate": 8.170232731785824e-05, + "loss": 0.0073, + "step": 288460 + }, + { + "epoch": 1.46, + "learning_rate": 8.169475962484422e-05, + "loss": 0.0065, + "step": 288470 + }, + { + "epoch": 1.46, + "learning_rate": 8.168719193183022e-05, + "loss": 0.0098, + "step": 288480 + }, + { + "epoch": 1.46, + "learning_rate": 8.16796242388162e-05, + "loss": 0.0086, + "step": 288490 + }, + { + "epoch": 1.46, + "learning_rate": 8.167205654580219e-05, + "loss": 0.0061, + "step": 288500 + }, + { + "epoch": 1.46, + "learning_rate": 8.166448885278819e-05, + "loss": 0.0107, + "step": 288510 + }, + { + "epoch": 1.46, + "learning_rate": 8.165692115977417e-05, + "loss": 0.0065, + "step": 288520 + }, + { + "epoch": 1.46, + "learning_rate": 8.164935346676016e-05, + "loss": 0.0061, + "step": 288530 + }, + { + "epoch": 1.46, + "learning_rate": 8.164178577374616e-05, + "loss": 0.0061, + "step": 288540 + }, + { + "epoch": 1.46, + "learning_rate": 8.163421808073214e-05, + "loss": 0.0062, + "step": 288550 + }, + { + "epoch": 1.46, + "learning_rate": 8.162665038771814e-05, + "loss": 0.0097, + "step": 288560 + }, + { + "epoch": 1.46, + "learning_rate": 8.161908269470413e-05, + "loss": 0.0077, + "step": 288570 + }, + { + "epoch": 1.46, + "learning_rate": 8.161151500169011e-05, + "loss": 0.0095, + "step": 288580 + }, + { + "epoch": 1.46, + "learning_rate": 8.160394730867611e-05, + "loss": 0.0089, + "step": 288590 + }, + { + "epoch": 1.46, + "learning_rate": 8.159637961566209e-05, + "loss": 0.0075, + "step": 288600 + }, + { + "epoch": 1.46, + "learning_rate": 8.158881192264808e-05, + "loss": 0.0066, + "step": 288610 + }, + { + "epoch": 1.46, + "learning_rate": 8.158124422963408e-05, + "loss": 0.0055, + "step": 288620 + }, + { + "epoch": 1.46, + "learning_rate": 8.157367653662006e-05, + "loss": 0.0078, + "step": 288630 + }, + { + "epoch": 1.46, + "learning_rate": 8.156610884360606e-05, + "loss": 0.0053, + "step": 288640 + }, + { + "epoch": 1.46, + "learning_rate": 8.155854115059205e-05, + "loss": 0.0089, + "step": 288650 + }, + { + "epoch": 1.46, + "learning_rate": 8.155097345757803e-05, + "loss": 0.0053, + "step": 288660 + }, + { + "epoch": 1.46, + "learning_rate": 8.154340576456403e-05, + "loss": 0.0068, + "step": 288670 + }, + { + "epoch": 1.46, + "learning_rate": 8.153583807155001e-05, + "loss": 0.0097, + "step": 288680 + }, + { + "epoch": 1.46, + "learning_rate": 8.1528270378536e-05, + "loss": 0.0109, + "step": 288690 + }, + { + "epoch": 1.46, + "learning_rate": 8.1520702685522e-05, + "loss": 0.006, + "step": 288700 + }, + { + "epoch": 1.46, + "learning_rate": 8.151313499250798e-05, + "loss": 0.0065, + "step": 288710 + }, + { + "epoch": 1.46, + "learning_rate": 8.150556729949397e-05, + "loss": 0.0056, + "step": 288720 + }, + { + "epoch": 1.46, + "learning_rate": 8.149799960647997e-05, + "loss": 0.0076, + "step": 288730 + }, + { + "epoch": 1.46, + "learning_rate": 8.149043191346595e-05, + "loss": 0.0064, + "step": 288740 + }, + { + "epoch": 1.46, + "learning_rate": 8.148286422045195e-05, + "loss": 0.0078, + "step": 288750 + }, + { + "epoch": 1.46, + "learning_rate": 8.147529652743793e-05, + "loss": 0.0084, + "step": 288760 + }, + { + "epoch": 1.46, + "learning_rate": 8.146772883442391e-05, + "loss": 0.0084, + "step": 288770 + }, + { + "epoch": 1.46, + "learning_rate": 8.146016114140989e-05, + "loss": 0.0103, + "step": 288780 + }, + { + "epoch": 1.46, + "learning_rate": 8.145259344839589e-05, + "loss": 0.007, + "step": 288790 + }, + { + "epoch": 1.46, + "learning_rate": 8.144502575538188e-05, + "loss": 0.006, + "step": 288800 + }, + { + "epoch": 1.46, + "learning_rate": 8.143745806236786e-05, + "loss": 0.008, + "step": 288810 + }, + { + "epoch": 1.46, + "learning_rate": 8.142989036935386e-05, + "loss": 0.0071, + "step": 288820 + }, + { + "epoch": 1.46, + "learning_rate": 8.142232267633985e-05, + "loss": 0.0088, + "step": 288830 + }, + { + "epoch": 1.46, + "learning_rate": 8.141475498332583e-05, + "loss": 0.0061, + "step": 288840 + }, + { + "epoch": 1.46, + "learning_rate": 8.140718729031183e-05, + "loss": 0.0086, + "step": 288850 + }, + { + "epoch": 1.46, + "learning_rate": 8.139961959729781e-05, + "loss": 0.0082, + "step": 288860 + }, + { + "epoch": 1.46, + "learning_rate": 8.13920519042838e-05, + "loss": 0.0092, + "step": 288870 + }, + { + "epoch": 1.46, + "learning_rate": 8.13844842112698e-05, + "loss": 0.0092, + "step": 288880 + }, + { + "epoch": 1.46, + "learning_rate": 8.137691651825578e-05, + "loss": 0.008, + "step": 288890 + }, + { + "epoch": 1.46, + "learning_rate": 8.136934882524178e-05, + "loss": 0.0065, + "step": 288900 + }, + { + "epoch": 1.46, + "learning_rate": 8.136178113222777e-05, + "loss": 0.0061, + "step": 288910 + }, + { + "epoch": 1.46, + "learning_rate": 8.135421343921375e-05, + "loss": 0.007, + "step": 288920 + }, + { + "epoch": 1.46, + "learning_rate": 8.134664574619975e-05, + "loss": 0.0085, + "step": 288930 + }, + { + "epoch": 1.46, + "learning_rate": 8.133907805318573e-05, + "loss": 0.0088, + "step": 288940 + }, + { + "epoch": 1.46, + "learning_rate": 8.133151036017172e-05, + "loss": 0.0088, + "step": 288950 + }, + { + "epoch": 1.46, + "learning_rate": 8.132394266715772e-05, + "loss": 0.0072, + "step": 288960 + }, + { + "epoch": 1.46, + "learning_rate": 8.13163749741437e-05, + "loss": 0.0075, + "step": 288970 + }, + { + "epoch": 1.46, + "learning_rate": 8.13088072811297e-05, + "loss": 0.0079, + "step": 288980 + }, + { + "epoch": 1.46, + "learning_rate": 8.130123958811569e-05, + "loss": 0.0069, + "step": 288990 + }, + { + "epoch": 1.46, + "learning_rate": 8.129367189510167e-05, + "loss": 0.0077, + "step": 289000 + }, + { + "epoch": 1.46, + "eval_cer": 0.9144401736232748, + "eval_loss": 0.005669711157679558, + "eval_runtime": 115.6193, + "eval_samples_per_second": 17.298, + "eval_steps_per_second": 4.325, + "step": 289000 + }, + { + "epoch": 1.46, + "learning_rate": 8.128610420208767e-05, + "loss": 0.0083, + "step": 289010 + }, + { + "epoch": 1.46, + "learning_rate": 8.127853650907366e-05, + "loss": 0.0078, + "step": 289020 + }, + { + "epoch": 1.46, + "learning_rate": 8.127096881605964e-05, + "loss": 0.0074, + "step": 289030 + }, + { + "epoch": 1.46, + "learning_rate": 8.126340112304564e-05, + "loss": 0.0092, + "step": 289040 + }, + { + "epoch": 1.46, + "learning_rate": 8.125583343003162e-05, + "loss": 0.0096, + "step": 289050 + }, + { + "epoch": 1.46, + "learning_rate": 8.124826573701761e-05, + "loss": 0.0076, + "step": 289060 + }, + { + "epoch": 1.46, + "learning_rate": 8.124069804400361e-05, + "loss": 0.0094, + "step": 289070 + }, + { + "epoch": 1.46, + "learning_rate": 8.123313035098959e-05, + "loss": 0.0089, + "step": 289080 + }, + { + "epoch": 1.46, + "learning_rate": 8.122556265797559e-05, + "loss": 0.0081, + "step": 289090 + }, + { + "epoch": 1.46, + "learning_rate": 8.121799496496158e-05, + "loss": 0.0074, + "step": 289100 + }, + { + "epoch": 1.46, + "learning_rate": 8.121042727194756e-05, + "loss": 0.0086, + "step": 289110 + }, + { + "epoch": 1.46, + "learning_rate": 8.120285957893356e-05, + "loss": 0.0066, + "step": 289120 + }, + { + "epoch": 1.46, + "learning_rate": 8.119529188591954e-05, + "loss": 0.0077, + "step": 289130 + }, + { + "epoch": 1.46, + "learning_rate": 8.118772419290553e-05, + "loss": 0.0051, + "step": 289140 + }, + { + "epoch": 1.46, + "learning_rate": 8.118015649989153e-05, + "loss": 0.0075, + "step": 289150 + }, + { + "epoch": 1.46, + "learning_rate": 8.117258880687751e-05, + "loss": 0.0066, + "step": 289160 + }, + { + "epoch": 1.46, + "learning_rate": 8.11650211138635e-05, + "loss": 0.0078, + "step": 289170 + }, + { + "epoch": 1.46, + "learning_rate": 8.11574534208495e-05, + "loss": 0.0134, + "step": 289180 + }, + { + "epoch": 1.46, + "learning_rate": 8.114988572783548e-05, + "loss": 0.0069, + "step": 289190 + }, + { + "epoch": 1.46, + "learning_rate": 8.114231803482148e-05, + "loss": 0.0054, + "step": 289200 + }, + { + "epoch": 1.46, + "learning_rate": 8.113475034180746e-05, + "loss": 0.0081, + "step": 289210 + }, + { + "epoch": 1.46, + "learning_rate": 8.112718264879345e-05, + "loss": 0.0065, + "step": 289220 + }, + { + "epoch": 1.46, + "learning_rate": 8.111961495577945e-05, + "loss": 0.0126, + "step": 289230 + }, + { + "epoch": 1.46, + "learning_rate": 8.111204726276543e-05, + "loss": 0.0083, + "step": 289240 + }, + { + "epoch": 1.46, + "learning_rate": 8.110447956975142e-05, + "loss": 0.0057, + "step": 289250 + }, + { + "epoch": 1.46, + "learning_rate": 8.109691187673742e-05, + "loss": 0.0074, + "step": 289260 + }, + { + "epoch": 1.46, + "learning_rate": 8.10893441837234e-05, + "loss": 0.0083, + "step": 289270 + }, + { + "epoch": 1.46, + "learning_rate": 8.10817764907094e-05, + "loss": 0.0078, + "step": 289280 + }, + { + "epoch": 1.46, + "learning_rate": 8.107420879769538e-05, + "loss": 0.0091, + "step": 289290 + }, + { + "epoch": 1.46, + "learning_rate": 8.106664110468137e-05, + "loss": 0.0087, + "step": 289300 + }, + { + "epoch": 1.46, + "learning_rate": 8.105907341166737e-05, + "loss": 0.0074, + "step": 289310 + }, + { + "epoch": 1.46, + "learning_rate": 8.105150571865335e-05, + "loss": 0.0129, + "step": 289320 + }, + { + "epoch": 1.46, + "learning_rate": 8.104393802563934e-05, + "loss": 0.0071, + "step": 289330 + }, + { + "epoch": 1.46, + "learning_rate": 8.103637033262534e-05, + "loss": 0.0109, + "step": 289340 + }, + { + "epoch": 1.46, + "learning_rate": 8.102880263961132e-05, + "loss": 0.0089, + "step": 289350 + }, + { + "epoch": 1.46, + "learning_rate": 8.102123494659732e-05, + "loss": 0.0071, + "step": 289360 + }, + { + "epoch": 1.46, + "learning_rate": 8.10136672535833e-05, + "loss": 0.0074, + "step": 289370 + }, + { + "epoch": 1.46, + "learning_rate": 8.100609956056929e-05, + "loss": 0.0107, + "step": 289380 + }, + { + "epoch": 1.46, + "learning_rate": 8.099853186755529e-05, + "loss": 0.0076, + "step": 289390 + }, + { + "epoch": 1.46, + "learning_rate": 8.099096417454125e-05, + "loss": 0.0075, + "step": 289400 + }, + { + "epoch": 1.46, + "learning_rate": 8.098339648152725e-05, + "loss": 0.0066, + "step": 289410 + }, + { + "epoch": 1.46, + "learning_rate": 8.097582878851323e-05, + "loss": 0.0068, + "step": 289420 + }, + { + "epoch": 1.46, + "learning_rate": 8.096826109549923e-05, + "loss": 0.0068, + "step": 289430 + }, + { + "epoch": 1.46, + "learning_rate": 8.096069340248522e-05, + "loss": 0.0068, + "step": 289440 + }, + { + "epoch": 1.46, + "learning_rate": 8.09531257094712e-05, + "loss": 0.0061, + "step": 289450 + }, + { + "epoch": 1.46, + "learning_rate": 8.09455580164572e-05, + "loss": 0.0067, + "step": 289460 + }, + { + "epoch": 1.46, + "learning_rate": 8.093799032344318e-05, + "loss": 0.0075, + "step": 289470 + }, + { + "epoch": 1.46, + "learning_rate": 8.093042263042917e-05, + "loss": 0.0092, + "step": 289480 + }, + { + "epoch": 1.46, + "learning_rate": 8.092285493741517e-05, + "loss": 0.0063, + "step": 289490 + }, + { + "epoch": 1.46, + "learning_rate": 8.091528724440115e-05, + "loss": 0.0077, + "step": 289500 + }, + { + "epoch": 1.46, + "learning_rate": 8.090771955138715e-05, + "loss": 0.0061, + "step": 289510 + }, + { + "epoch": 1.46, + "learning_rate": 8.090015185837314e-05, + "loss": 0.0064, + "step": 289520 + }, + { + "epoch": 1.46, + "learning_rate": 8.089258416535912e-05, + "loss": 0.0069, + "step": 289530 + }, + { + "epoch": 1.46, + "learning_rate": 8.088501647234512e-05, + "loss": 0.0076, + "step": 289540 + }, + { + "epoch": 1.46, + "learning_rate": 8.087744877933111e-05, + "loss": 0.0095, + "step": 289550 + }, + { + "epoch": 1.46, + "learning_rate": 8.08698810863171e-05, + "loss": 0.0064, + "step": 289560 + }, + { + "epoch": 1.46, + "learning_rate": 8.086231339330309e-05, + "loss": 0.0063, + "step": 289570 + }, + { + "epoch": 1.46, + "learning_rate": 8.085474570028907e-05, + "loss": 0.0075, + "step": 289580 + }, + { + "epoch": 1.46, + "learning_rate": 8.084717800727506e-05, + "loss": 0.0087, + "step": 289590 + }, + { + "epoch": 1.46, + "learning_rate": 8.083961031426106e-05, + "loss": 0.0085, + "step": 289600 + }, + { + "epoch": 1.46, + "learning_rate": 8.083204262124704e-05, + "loss": 0.0058, + "step": 289610 + }, + { + "epoch": 1.46, + "learning_rate": 8.082447492823304e-05, + "loss": 0.0068, + "step": 289620 + }, + { + "epoch": 1.46, + "learning_rate": 8.081690723521903e-05, + "loss": 0.0084, + "step": 289630 + }, + { + "epoch": 1.46, + "learning_rate": 8.080933954220501e-05, + "loss": 0.007, + "step": 289640 + }, + { + "epoch": 1.46, + "learning_rate": 8.080177184919101e-05, + "loss": 0.0063, + "step": 289650 + }, + { + "epoch": 1.46, + "learning_rate": 8.079420415617699e-05, + "loss": 0.0074, + "step": 289660 + }, + { + "epoch": 1.46, + "learning_rate": 8.078663646316298e-05, + "loss": 0.0075, + "step": 289670 + }, + { + "epoch": 1.46, + "learning_rate": 8.077906877014898e-05, + "loss": 0.0087, + "step": 289680 + }, + { + "epoch": 1.46, + "learning_rate": 8.077150107713496e-05, + "loss": 0.0083, + "step": 289690 + }, + { + "epoch": 1.46, + "learning_rate": 8.076393338412096e-05, + "loss": 0.0081, + "step": 289700 + }, + { + "epoch": 1.46, + "learning_rate": 8.075636569110695e-05, + "loss": 0.0069, + "step": 289710 + }, + { + "epoch": 1.46, + "learning_rate": 8.074879799809293e-05, + "loss": 0.0067, + "step": 289720 + }, + { + "epoch": 1.46, + "learning_rate": 8.074123030507893e-05, + "loss": 0.0077, + "step": 289730 + }, + { + "epoch": 1.46, + "learning_rate": 8.073366261206491e-05, + "loss": 0.0057, + "step": 289740 + }, + { + "epoch": 1.46, + "learning_rate": 8.07260949190509e-05, + "loss": 0.0068, + "step": 289750 + }, + { + "epoch": 1.46, + "learning_rate": 8.07185272260369e-05, + "loss": 0.0092, + "step": 289760 + }, + { + "epoch": 1.46, + "learning_rate": 8.071095953302288e-05, + "loss": 0.0071, + "step": 289770 + }, + { + "epoch": 1.46, + "learning_rate": 8.070339184000887e-05, + "loss": 0.0061, + "step": 289780 + }, + { + "epoch": 1.46, + "learning_rate": 8.069582414699487e-05, + "loss": 0.0079, + "step": 289790 + }, + { + "epoch": 1.46, + "learning_rate": 8.068825645398085e-05, + "loss": 0.007, + "step": 289800 + }, + { + "epoch": 1.46, + "learning_rate": 8.068068876096685e-05, + "loss": 0.0064, + "step": 289810 + }, + { + "epoch": 1.46, + "learning_rate": 8.067312106795283e-05, + "loss": 0.0073, + "step": 289820 + }, + { + "epoch": 1.46, + "learning_rate": 8.066555337493882e-05, + "loss": 0.0079, + "step": 289830 + }, + { + "epoch": 1.46, + "learning_rate": 8.065798568192482e-05, + "loss": 0.007, + "step": 289840 + }, + { + "epoch": 1.46, + "learning_rate": 8.06504179889108e-05, + "loss": 0.0076, + "step": 289850 + }, + { + "epoch": 1.46, + "learning_rate": 8.06428502958968e-05, + "loss": 0.0075, + "step": 289860 + }, + { + "epoch": 1.46, + "learning_rate": 8.063528260288279e-05, + "loss": 0.0061, + "step": 289870 + }, + { + "epoch": 1.46, + "learning_rate": 8.062771490986877e-05, + "loss": 0.0087, + "step": 289880 + }, + { + "epoch": 1.46, + "learning_rate": 8.062014721685477e-05, + "loss": 0.0097, + "step": 289890 + }, + { + "epoch": 1.46, + "learning_rate": 8.061257952384075e-05, + "loss": 0.0077, + "step": 289900 + }, + { + "epoch": 1.46, + "learning_rate": 8.060501183082674e-05, + "loss": 0.0085, + "step": 289910 + }, + { + "epoch": 1.46, + "learning_rate": 8.059744413781274e-05, + "loss": 0.007, + "step": 289920 + }, + { + "epoch": 1.46, + "learning_rate": 8.058987644479872e-05, + "loss": 0.0067, + "step": 289930 + }, + { + "epoch": 1.46, + "learning_rate": 8.058230875178471e-05, + "loss": 0.0078, + "step": 289940 + }, + { + "epoch": 1.46, + "learning_rate": 8.057474105877071e-05, + "loss": 0.0072, + "step": 289950 + }, + { + "epoch": 1.46, + "learning_rate": 8.056717336575669e-05, + "loss": 0.0068, + "step": 289960 + }, + { + "epoch": 1.46, + "learning_rate": 8.055960567274268e-05, + "loss": 0.0086, + "step": 289970 + }, + { + "epoch": 1.46, + "learning_rate": 8.055203797972867e-05, + "loss": 0.0066, + "step": 289980 + }, + { + "epoch": 1.46, + "learning_rate": 8.054447028671466e-05, + "loss": 0.0083, + "step": 289990 + }, + { + "epoch": 1.46, + "learning_rate": 8.053690259370066e-05, + "loss": 0.0078, + "step": 290000 + }, + { + "epoch": 1.46, + "eval_cer": 0.9144586111496574, + "eval_loss": 0.005535100121051073, + "eval_runtime": 115.6597, + "eval_samples_per_second": 17.292, + "eval_steps_per_second": 4.323, + "step": 290000 + }, + { + "epoch": 1.46, + "learning_rate": 8.052933490068664e-05, + "loss": 0.0064, + "step": 290010 + }, + { + "epoch": 1.46, + "learning_rate": 8.052176720767263e-05, + "loss": 0.0088, + "step": 290020 + }, + { + "epoch": 1.46, + "learning_rate": 8.05141995146586e-05, + "loss": 0.0092, + "step": 290030 + }, + { + "epoch": 1.46, + "learning_rate": 8.05066318216446e-05, + "loss": 0.01, + "step": 290040 + }, + { + "epoch": 1.46, + "learning_rate": 8.049906412863059e-05, + "loss": 0.0075, + "step": 290050 + }, + { + "epoch": 1.46, + "learning_rate": 8.049149643561657e-05, + "loss": 0.0086, + "step": 290060 + }, + { + "epoch": 1.46, + "learning_rate": 8.048392874260257e-05, + "loss": 0.0071, + "step": 290070 + }, + { + "epoch": 1.46, + "learning_rate": 8.047636104958856e-05, + "loss": 0.0067, + "step": 290080 + }, + { + "epoch": 1.46, + "learning_rate": 8.046879335657454e-05, + "loss": 0.0062, + "step": 290090 + }, + { + "epoch": 1.46, + "learning_rate": 8.046122566356054e-05, + "loss": 0.0078, + "step": 290100 + }, + { + "epoch": 1.46, + "learning_rate": 8.045365797054652e-05, + "loss": 0.0079, + "step": 290110 + }, + { + "epoch": 1.46, + "learning_rate": 8.044609027753252e-05, + "loss": 0.0057, + "step": 290120 + }, + { + "epoch": 1.46, + "learning_rate": 8.043852258451851e-05, + "loss": 0.0101, + "step": 290130 + }, + { + "epoch": 1.46, + "learning_rate": 8.043095489150449e-05, + "loss": 0.0063, + "step": 290140 + }, + { + "epoch": 1.46, + "learning_rate": 8.042338719849049e-05, + "loss": 0.0072, + "step": 290150 + }, + { + "epoch": 1.46, + "learning_rate": 8.041581950547648e-05, + "loss": 0.0078, + "step": 290160 + }, + { + "epoch": 1.46, + "learning_rate": 8.040825181246246e-05, + "loss": 0.007, + "step": 290170 + }, + { + "epoch": 1.46, + "learning_rate": 8.040068411944846e-05, + "loss": 0.0085, + "step": 290180 + }, + { + "epoch": 1.46, + "learning_rate": 8.039311642643444e-05, + "loss": 0.0089, + "step": 290190 + }, + { + "epoch": 1.46, + "learning_rate": 8.038554873342043e-05, + "loss": 0.0091, + "step": 290200 + }, + { + "epoch": 1.46, + "learning_rate": 8.037798104040643e-05, + "loss": 0.0055, + "step": 290210 + }, + { + "epoch": 1.46, + "learning_rate": 8.037041334739241e-05, + "loss": 0.0091, + "step": 290220 + }, + { + "epoch": 1.46, + "learning_rate": 8.03628456543784e-05, + "loss": 0.0073, + "step": 290230 + }, + { + "epoch": 1.46, + "learning_rate": 8.03552779613644e-05, + "loss": 0.0066, + "step": 290240 + }, + { + "epoch": 1.46, + "learning_rate": 8.034771026835038e-05, + "loss": 0.0065, + "step": 290250 + }, + { + "epoch": 1.46, + "learning_rate": 8.034014257533638e-05, + "loss": 0.008, + "step": 290260 + }, + { + "epoch": 1.46, + "learning_rate": 8.033257488232236e-05, + "loss": 0.006, + "step": 290270 + }, + { + "epoch": 1.46, + "learning_rate": 8.032500718930835e-05, + "loss": 0.0061, + "step": 290280 + }, + { + "epoch": 1.46, + "learning_rate": 8.031743949629435e-05, + "loss": 0.0073, + "step": 290290 + }, + { + "epoch": 1.46, + "learning_rate": 8.030987180328033e-05, + "loss": 0.0075, + "step": 290300 + }, + { + "epoch": 1.46, + "learning_rate": 8.030230411026633e-05, + "loss": 0.0068, + "step": 290310 + }, + { + "epoch": 1.46, + "learning_rate": 8.029473641725232e-05, + "loss": 0.0066, + "step": 290320 + }, + { + "epoch": 1.46, + "learning_rate": 8.02871687242383e-05, + "loss": 0.0066, + "step": 290330 + }, + { + "epoch": 1.46, + "learning_rate": 8.02796010312243e-05, + "loss": 0.0081, + "step": 290340 + }, + { + "epoch": 1.46, + "learning_rate": 8.027203333821028e-05, + "loss": 0.0063, + "step": 290350 + }, + { + "epoch": 1.46, + "learning_rate": 8.026446564519627e-05, + "loss": 0.0075, + "step": 290360 + }, + { + "epoch": 1.46, + "learning_rate": 8.025689795218227e-05, + "loss": 0.0081, + "step": 290370 + }, + { + "epoch": 1.46, + "learning_rate": 8.024933025916825e-05, + "loss": 0.0071, + "step": 290380 + }, + { + "epoch": 1.47, + "learning_rate": 8.024176256615424e-05, + "loss": 0.007, + "step": 290390 + }, + { + "epoch": 1.47, + "learning_rate": 8.023419487314024e-05, + "loss": 0.0057, + "step": 290400 + }, + { + "epoch": 1.47, + "learning_rate": 8.022662718012622e-05, + "loss": 0.0058, + "step": 290410 + }, + { + "epoch": 1.47, + "learning_rate": 8.021905948711222e-05, + "loss": 0.0077, + "step": 290420 + }, + { + "epoch": 1.47, + "learning_rate": 8.02114917940982e-05, + "loss": 0.0067, + "step": 290430 + }, + { + "epoch": 1.47, + "learning_rate": 8.020392410108419e-05, + "loss": 0.0058, + "step": 290440 + }, + { + "epoch": 1.47, + "learning_rate": 8.019635640807019e-05, + "loss": 0.0095, + "step": 290450 + }, + { + "epoch": 1.47, + "learning_rate": 8.018878871505617e-05, + "loss": 0.0098, + "step": 290460 + }, + { + "epoch": 1.47, + "learning_rate": 8.018122102204216e-05, + "loss": 0.0105, + "step": 290470 + }, + { + "epoch": 1.47, + "learning_rate": 8.017365332902816e-05, + "loss": 0.007, + "step": 290480 + }, + { + "epoch": 1.47, + "learning_rate": 8.016608563601414e-05, + "loss": 0.0059, + "step": 290490 + }, + { + "epoch": 1.47, + "learning_rate": 8.015851794300014e-05, + "loss": 0.0067, + "step": 290500 + }, + { + "epoch": 1.47, + "learning_rate": 8.015095024998613e-05, + "loss": 0.009, + "step": 290510 + }, + { + "epoch": 1.47, + "learning_rate": 8.014338255697211e-05, + "loss": 0.0062, + "step": 290520 + }, + { + "epoch": 1.47, + "learning_rate": 8.01358148639581e-05, + "loss": 0.0079, + "step": 290530 + }, + { + "epoch": 1.47, + "learning_rate": 8.012824717094409e-05, + "loss": 0.0063, + "step": 290540 + }, + { + "epoch": 1.47, + "learning_rate": 8.012067947793008e-05, + "loss": 0.0073, + "step": 290550 + }, + { + "epoch": 1.47, + "learning_rate": 8.011311178491608e-05, + "loss": 0.0069, + "step": 290560 + }, + { + "epoch": 1.47, + "learning_rate": 8.010554409190206e-05, + "loss": 0.0082, + "step": 290570 + }, + { + "epoch": 1.47, + "learning_rate": 8.009797639888805e-05, + "loss": 0.0099, + "step": 290580 + }, + { + "epoch": 1.47, + "learning_rate": 8.009040870587405e-05, + "loss": 0.0081, + "step": 290590 + }, + { + "epoch": 1.47, + "learning_rate": 8.008284101286003e-05, + "loss": 0.0058, + "step": 290600 + }, + { + "epoch": 1.47, + "learning_rate": 8.007527331984603e-05, + "loss": 0.0069, + "step": 290610 + }, + { + "epoch": 1.47, + "learning_rate": 8.006770562683201e-05, + "loss": 0.008, + "step": 290620 + }, + { + "epoch": 1.47, + "learning_rate": 8.0060137933818e-05, + "loss": 0.0076, + "step": 290630 + }, + { + "epoch": 1.47, + "learning_rate": 8.0052570240804e-05, + "loss": 0.0069, + "step": 290640 + }, + { + "epoch": 1.47, + "learning_rate": 8.004500254778998e-05, + "loss": 0.0066, + "step": 290650 + }, + { + "epoch": 1.47, + "learning_rate": 8.003743485477596e-05, + "loss": 0.0074, + "step": 290660 + }, + { + "epoch": 1.47, + "learning_rate": 8.002986716176194e-05, + "loss": 0.0059, + "step": 290670 + }, + { + "epoch": 1.47, + "learning_rate": 8.002229946874794e-05, + "loss": 0.0061, + "step": 290680 + }, + { + "epoch": 1.47, + "learning_rate": 8.001473177573393e-05, + "loss": 0.0069, + "step": 290690 + }, + { + "epoch": 1.47, + "learning_rate": 8.000716408271991e-05, + "loss": 0.0054, + "step": 290700 + }, + { + "epoch": 1.47, + "learning_rate": 7.999959638970591e-05, + "loss": 0.0069, + "step": 290710 + }, + { + "epoch": 1.47, + "learning_rate": 7.999202869669189e-05, + "loss": 0.0099, + "step": 290720 + }, + { + "epoch": 1.47, + "learning_rate": 7.998446100367788e-05, + "loss": 0.0087, + "step": 290730 + }, + { + "epoch": 1.47, + "learning_rate": 7.997689331066388e-05, + "loss": 0.008, + "step": 290740 + }, + { + "epoch": 1.47, + "learning_rate": 7.996932561764986e-05, + "loss": 0.0067, + "step": 290750 + }, + { + "epoch": 1.47, + "learning_rate": 7.996175792463586e-05, + "loss": 0.0086, + "step": 290760 + }, + { + "epoch": 1.47, + "learning_rate": 7.995419023162185e-05, + "loss": 0.0082, + "step": 290770 + }, + { + "epoch": 1.47, + "learning_rate": 7.994662253860783e-05, + "loss": 0.0076, + "step": 290780 + }, + { + "epoch": 1.47, + "learning_rate": 7.993905484559383e-05, + "loss": 0.0088, + "step": 290790 + }, + { + "epoch": 1.47, + "learning_rate": 7.993148715257981e-05, + "loss": 0.0075, + "step": 290800 + }, + { + "epoch": 1.47, + "learning_rate": 7.99239194595658e-05, + "loss": 0.0065, + "step": 290810 + }, + { + "epoch": 1.47, + "learning_rate": 7.99163517665518e-05, + "loss": 0.0085, + "step": 290820 + }, + { + "epoch": 1.47, + "learning_rate": 7.990878407353778e-05, + "loss": 0.0107, + "step": 290830 + }, + { + "epoch": 1.47, + "learning_rate": 7.990121638052378e-05, + "loss": 0.008, + "step": 290840 + }, + { + "epoch": 1.47, + "learning_rate": 7.989364868750977e-05, + "loss": 0.009, + "step": 290850 + }, + { + "epoch": 1.47, + "learning_rate": 7.988608099449575e-05, + "loss": 0.008, + "step": 290860 + }, + { + "epoch": 1.47, + "learning_rate": 7.987851330148175e-05, + "loss": 0.0079, + "step": 290870 + }, + { + "epoch": 1.47, + "learning_rate": 7.987094560846773e-05, + "loss": 0.0075, + "step": 290880 + }, + { + "epoch": 1.47, + "learning_rate": 7.986337791545372e-05, + "loss": 0.0104, + "step": 290890 + }, + { + "epoch": 1.47, + "learning_rate": 7.985581022243972e-05, + "loss": 0.0059, + "step": 290900 + }, + { + "epoch": 1.47, + "learning_rate": 7.98482425294257e-05, + "loss": 0.0065, + "step": 290910 + }, + { + "epoch": 1.47, + "learning_rate": 7.98406748364117e-05, + "loss": 0.0068, + "step": 290920 + }, + { + "epoch": 1.47, + "learning_rate": 7.983310714339769e-05, + "loss": 0.0076, + "step": 290930 + }, + { + "epoch": 1.47, + "learning_rate": 7.982553945038367e-05, + "loss": 0.0061, + "step": 290940 + }, + { + "epoch": 1.47, + "learning_rate": 7.981797175736967e-05, + "loss": 0.0078, + "step": 290950 + }, + { + "epoch": 1.47, + "learning_rate": 7.981040406435566e-05, + "loss": 0.0078, + "step": 290960 + }, + { + "epoch": 1.47, + "learning_rate": 7.980283637134164e-05, + "loss": 0.0056, + "step": 290970 + }, + { + "epoch": 1.47, + "learning_rate": 7.979526867832764e-05, + "loss": 0.0072, + "step": 290980 + }, + { + "epoch": 1.47, + "learning_rate": 7.978770098531362e-05, + "loss": 0.0065, + "step": 290990 + }, + { + "epoch": 1.47, + "learning_rate": 7.978013329229961e-05, + "loss": 0.0068, + "step": 291000 + }, + { + "epoch": 1.47, + "eval_cer": 0.9144314400581461, + "eval_loss": 0.00572578888386488, + "eval_runtime": 115.7089, + "eval_samples_per_second": 17.285, + "eval_steps_per_second": 4.321, + "step": 291000 + }, + { + "epoch": 1.47, + "learning_rate": 7.977256559928561e-05, + "loss": 0.0074, + "step": 291010 + }, + { + "epoch": 1.47, + "learning_rate": 7.976499790627159e-05, + "loss": 0.0065, + "step": 291020 + }, + { + "epoch": 1.47, + "learning_rate": 7.975743021325759e-05, + "loss": 0.0072, + "step": 291030 + }, + { + "epoch": 1.47, + "learning_rate": 7.974986252024358e-05, + "loss": 0.0094, + "step": 291040 + }, + { + "epoch": 1.47, + "learning_rate": 7.974229482722956e-05, + "loss": 0.0063, + "step": 291050 + }, + { + "epoch": 1.47, + "learning_rate": 7.973472713421556e-05, + "loss": 0.0079, + "step": 291060 + }, + { + "epoch": 1.47, + "learning_rate": 7.972715944120154e-05, + "loss": 0.0072, + "step": 291070 + }, + { + "epoch": 1.47, + "learning_rate": 7.971959174818753e-05, + "loss": 0.0079, + "step": 291080 + }, + { + "epoch": 1.47, + "learning_rate": 7.971202405517353e-05, + "loss": 0.0082, + "step": 291090 + }, + { + "epoch": 1.47, + "learning_rate": 7.970445636215951e-05, + "loss": 0.0075, + "step": 291100 + }, + { + "epoch": 1.47, + "learning_rate": 7.96968886691455e-05, + "loss": 0.0072, + "step": 291110 + }, + { + "epoch": 1.47, + "learning_rate": 7.96893209761315e-05, + "loss": 0.0062, + "step": 291120 + }, + { + "epoch": 1.47, + "learning_rate": 7.968175328311748e-05, + "loss": 0.0069, + "step": 291130 + }, + { + "epoch": 1.47, + "learning_rate": 7.967418559010348e-05, + "loss": 0.0065, + "step": 291140 + }, + { + "epoch": 1.47, + "learning_rate": 7.966661789708946e-05, + "loss": 0.0064, + "step": 291150 + }, + { + "epoch": 1.47, + "learning_rate": 7.965905020407545e-05, + "loss": 0.0065, + "step": 291160 + }, + { + "epoch": 1.47, + "learning_rate": 7.965148251106145e-05, + "loss": 0.0084, + "step": 291170 + }, + { + "epoch": 1.47, + "learning_rate": 7.964391481804743e-05, + "loss": 0.0071, + "step": 291180 + }, + { + "epoch": 1.47, + "learning_rate": 7.963634712503342e-05, + "loss": 0.0065, + "step": 291190 + }, + { + "epoch": 1.47, + "learning_rate": 7.962877943201942e-05, + "loss": 0.0054, + "step": 291200 + }, + { + "epoch": 1.47, + "learning_rate": 7.96212117390054e-05, + "loss": 0.0094, + "step": 291210 + }, + { + "epoch": 1.47, + "learning_rate": 7.96136440459914e-05, + "loss": 0.0073, + "step": 291220 + }, + { + "epoch": 1.47, + "learning_rate": 7.960607635297738e-05, + "loss": 0.0085, + "step": 291230 + }, + { + "epoch": 1.47, + "learning_rate": 7.959850865996337e-05, + "loss": 0.007, + "step": 291240 + }, + { + "epoch": 1.47, + "learning_rate": 7.959094096694937e-05, + "loss": 0.0076, + "step": 291250 + }, + { + "epoch": 1.47, + "learning_rate": 7.958337327393535e-05, + "loss": 0.0101, + "step": 291260 + }, + { + "epoch": 1.47, + "learning_rate": 7.957580558092134e-05, + "loss": 0.0066, + "step": 291270 + }, + { + "epoch": 1.47, + "learning_rate": 7.956823788790734e-05, + "loss": 0.0074, + "step": 291280 + }, + { + "epoch": 1.47, + "learning_rate": 7.95606701948933e-05, + "loss": 0.0065, + "step": 291290 + }, + { + "epoch": 1.47, + "learning_rate": 7.95531025018793e-05, + "loss": 0.0066, + "step": 291300 + }, + { + "epoch": 1.47, + "learning_rate": 7.954553480886528e-05, + "loss": 0.0076, + "step": 291310 + }, + { + "epoch": 1.47, + "learning_rate": 7.953796711585128e-05, + "loss": 0.0076, + "step": 291320 + }, + { + "epoch": 1.47, + "learning_rate": 7.953039942283726e-05, + "loss": 0.0058, + "step": 291330 + }, + { + "epoch": 1.47, + "learning_rate": 7.952283172982325e-05, + "loss": 0.0048, + "step": 291340 + }, + { + "epoch": 1.47, + "learning_rate": 7.951526403680925e-05, + "loss": 0.0088, + "step": 291350 + }, + { + "epoch": 1.47, + "learning_rate": 7.950769634379523e-05, + "loss": 0.0076, + "step": 291360 + }, + { + "epoch": 1.47, + "learning_rate": 7.950012865078123e-05, + "loss": 0.0103, + "step": 291370 + }, + { + "epoch": 1.47, + "learning_rate": 7.949256095776722e-05, + "loss": 0.0063, + "step": 291380 + }, + { + "epoch": 1.47, + "learning_rate": 7.94849932647532e-05, + "loss": 0.0058, + "step": 291390 + }, + { + "epoch": 1.47, + "learning_rate": 7.94774255717392e-05, + "loss": 0.0081, + "step": 291400 + }, + { + "epoch": 1.47, + "learning_rate": 7.946985787872518e-05, + "loss": 0.0072, + "step": 291410 + }, + { + "epoch": 1.47, + "learning_rate": 7.946229018571117e-05, + "loss": 0.0056, + "step": 291420 + }, + { + "epoch": 1.47, + "learning_rate": 7.945472249269717e-05, + "loss": 0.0075, + "step": 291430 + }, + { + "epoch": 1.47, + "learning_rate": 7.944715479968315e-05, + "loss": 0.0101, + "step": 291440 + }, + { + "epoch": 1.47, + "learning_rate": 7.943958710666914e-05, + "loss": 0.0093, + "step": 291450 + }, + { + "epoch": 1.47, + "learning_rate": 7.943201941365514e-05, + "loss": 0.0067, + "step": 291460 + }, + { + "epoch": 1.47, + "learning_rate": 7.942445172064112e-05, + "loss": 0.006, + "step": 291470 + }, + { + "epoch": 1.47, + "learning_rate": 7.941688402762712e-05, + "loss": 0.0071, + "step": 291480 + }, + { + "epoch": 1.47, + "learning_rate": 7.940931633461311e-05, + "loss": 0.0074, + "step": 291490 + }, + { + "epoch": 1.47, + "learning_rate": 7.940174864159909e-05, + "loss": 0.0118, + "step": 291500 + }, + { + "epoch": 1.47, + "learning_rate": 7.939418094858509e-05, + "loss": 0.0119, + "step": 291510 + }, + { + "epoch": 1.47, + "learning_rate": 7.938661325557107e-05, + "loss": 0.0089, + "step": 291520 + }, + { + "epoch": 1.47, + "learning_rate": 7.937904556255706e-05, + "loss": 0.0066, + "step": 291530 + }, + { + "epoch": 1.47, + "learning_rate": 7.937147786954306e-05, + "loss": 0.0084, + "step": 291540 + }, + { + "epoch": 1.47, + "learning_rate": 7.936391017652904e-05, + "loss": 0.0069, + "step": 291550 + }, + { + "epoch": 1.47, + "learning_rate": 7.935634248351504e-05, + "loss": 0.0099, + "step": 291560 + }, + { + "epoch": 1.47, + "learning_rate": 7.934877479050103e-05, + "loss": 0.0138, + "step": 291570 + }, + { + "epoch": 1.47, + "learning_rate": 7.934120709748701e-05, + "loss": 0.0103, + "step": 291580 + }, + { + "epoch": 1.47, + "learning_rate": 7.933363940447301e-05, + "loss": 0.0076, + "step": 291590 + }, + { + "epoch": 1.47, + "learning_rate": 7.932607171145899e-05, + "loss": 0.0089, + "step": 291600 + }, + { + "epoch": 1.47, + "learning_rate": 7.931850401844498e-05, + "loss": 0.0085, + "step": 291610 + }, + { + "epoch": 1.47, + "learning_rate": 7.931093632543098e-05, + "loss": 0.0066, + "step": 291620 + }, + { + "epoch": 1.47, + "learning_rate": 7.930336863241696e-05, + "loss": 0.0063, + "step": 291630 + }, + { + "epoch": 1.47, + "learning_rate": 7.929580093940295e-05, + "loss": 0.0085, + "step": 291640 + }, + { + "epoch": 1.47, + "learning_rate": 7.928823324638895e-05, + "loss": 0.0061, + "step": 291650 + }, + { + "epoch": 1.47, + "learning_rate": 7.928066555337493e-05, + "loss": 0.0066, + "step": 291660 + }, + { + "epoch": 1.47, + "learning_rate": 7.927309786036093e-05, + "loss": 0.0082, + "step": 291670 + }, + { + "epoch": 1.47, + "learning_rate": 7.926553016734691e-05, + "loss": 0.0107, + "step": 291680 + }, + { + "epoch": 1.47, + "learning_rate": 7.92579624743329e-05, + "loss": 0.0096, + "step": 291690 + }, + { + "epoch": 1.47, + "learning_rate": 7.92503947813189e-05, + "loss": 0.0065, + "step": 291700 + }, + { + "epoch": 1.47, + "learning_rate": 7.924282708830488e-05, + "loss": 0.007, + "step": 291710 + }, + { + "epoch": 1.47, + "learning_rate": 7.923525939529087e-05, + "loss": 0.0076, + "step": 291720 + }, + { + "epoch": 1.47, + "learning_rate": 7.922769170227687e-05, + "loss": 0.0083, + "step": 291730 + }, + { + "epoch": 1.47, + "learning_rate": 7.922012400926285e-05, + "loss": 0.0069, + "step": 291740 + }, + { + "epoch": 1.47, + "learning_rate": 7.921255631624885e-05, + "loss": 0.0074, + "step": 291750 + }, + { + "epoch": 1.47, + "learning_rate": 7.920498862323483e-05, + "loss": 0.0069, + "step": 291760 + }, + { + "epoch": 1.47, + "learning_rate": 7.919742093022082e-05, + "loss": 0.0076, + "step": 291770 + }, + { + "epoch": 1.47, + "learning_rate": 7.918985323720682e-05, + "loss": 0.0088, + "step": 291780 + }, + { + "epoch": 1.47, + "learning_rate": 7.91822855441928e-05, + "loss": 0.006, + "step": 291790 + }, + { + "epoch": 1.47, + "learning_rate": 7.91747178511788e-05, + "loss": 0.0103, + "step": 291800 + }, + { + "epoch": 1.47, + "learning_rate": 7.916715015816479e-05, + "loss": 0.006, + "step": 291810 + }, + { + "epoch": 1.47, + "learning_rate": 7.915958246515077e-05, + "loss": 0.0069, + "step": 291820 + }, + { + "epoch": 1.47, + "learning_rate": 7.915201477213676e-05, + "loss": 0.0069, + "step": 291830 + }, + { + "epoch": 1.47, + "learning_rate": 7.914444707912275e-05, + "loss": 0.0095, + "step": 291840 + }, + { + "epoch": 1.47, + "learning_rate": 7.913687938610874e-05, + "loss": 0.0098, + "step": 291850 + }, + { + "epoch": 1.47, + "learning_rate": 7.912931169309474e-05, + "loss": 0.008, + "step": 291860 + }, + { + "epoch": 1.47, + "learning_rate": 7.912174400008072e-05, + "loss": 0.009, + "step": 291870 + }, + { + "epoch": 1.47, + "learning_rate": 7.911417630706671e-05, + "loss": 0.006, + "step": 291880 + }, + { + "epoch": 1.47, + "learning_rate": 7.910660861405271e-05, + "loss": 0.0084, + "step": 291890 + }, + { + "epoch": 1.47, + "learning_rate": 7.909904092103869e-05, + "loss": 0.0072, + "step": 291900 + }, + { + "epoch": 1.47, + "learning_rate": 7.909147322802468e-05, + "loss": 0.006, + "step": 291910 + }, + { + "epoch": 1.47, + "learning_rate": 7.908390553501065e-05, + "loss": 0.0075, + "step": 291920 + }, + { + "epoch": 1.47, + "learning_rate": 7.907633784199665e-05, + "loss": 0.008, + "step": 291930 + }, + { + "epoch": 1.47, + "learning_rate": 7.906877014898264e-05, + "loss": 0.009, + "step": 291940 + }, + { + "epoch": 1.47, + "learning_rate": 7.906120245596862e-05, + "loss": 0.0079, + "step": 291950 + }, + { + "epoch": 1.47, + "learning_rate": 7.905363476295462e-05, + "loss": 0.0068, + "step": 291960 + }, + { + "epoch": 1.47, + "learning_rate": 7.90460670699406e-05, + "loss": 0.0057, + "step": 291970 + }, + { + "epoch": 1.47, + "learning_rate": 7.90384993769266e-05, + "loss": 0.0086, + "step": 291980 + }, + { + "epoch": 1.47, + "learning_rate": 7.903093168391259e-05, + "loss": 0.0059, + "step": 291990 + }, + { + "epoch": 1.47, + "learning_rate": 7.902336399089857e-05, + "loss": 0.0061, + "step": 292000 + }, + { + "epoch": 1.47, + "eval_cer": 0.9144362920387732, + "eval_loss": 0.0056129819713532925, + "eval_runtime": 115.8149, + "eval_samples_per_second": 17.269, + "eval_steps_per_second": 4.317, + "step": 292000 + }, + { + "epoch": 1.47, + "learning_rate": 7.901579629788457e-05, + "loss": 0.0076, + "step": 292010 + }, + { + "epoch": 1.47, + "learning_rate": 7.900822860487056e-05, + "loss": 0.0053, + "step": 292020 + }, + { + "epoch": 1.47, + "learning_rate": 7.900066091185654e-05, + "loss": 0.0056, + "step": 292030 + }, + { + "epoch": 1.47, + "learning_rate": 7.899309321884254e-05, + "loss": 0.008, + "step": 292040 + }, + { + "epoch": 1.47, + "learning_rate": 7.898552552582852e-05, + "loss": 0.0089, + "step": 292050 + }, + { + "epoch": 1.47, + "learning_rate": 7.897795783281451e-05, + "loss": 0.0076, + "step": 292060 + }, + { + "epoch": 1.47, + "learning_rate": 7.897039013980051e-05, + "loss": 0.0095, + "step": 292070 + }, + { + "epoch": 1.47, + "learning_rate": 7.896282244678649e-05, + "loss": 0.0099, + "step": 292080 + }, + { + "epoch": 1.47, + "learning_rate": 7.895525475377249e-05, + "loss": 0.0069, + "step": 292090 + }, + { + "epoch": 1.47, + "learning_rate": 7.894768706075848e-05, + "loss": 0.0068, + "step": 292100 + }, + { + "epoch": 1.47, + "learning_rate": 7.894011936774446e-05, + "loss": 0.0063, + "step": 292110 + }, + { + "epoch": 1.47, + "learning_rate": 7.893255167473046e-05, + "loss": 0.0073, + "step": 292120 + }, + { + "epoch": 1.47, + "learning_rate": 7.892498398171644e-05, + "loss": 0.0071, + "step": 292130 + }, + { + "epoch": 1.47, + "learning_rate": 7.891741628870243e-05, + "loss": 0.0078, + "step": 292140 + }, + { + "epoch": 1.47, + "learning_rate": 7.890984859568843e-05, + "loss": 0.0091, + "step": 292150 + }, + { + "epoch": 1.47, + "learning_rate": 7.890228090267441e-05, + "loss": 0.009, + "step": 292160 + }, + { + "epoch": 1.47, + "learning_rate": 7.88947132096604e-05, + "loss": 0.007, + "step": 292170 + }, + { + "epoch": 1.47, + "learning_rate": 7.88871455166464e-05, + "loss": 0.007, + "step": 292180 + }, + { + "epoch": 1.47, + "learning_rate": 7.887957782363238e-05, + "loss": 0.0096, + "step": 292190 + }, + { + "epoch": 1.47, + "learning_rate": 7.887201013061838e-05, + "loss": 0.0073, + "step": 292200 + }, + { + "epoch": 1.47, + "learning_rate": 7.886444243760436e-05, + "loss": 0.007, + "step": 292210 + }, + { + "epoch": 1.47, + "learning_rate": 7.885687474459035e-05, + "loss": 0.0093, + "step": 292220 + }, + { + "epoch": 1.47, + "learning_rate": 7.884930705157635e-05, + "loss": 0.0076, + "step": 292230 + }, + { + "epoch": 1.47, + "learning_rate": 7.884173935856233e-05, + "loss": 0.0087, + "step": 292240 + }, + { + "epoch": 1.47, + "learning_rate": 7.883417166554832e-05, + "loss": 0.0087, + "step": 292250 + }, + { + "epoch": 1.47, + "learning_rate": 7.882660397253432e-05, + "loss": 0.0072, + "step": 292260 + }, + { + "epoch": 1.47, + "learning_rate": 7.88190362795203e-05, + "loss": 0.0077, + "step": 292270 + }, + { + "epoch": 1.47, + "learning_rate": 7.88114685865063e-05, + "loss": 0.009, + "step": 292280 + }, + { + "epoch": 1.47, + "learning_rate": 7.880390089349228e-05, + "loss": 0.0054, + "step": 292290 + }, + { + "epoch": 1.47, + "learning_rate": 7.879633320047827e-05, + "loss": 0.0058, + "step": 292300 + }, + { + "epoch": 1.47, + "learning_rate": 7.878876550746427e-05, + "loss": 0.0056, + "step": 292310 + }, + { + "epoch": 1.47, + "learning_rate": 7.878119781445025e-05, + "loss": 0.0081, + "step": 292320 + }, + { + "epoch": 1.47, + "learning_rate": 7.877363012143624e-05, + "loss": 0.0059, + "step": 292330 + }, + { + "epoch": 1.47, + "learning_rate": 7.876606242842224e-05, + "loss": 0.0077, + "step": 292340 + }, + { + "epoch": 1.47, + "learning_rate": 7.875849473540822e-05, + "loss": 0.0067, + "step": 292350 + }, + { + "epoch": 1.47, + "learning_rate": 7.875092704239421e-05, + "loss": 0.0073, + "step": 292360 + }, + { + "epoch": 1.48, + "learning_rate": 7.87433593493802e-05, + "loss": 0.0094, + "step": 292370 + }, + { + "epoch": 1.48, + "learning_rate": 7.873579165636619e-05, + "loss": 0.0057, + "step": 292380 + }, + { + "epoch": 1.48, + "learning_rate": 7.872822396335219e-05, + "loss": 0.008, + "step": 292390 + }, + { + "epoch": 1.48, + "learning_rate": 7.872065627033817e-05, + "loss": 0.0082, + "step": 292400 + }, + { + "epoch": 1.48, + "learning_rate": 7.871308857732416e-05, + "loss": 0.0072, + "step": 292410 + }, + { + "epoch": 1.48, + "learning_rate": 7.870552088431016e-05, + "loss": 0.0052, + "step": 292420 + }, + { + "epoch": 1.48, + "learning_rate": 7.869795319129614e-05, + "loss": 0.0072, + "step": 292430 + }, + { + "epoch": 1.48, + "learning_rate": 7.869038549828213e-05, + "loss": 0.0069, + "step": 292440 + }, + { + "epoch": 1.48, + "learning_rate": 7.868281780526813e-05, + "loss": 0.0056, + "step": 292450 + }, + { + "epoch": 1.48, + "learning_rate": 7.867525011225411e-05, + "loss": 0.0094, + "step": 292460 + }, + { + "epoch": 1.48, + "learning_rate": 7.86676824192401e-05, + "loss": 0.0074, + "step": 292470 + }, + { + "epoch": 1.48, + "learning_rate": 7.866011472622609e-05, + "loss": 0.0078, + "step": 292480 + }, + { + "epoch": 1.48, + "learning_rate": 7.865254703321208e-05, + "loss": 0.0064, + "step": 292490 + }, + { + "epoch": 1.48, + "learning_rate": 7.864497934019808e-05, + "loss": 0.008, + "step": 292500 + }, + { + "epoch": 1.48, + "learning_rate": 7.863741164718406e-05, + "loss": 0.0072, + "step": 292510 + }, + { + "epoch": 1.48, + "learning_rate": 7.862984395417005e-05, + "loss": 0.0045, + "step": 292520 + }, + { + "epoch": 1.48, + "learning_rate": 7.862227626115605e-05, + "loss": 0.0054, + "step": 292530 + }, + { + "epoch": 1.48, + "learning_rate": 7.861470856814203e-05, + "loss": 0.006, + "step": 292540 + }, + { + "epoch": 1.48, + "learning_rate": 7.860714087512801e-05, + "loss": 0.0077, + "step": 292550 + }, + { + "epoch": 1.48, + "learning_rate": 7.859957318211399e-05, + "loss": 0.0068, + "step": 292560 + }, + { + "epoch": 1.48, + "learning_rate": 7.859200548909999e-05, + "loss": 0.0079, + "step": 292570 + }, + { + "epoch": 1.48, + "learning_rate": 7.858443779608597e-05, + "loss": 0.0064, + "step": 292580 + }, + { + "epoch": 1.48, + "learning_rate": 7.857687010307196e-05, + "loss": 0.0076, + "step": 292590 + }, + { + "epoch": 1.48, + "learning_rate": 7.856930241005796e-05, + "loss": 0.0085, + "step": 292600 + }, + { + "epoch": 1.48, + "learning_rate": 7.856173471704394e-05, + "loss": 0.0062, + "step": 292610 + }, + { + "epoch": 1.48, + "learning_rate": 7.855416702402994e-05, + "loss": 0.0094, + "step": 292620 + }, + { + "epoch": 1.48, + "learning_rate": 7.854659933101593e-05, + "loss": 0.0065, + "step": 292630 + }, + { + "epoch": 1.48, + "learning_rate": 7.853903163800191e-05, + "loss": 0.0078, + "step": 292640 + }, + { + "epoch": 1.48, + "learning_rate": 7.853146394498791e-05, + "loss": 0.0071, + "step": 292650 + }, + { + "epoch": 1.48, + "learning_rate": 7.852389625197389e-05, + "loss": 0.0081, + "step": 292660 + }, + { + "epoch": 1.48, + "learning_rate": 7.851632855895988e-05, + "loss": 0.0077, + "step": 292670 + }, + { + "epoch": 1.48, + "learning_rate": 7.850876086594588e-05, + "loss": 0.0068, + "step": 292680 + }, + { + "epoch": 1.48, + "learning_rate": 7.850119317293186e-05, + "loss": 0.0062, + "step": 292690 + }, + { + "epoch": 1.48, + "learning_rate": 7.849362547991785e-05, + "loss": 0.008, + "step": 292700 + }, + { + "epoch": 1.48, + "learning_rate": 7.848605778690385e-05, + "loss": 0.0079, + "step": 292710 + }, + { + "epoch": 1.48, + "learning_rate": 7.847849009388983e-05, + "loss": 0.0072, + "step": 292720 + }, + { + "epoch": 1.48, + "learning_rate": 7.847092240087583e-05, + "loss": 0.0071, + "step": 292730 + }, + { + "epoch": 1.48, + "learning_rate": 7.846335470786181e-05, + "loss": 0.0081, + "step": 292740 + }, + { + "epoch": 1.48, + "learning_rate": 7.84557870148478e-05, + "loss": 0.0061, + "step": 292750 + }, + { + "epoch": 1.48, + "learning_rate": 7.84482193218338e-05, + "loss": 0.0054, + "step": 292760 + }, + { + "epoch": 1.48, + "learning_rate": 7.844065162881978e-05, + "loss": 0.0076, + "step": 292770 + }, + { + "epoch": 1.48, + "learning_rate": 7.843308393580577e-05, + "loss": 0.0063, + "step": 292780 + }, + { + "epoch": 1.48, + "learning_rate": 7.842551624279177e-05, + "loss": 0.0097, + "step": 292790 + }, + { + "epoch": 1.48, + "learning_rate": 7.841794854977775e-05, + "loss": 0.0076, + "step": 292800 + }, + { + "epoch": 1.48, + "learning_rate": 7.841038085676375e-05, + "loss": 0.0086, + "step": 292810 + }, + { + "epoch": 1.48, + "learning_rate": 7.840281316374973e-05, + "loss": 0.006, + "step": 292820 + }, + { + "epoch": 1.48, + "learning_rate": 7.839524547073572e-05, + "loss": 0.0081, + "step": 292830 + }, + { + "epoch": 1.48, + "learning_rate": 7.838767777772172e-05, + "loss": 0.009, + "step": 292840 + }, + { + "epoch": 1.48, + "learning_rate": 7.83801100847077e-05, + "loss": 0.0073, + "step": 292850 + }, + { + "epoch": 1.48, + "learning_rate": 7.83725423916937e-05, + "loss": 0.0068, + "step": 292860 + }, + { + "epoch": 1.48, + "learning_rate": 7.836497469867969e-05, + "loss": 0.0097, + "step": 292870 + }, + { + "epoch": 1.48, + "learning_rate": 7.835740700566567e-05, + "loss": 0.0068, + "step": 292880 + }, + { + "epoch": 1.48, + "learning_rate": 7.834983931265166e-05, + "loss": 0.0042, + "step": 292890 + }, + { + "epoch": 1.48, + "learning_rate": 7.834227161963765e-05, + "loss": 0.0079, + "step": 292900 + }, + { + "epoch": 1.48, + "learning_rate": 7.833470392662364e-05, + "loss": 0.0097, + "step": 292910 + }, + { + "epoch": 1.48, + "learning_rate": 7.832713623360964e-05, + "loss": 0.0059, + "step": 292920 + }, + { + "epoch": 1.48, + "learning_rate": 7.831956854059562e-05, + "loss": 0.0075, + "step": 292930 + }, + { + "epoch": 1.48, + "learning_rate": 7.831200084758161e-05, + "loss": 0.0066, + "step": 292940 + }, + { + "epoch": 1.48, + "learning_rate": 7.830443315456761e-05, + "loss": 0.0074, + "step": 292950 + }, + { + "epoch": 1.48, + "learning_rate": 7.829686546155359e-05, + "loss": 0.008, + "step": 292960 + }, + { + "epoch": 1.48, + "learning_rate": 7.828929776853958e-05, + "loss": 0.0108, + "step": 292970 + }, + { + "epoch": 1.48, + "learning_rate": 7.828173007552558e-05, + "loss": 0.0069, + "step": 292980 + }, + { + "epoch": 1.48, + "learning_rate": 7.827416238251156e-05, + "loss": 0.0047, + "step": 292990 + }, + { + "epoch": 1.48, + "learning_rate": 7.826659468949756e-05, + "loss": 0.0053, + "step": 293000 + }, + { + "epoch": 1.48, + "eval_cer": 0.9144411440194001, + "eval_loss": 0.005583611316978931, + "eval_runtime": 116.624, + "eval_samples_per_second": 17.149, + "eval_steps_per_second": 4.287, + "step": 293000 + }, + { + "epoch": 1.48, + "learning_rate": 7.825902699648354e-05, + "loss": 0.0054, + "step": 293010 + }, + { + "epoch": 1.48, + "learning_rate": 7.825145930346953e-05, + "loss": 0.0113, + "step": 293020 + }, + { + "epoch": 1.48, + "learning_rate": 7.824389161045553e-05, + "loss": 0.0055, + "step": 293030 + }, + { + "epoch": 1.48, + "learning_rate": 7.823632391744151e-05, + "loss": 0.0072, + "step": 293040 + }, + { + "epoch": 1.48, + "learning_rate": 7.82287562244275e-05, + "loss": 0.0078, + "step": 293050 + }, + { + "epoch": 1.48, + "learning_rate": 7.82211885314135e-05, + "loss": 0.0059, + "step": 293060 + }, + { + "epoch": 1.48, + "learning_rate": 7.821362083839948e-05, + "loss": 0.0088, + "step": 293070 + }, + { + "epoch": 1.48, + "learning_rate": 7.820605314538548e-05, + "loss": 0.0097, + "step": 293080 + }, + { + "epoch": 1.48, + "learning_rate": 7.819848545237146e-05, + "loss": 0.0066, + "step": 293090 + }, + { + "epoch": 1.48, + "learning_rate": 7.819091775935745e-05, + "loss": 0.0094, + "step": 293100 + }, + { + "epoch": 1.48, + "learning_rate": 7.818335006634345e-05, + "loss": 0.008, + "step": 293110 + }, + { + "epoch": 1.48, + "learning_rate": 7.817578237332943e-05, + "loss": 0.0072, + "step": 293120 + }, + { + "epoch": 1.48, + "learning_rate": 7.816821468031542e-05, + "loss": 0.0096, + "step": 293130 + }, + { + "epoch": 1.48, + "learning_rate": 7.816064698730142e-05, + "loss": 0.0061, + "step": 293140 + }, + { + "epoch": 1.48, + "learning_rate": 7.81530792942874e-05, + "loss": 0.0085, + "step": 293150 + }, + { + "epoch": 1.48, + "learning_rate": 7.81455116012734e-05, + "loss": 0.0087, + "step": 293160 + }, + { + "epoch": 1.48, + "learning_rate": 7.813794390825936e-05, + "loss": 0.0083, + "step": 293170 + }, + { + "epoch": 1.48, + "learning_rate": 7.813037621524536e-05, + "loss": 0.0067, + "step": 293180 + }, + { + "epoch": 1.48, + "learning_rate": 7.812280852223134e-05, + "loss": 0.0076, + "step": 293190 + }, + { + "epoch": 1.48, + "learning_rate": 7.811524082921733e-05, + "loss": 0.0067, + "step": 293200 + }, + { + "epoch": 1.48, + "learning_rate": 7.810767313620333e-05, + "loss": 0.009, + "step": 293210 + }, + { + "epoch": 1.48, + "learning_rate": 7.810010544318931e-05, + "loss": 0.0053, + "step": 293220 + }, + { + "epoch": 1.48, + "learning_rate": 7.80925377501753e-05, + "loss": 0.0089, + "step": 293230 + }, + { + "epoch": 1.48, + "learning_rate": 7.80849700571613e-05, + "loss": 0.0068, + "step": 293240 + }, + { + "epoch": 1.48, + "learning_rate": 7.807740236414728e-05, + "loss": 0.0063, + "step": 293250 + }, + { + "epoch": 1.48, + "learning_rate": 7.806983467113328e-05, + "loss": 0.0076, + "step": 293260 + }, + { + "epoch": 1.48, + "learning_rate": 7.806226697811926e-05, + "loss": 0.0059, + "step": 293270 + }, + { + "epoch": 1.48, + "learning_rate": 7.805469928510525e-05, + "loss": 0.0082, + "step": 293280 + }, + { + "epoch": 1.48, + "learning_rate": 7.804713159209125e-05, + "loss": 0.0058, + "step": 293290 + }, + { + "epoch": 1.48, + "learning_rate": 7.803956389907723e-05, + "loss": 0.0079, + "step": 293300 + }, + { + "epoch": 1.48, + "learning_rate": 7.803199620606322e-05, + "loss": 0.0087, + "step": 293310 + }, + { + "epoch": 1.48, + "learning_rate": 7.802442851304922e-05, + "loss": 0.0082, + "step": 293320 + }, + { + "epoch": 1.48, + "learning_rate": 7.80168608200352e-05, + "loss": 0.0075, + "step": 293330 + }, + { + "epoch": 1.48, + "learning_rate": 7.80092931270212e-05, + "loss": 0.0079, + "step": 293340 + }, + { + "epoch": 1.48, + "learning_rate": 7.800172543400718e-05, + "loss": 0.0084, + "step": 293350 + }, + { + "epoch": 1.48, + "learning_rate": 7.799415774099317e-05, + "loss": 0.0075, + "step": 293360 + }, + { + "epoch": 1.48, + "learning_rate": 7.798659004797917e-05, + "loss": 0.0075, + "step": 293370 + }, + { + "epoch": 1.48, + "learning_rate": 7.797902235496515e-05, + "loss": 0.0057, + "step": 293380 + }, + { + "epoch": 1.48, + "learning_rate": 7.797145466195114e-05, + "loss": 0.0112, + "step": 293390 + }, + { + "epoch": 1.48, + "learning_rate": 7.796388696893714e-05, + "loss": 0.0076, + "step": 293400 + }, + { + "epoch": 1.48, + "learning_rate": 7.795631927592312e-05, + "loss": 0.0054, + "step": 293410 + }, + { + "epoch": 1.48, + "learning_rate": 7.794875158290912e-05, + "loss": 0.0068, + "step": 293420 + }, + { + "epoch": 1.48, + "learning_rate": 7.794118388989511e-05, + "loss": 0.0087, + "step": 293430 + }, + { + "epoch": 1.48, + "learning_rate": 7.793361619688109e-05, + "loss": 0.0066, + "step": 293440 + }, + { + "epoch": 1.48, + "learning_rate": 7.792604850386709e-05, + "loss": 0.0069, + "step": 293450 + }, + { + "epoch": 1.48, + "learning_rate": 7.791848081085307e-05, + "loss": 0.0067, + "step": 293460 + }, + { + "epoch": 1.48, + "learning_rate": 7.791091311783906e-05, + "loss": 0.0058, + "step": 293470 + }, + { + "epoch": 1.48, + "learning_rate": 7.790334542482506e-05, + "loss": 0.0075, + "step": 293480 + }, + { + "epoch": 1.48, + "learning_rate": 7.789577773181104e-05, + "loss": 0.0092, + "step": 293490 + }, + { + "epoch": 1.48, + "learning_rate": 7.788821003879703e-05, + "loss": 0.0085, + "step": 293500 + }, + { + "epoch": 1.48, + "learning_rate": 7.788064234578303e-05, + "loss": 0.0095, + "step": 293510 + }, + { + "epoch": 1.48, + "learning_rate": 7.787307465276901e-05, + "loss": 0.0087, + "step": 293520 + }, + { + "epoch": 1.48, + "learning_rate": 7.7865506959755e-05, + "loss": 0.0085, + "step": 293530 + }, + { + "epoch": 1.48, + "learning_rate": 7.785793926674099e-05, + "loss": 0.0071, + "step": 293540 + }, + { + "epoch": 1.48, + "learning_rate": 7.785037157372698e-05, + "loss": 0.0111, + "step": 293550 + }, + { + "epoch": 1.48, + "learning_rate": 7.784280388071298e-05, + "loss": 0.0065, + "step": 293560 + }, + { + "epoch": 1.48, + "learning_rate": 7.783523618769896e-05, + "loss": 0.0067, + "step": 293570 + }, + { + "epoch": 1.48, + "learning_rate": 7.782766849468495e-05, + "loss": 0.0064, + "step": 293580 + }, + { + "epoch": 1.48, + "learning_rate": 7.782010080167095e-05, + "loss": 0.0071, + "step": 293590 + }, + { + "epoch": 1.48, + "learning_rate": 7.781253310865693e-05, + "loss": 0.0069, + "step": 293600 + }, + { + "epoch": 1.48, + "learning_rate": 7.780496541564293e-05, + "loss": 0.0073, + "step": 293610 + }, + { + "epoch": 1.48, + "learning_rate": 7.77973977226289e-05, + "loss": 0.0093, + "step": 293620 + }, + { + "epoch": 1.48, + "learning_rate": 7.77898300296149e-05, + "loss": 0.0089, + "step": 293630 + }, + { + "epoch": 1.48, + "learning_rate": 7.77822623366009e-05, + "loss": 0.0068, + "step": 293640 + }, + { + "epoch": 1.48, + "learning_rate": 7.777469464358688e-05, + "loss": 0.0068, + "step": 293650 + }, + { + "epoch": 1.48, + "learning_rate": 7.776712695057287e-05, + "loss": 0.0077, + "step": 293660 + }, + { + "epoch": 1.48, + "learning_rate": 7.775955925755887e-05, + "loss": 0.0062, + "step": 293670 + }, + { + "epoch": 1.48, + "learning_rate": 7.775199156454485e-05, + "loss": 0.007, + "step": 293680 + }, + { + "epoch": 1.48, + "learning_rate": 7.774442387153084e-05, + "loss": 0.0084, + "step": 293690 + }, + { + "epoch": 1.48, + "learning_rate": 7.773685617851683e-05, + "loss": 0.0106, + "step": 293700 + }, + { + "epoch": 1.48, + "learning_rate": 7.772928848550282e-05, + "loss": 0.0088, + "step": 293710 + }, + { + "epoch": 1.48, + "learning_rate": 7.772172079248882e-05, + "loss": 0.006, + "step": 293720 + }, + { + "epoch": 1.48, + "learning_rate": 7.77141530994748e-05, + "loss": 0.0064, + "step": 293730 + }, + { + "epoch": 1.48, + "learning_rate": 7.770658540646079e-05, + "loss": 0.0088, + "step": 293740 + }, + { + "epoch": 1.48, + "learning_rate": 7.769901771344679e-05, + "loss": 0.0077, + "step": 293750 + }, + { + "epoch": 1.48, + "learning_rate": 7.769145002043277e-05, + "loss": 0.007, + "step": 293760 + }, + { + "epoch": 1.48, + "learning_rate": 7.768388232741876e-05, + "loss": 0.0079, + "step": 293770 + }, + { + "epoch": 1.48, + "learning_rate": 7.767631463440475e-05, + "loss": 0.0062, + "step": 293780 + }, + { + "epoch": 1.48, + "learning_rate": 7.766874694139074e-05, + "loss": 0.0079, + "step": 293790 + }, + { + "epoch": 1.48, + "learning_rate": 7.766117924837671e-05, + "loss": 0.006, + "step": 293800 + }, + { + "epoch": 1.48, + "learning_rate": 7.76536115553627e-05, + "loss": 0.0064, + "step": 293810 + }, + { + "epoch": 1.48, + "learning_rate": 7.76460438623487e-05, + "loss": 0.0076, + "step": 293820 + }, + { + "epoch": 1.48, + "learning_rate": 7.763847616933468e-05, + "loss": 0.0067, + "step": 293830 + }, + { + "epoch": 1.48, + "learning_rate": 7.763090847632067e-05, + "loss": 0.0071, + "step": 293840 + }, + { + "epoch": 1.48, + "learning_rate": 7.762334078330667e-05, + "loss": 0.01, + "step": 293850 + }, + { + "epoch": 1.48, + "learning_rate": 7.761577309029265e-05, + "loss": 0.0086, + "step": 293860 + }, + { + "epoch": 1.48, + "learning_rate": 7.760820539727865e-05, + "loss": 0.007, + "step": 293870 + }, + { + "epoch": 1.48, + "learning_rate": 7.760063770426464e-05, + "loss": 0.0063, + "step": 293880 + }, + { + "epoch": 1.48, + "learning_rate": 7.759307001125062e-05, + "loss": 0.0053, + "step": 293890 + }, + { + "epoch": 1.48, + "learning_rate": 7.758550231823662e-05, + "loss": 0.0071, + "step": 293900 + }, + { + "epoch": 1.48, + "learning_rate": 7.75779346252226e-05, + "loss": 0.0094, + "step": 293910 + }, + { + "epoch": 1.48, + "learning_rate": 7.75703669322086e-05, + "loss": 0.0071, + "step": 293920 + }, + { + "epoch": 1.48, + "learning_rate": 7.756279923919459e-05, + "loss": 0.0054, + "step": 293930 + }, + { + "epoch": 1.48, + "learning_rate": 7.755523154618057e-05, + "loss": 0.0081, + "step": 293940 + }, + { + "epoch": 1.48, + "learning_rate": 7.754766385316657e-05, + "loss": 0.0083, + "step": 293950 + }, + { + "epoch": 1.48, + "learning_rate": 7.754009616015256e-05, + "loss": 0.0053, + "step": 293960 + }, + { + "epoch": 1.48, + "learning_rate": 7.753252846713854e-05, + "loss": 0.0091, + "step": 293970 + }, + { + "epoch": 1.48, + "learning_rate": 7.752496077412454e-05, + "loss": 0.0072, + "step": 293980 + }, + { + "epoch": 1.48, + "learning_rate": 7.751739308111052e-05, + "loss": 0.009, + "step": 293990 + }, + { + "epoch": 1.48, + "learning_rate": 7.750982538809651e-05, + "loss": 0.0062, + "step": 294000 + }, + { + "epoch": 1.48, + "eval_cer": 0.9144294992658953, + "eval_loss": 0.005396208260208368, + "eval_runtime": 116.6359, + "eval_samples_per_second": 17.147, + "eval_steps_per_second": 4.287, + "step": 294000 + }, + { + "epoch": 1.48, + "learning_rate": 7.750225769508251e-05, + "loss": 0.0058, + "step": 294010 + }, + { + "epoch": 1.48, + "learning_rate": 7.749469000206849e-05, + "loss": 0.006, + "step": 294020 + }, + { + "epoch": 1.48, + "learning_rate": 7.748712230905448e-05, + "loss": 0.0066, + "step": 294030 + }, + { + "epoch": 1.48, + "learning_rate": 7.747955461604048e-05, + "loss": 0.0085, + "step": 294040 + }, + { + "epoch": 1.48, + "learning_rate": 7.747198692302646e-05, + "loss": 0.0048, + "step": 294050 + }, + { + "epoch": 1.48, + "learning_rate": 7.746441923001246e-05, + "loss": 0.0075, + "step": 294060 + }, + { + "epoch": 1.48, + "learning_rate": 7.745685153699844e-05, + "loss": 0.0087, + "step": 294070 + }, + { + "epoch": 1.48, + "learning_rate": 7.744928384398443e-05, + "loss": 0.0077, + "step": 294080 + }, + { + "epoch": 1.48, + "learning_rate": 7.744171615097043e-05, + "loss": 0.0088, + "step": 294090 + }, + { + "epoch": 1.48, + "learning_rate": 7.743414845795641e-05, + "loss": 0.0064, + "step": 294100 + }, + { + "epoch": 1.48, + "learning_rate": 7.74265807649424e-05, + "loss": 0.0068, + "step": 294110 + }, + { + "epoch": 1.48, + "learning_rate": 7.74190130719284e-05, + "loss": 0.0055, + "step": 294120 + }, + { + "epoch": 1.48, + "learning_rate": 7.741144537891438e-05, + "loss": 0.0076, + "step": 294130 + }, + { + "epoch": 1.48, + "learning_rate": 7.740387768590038e-05, + "loss": 0.0072, + "step": 294140 + }, + { + "epoch": 1.48, + "learning_rate": 7.739630999288636e-05, + "loss": 0.0065, + "step": 294150 + }, + { + "epoch": 1.48, + "learning_rate": 7.738874229987235e-05, + "loss": 0.0068, + "step": 294160 + }, + { + "epoch": 1.48, + "learning_rate": 7.738117460685835e-05, + "loss": 0.0074, + "step": 294170 + }, + { + "epoch": 1.48, + "learning_rate": 7.737360691384433e-05, + "loss": 0.0088, + "step": 294180 + }, + { + "epoch": 1.48, + "learning_rate": 7.736603922083032e-05, + "loss": 0.0063, + "step": 294190 + }, + { + "epoch": 1.48, + "learning_rate": 7.735847152781632e-05, + "loss": 0.0126, + "step": 294200 + }, + { + "epoch": 1.48, + "learning_rate": 7.73509038348023e-05, + "loss": 0.0069, + "step": 294210 + }, + { + "epoch": 1.48, + "learning_rate": 7.73433361417883e-05, + "loss": 0.0063, + "step": 294220 + }, + { + "epoch": 1.48, + "learning_rate": 7.733576844877428e-05, + "loss": 0.0076, + "step": 294230 + }, + { + "epoch": 1.48, + "learning_rate": 7.732820075576027e-05, + "loss": 0.0084, + "step": 294240 + }, + { + "epoch": 1.48, + "learning_rate": 7.732063306274627e-05, + "loss": 0.0106, + "step": 294250 + }, + { + "epoch": 1.48, + "learning_rate": 7.731306536973225e-05, + "loss": 0.0063, + "step": 294260 + }, + { + "epoch": 1.48, + "learning_rate": 7.730549767671824e-05, + "loss": 0.0064, + "step": 294270 + }, + { + "epoch": 1.48, + "learning_rate": 7.729792998370424e-05, + "loss": 0.0059, + "step": 294280 + }, + { + "epoch": 1.48, + "learning_rate": 7.729036229069022e-05, + "loss": 0.008, + "step": 294290 + }, + { + "epoch": 1.48, + "learning_rate": 7.728279459767621e-05, + "loss": 0.006, + "step": 294300 + }, + { + "epoch": 1.48, + "learning_rate": 7.72752269046622e-05, + "loss": 0.0069, + "step": 294310 + }, + { + "epoch": 1.48, + "learning_rate": 7.726765921164819e-05, + "loss": 0.0056, + "step": 294320 + }, + { + "epoch": 1.48, + "learning_rate": 7.726009151863419e-05, + "loss": 0.0085, + "step": 294330 + }, + { + "epoch": 1.48, + "learning_rate": 7.725252382562017e-05, + "loss": 0.006, + "step": 294340 + }, + { + "epoch": 1.49, + "learning_rate": 7.724495613260616e-05, + "loss": 0.0062, + "step": 294350 + }, + { + "epoch": 1.49, + "learning_rate": 7.723738843959216e-05, + "loss": 0.0078, + "step": 294360 + }, + { + "epoch": 1.49, + "learning_rate": 7.722982074657814e-05, + "loss": 0.0065, + "step": 294370 + }, + { + "epoch": 1.49, + "learning_rate": 7.722225305356413e-05, + "loss": 0.0072, + "step": 294380 + }, + { + "epoch": 1.49, + "learning_rate": 7.721468536055013e-05, + "loss": 0.0113, + "step": 294390 + }, + { + "epoch": 1.49, + "learning_rate": 7.720711766753611e-05, + "loss": 0.008, + "step": 294400 + }, + { + "epoch": 1.49, + "learning_rate": 7.71995499745221e-05, + "loss": 0.0138, + "step": 294410 + }, + { + "epoch": 1.49, + "learning_rate": 7.719198228150809e-05, + "loss": 0.0105, + "step": 294420 + }, + { + "epoch": 1.49, + "learning_rate": 7.718441458849407e-05, + "loss": 0.007, + "step": 294430 + }, + { + "epoch": 1.49, + "learning_rate": 7.717684689548005e-05, + "loss": 0.0082, + "step": 294440 + }, + { + "epoch": 1.49, + "learning_rate": 7.716927920246604e-05, + "loss": 0.0067, + "step": 294450 + }, + { + "epoch": 1.49, + "learning_rate": 7.716171150945204e-05, + "loss": 0.0069, + "step": 294460 + }, + { + "epoch": 1.49, + "learning_rate": 7.715414381643802e-05, + "loss": 0.0057, + "step": 294470 + }, + { + "epoch": 1.49, + "learning_rate": 7.714657612342402e-05, + "loss": 0.0078, + "step": 294480 + }, + { + "epoch": 1.49, + "learning_rate": 7.713900843041001e-05, + "loss": 0.0061, + "step": 294490 + }, + { + "epoch": 1.49, + "learning_rate": 7.713144073739599e-05, + "loss": 0.0054, + "step": 294500 + }, + { + "epoch": 1.49, + "learning_rate": 7.712387304438199e-05, + "loss": 0.005, + "step": 294510 + }, + { + "epoch": 1.49, + "learning_rate": 7.711630535136797e-05, + "loss": 0.0081, + "step": 294520 + }, + { + "epoch": 1.49, + "learning_rate": 7.710873765835396e-05, + "loss": 0.0065, + "step": 294530 + }, + { + "epoch": 1.49, + "learning_rate": 7.710116996533996e-05, + "loss": 0.0077, + "step": 294540 + }, + { + "epoch": 1.49, + "learning_rate": 7.709360227232594e-05, + "loss": 0.0073, + "step": 294550 + }, + { + "epoch": 1.49, + "learning_rate": 7.708603457931193e-05, + "loss": 0.0071, + "step": 294560 + }, + { + "epoch": 1.49, + "learning_rate": 7.707846688629793e-05, + "loss": 0.0075, + "step": 294570 + }, + { + "epoch": 1.49, + "learning_rate": 7.707089919328391e-05, + "loss": 0.0074, + "step": 294580 + }, + { + "epoch": 1.49, + "learning_rate": 7.70633315002699e-05, + "loss": 0.0078, + "step": 294590 + }, + { + "epoch": 1.49, + "learning_rate": 7.705576380725589e-05, + "loss": 0.0102, + "step": 294600 + }, + { + "epoch": 1.49, + "learning_rate": 7.704819611424188e-05, + "loss": 0.0057, + "step": 294610 + }, + { + "epoch": 1.49, + "learning_rate": 7.704062842122788e-05, + "loss": 0.007, + "step": 294620 + }, + { + "epoch": 1.49, + "learning_rate": 7.703306072821386e-05, + "loss": 0.0061, + "step": 294630 + }, + { + "epoch": 1.49, + "learning_rate": 7.702549303519985e-05, + "loss": 0.006, + "step": 294640 + }, + { + "epoch": 1.49, + "learning_rate": 7.701792534218585e-05, + "loss": 0.0079, + "step": 294650 + }, + { + "epoch": 1.49, + "learning_rate": 7.701035764917183e-05, + "loss": 0.01, + "step": 294660 + }, + { + "epoch": 1.49, + "learning_rate": 7.700278995615783e-05, + "loss": 0.008, + "step": 294670 + }, + { + "epoch": 1.49, + "learning_rate": 7.699522226314381e-05, + "loss": 0.0068, + "step": 294680 + }, + { + "epoch": 1.49, + "learning_rate": 7.69876545701298e-05, + "loss": 0.0083, + "step": 294690 + }, + { + "epoch": 1.49, + "learning_rate": 7.69800868771158e-05, + "loss": 0.007, + "step": 294700 + }, + { + "epoch": 1.49, + "learning_rate": 7.697251918410178e-05, + "loss": 0.0062, + "step": 294710 + }, + { + "epoch": 1.49, + "learning_rate": 7.696495149108777e-05, + "loss": 0.0075, + "step": 294720 + }, + { + "epoch": 1.49, + "learning_rate": 7.695738379807377e-05, + "loss": 0.0099, + "step": 294730 + }, + { + "epoch": 1.49, + "learning_rate": 7.694981610505975e-05, + "loss": 0.0068, + "step": 294740 + }, + { + "epoch": 1.49, + "learning_rate": 7.694224841204574e-05, + "loss": 0.0059, + "step": 294750 + }, + { + "epoch": 1.49, + "learning_rate": 7.693468071903173e-05, + "loss": 0.0087, + "step": 294760 + }, + { + "epoch": 1.49, + "learning_rate": 7.692711302601772e-05, + "loss": 0.01, + "step": 294770 + }, + { + "epoch": 1.49, + "learning_rate": 7.691954533300372e-05, + "loss": 0.0083, + "step": 294780 + }, + { + "epoch": 1.49, + "learning_rate": 7.69119776399897e-05, + "loss": 0.0075, + "step": 294790 + }, + { + "epoch": 1.49, + "learning_rate": 7.690440994697569e-05, + "loss": 0.0076, + "step": 294800 + }, + { + "epoch": 1.49, + "learning_rate": 7.689684225396169e-05, + "loss": 0.006, + "step": 294810 + }, + { + "epoch": 1.49, + "learning_rate": 7.688927456094767e-05, + "loss": 0.0067, + "step": 294820 + }, + { + "epoch": 1.49, + "learning_rate": 7.688170686793366e-05, + "loss": 0.0067, + "step": 294830 + }, + { + "epoch": 1.49, + "learning_rate": 7.687413917491965e-05, + "loss": 0.0082, + "step": 294840 + }, + { + "epoch": 1.49, + "learning_rate": 7.686657148190564e-05, + "loss": 0.0059, + "step": 294850 + }, + { + "epoch": 1.49, + "learning_rate": 7.685900378889164e-05, + "loss": 0.0101, + "step": 294860 + }, + { + "epoch": 1.49, + "learning_rate": 7.685143609587762e-05, + "loss": 0.0071, + "step": 294870 + }, + { + "epoch": 1.49, + "learning_rate": 7.684386840286361e-05, + "loss": 0.0056, + "step": 294880 + }, + { + "epoch": 1.49, + "learning_rate": 7.683630070984961e-05, + "loss": 0.0071, + "step": 294890 + }, + { + "epoch": 1.49, + "learning_rate": 7.682873301683559e-05, + "loss": 0.0077, + "step": 294900 + }, + { + "epoch": 1.49, + "learning_rate": 7.682116532382158e-05, + "loss": 0.0056, + "step": 294910 + }, + { + "epoch": 1.49, + "learning_rate": 7.681359763080758e-05, + "loss": 0.0062, + "step": 294920 + }, + { + "epoch": 1.49, + "learning_rate": 7.680602993779356e-05, + "loss": 0.0079, + "step": 294930 + }, + { + "epoch": 1.49, + "learning_rate": 7.679846224477955e-05, + "loss": 0.0063, + "step": 294940 + }, + { + "epoch": 1.49, + "learning_rate": 7.679089455176554e-05, + "loss": 0.0067, + "step": 294950 + }, + { + "epoch": 1.49, + "learning_rate": 7.678332685875153e-05, + "loss": 0.0073, + "step": 294960 + }, + { + "epoch": 1.49, + "learning_rate": 7.677575916573753e-05, + "loss": 0.007, + "step": 294970 + }, + { + "epoch": 1.49, + "learning_rate": 7.676819147272351e-05, + "loss": 0.0083, + "step": 294980 + }, + { + "epoch": 1.49, + "learning_rate": 7.67606237797095e-05, + "loss": 0.0077, + "step": 294990 + }, + { + "epoch": 1.49, + "learning_rate": 7.67530560866955e-05, + "loss": 0.0065, + "step": 295000 + }, + { + "epoch": 1.49, + "eval_cer": 0.9144304696620207, + "eval_loss": 0.005469324998557568, + "eval_runtime": 116.6115, + "eval_samples_per_second": 17.151, + "eval_steps_per_second": 4.288, + "step": 295000 + }, + { + "epoch": 1.49, + "learning_rate": 7.674548839368148e-05, + "loss": 0.0067, + "step": 295010 + }, + { + "epoch": 1.49, + "learning_rate": 7.673792070066747e-05, + "loss": 0.0055, + "step": 295020 + }, + { + "epoch": 1.49, + "learning_rate": 7.673035300765346e-05, + "loss": 0.007, + "step": 295030 + }, + { + "epoch": 1.49, + "learning_rate": 7.672278531463945e-05, + "loss": 0.01, + "step": 295040 + }, + { + "epoch": 1.49, + "learning_rate": 7.671521762162545e-05, + "loss": 0.0061, + "step": 295050 + }, + { + "epoch": 1.49, + "learning_rate": 7.670764992861141e-05, + "loss": 0.0081, + "step": 295060 + }, + { + "epoch": 1.49, + "learning_rate": 7.670008223559741e-05, + "loss": 0.0063, + "step": 295070 + }, + { + "epoch": 1.49, + "learning_rate": 7.669251454258339e-05, + "loss": 0.007, + "step": 295080 + }, + { + "epoch": 1.49, + "learning_rate": 7.668494684956938e-05, + "loss": 0.0096, + "step": 295090 + }, + { + "epoch": 1.49, + "learning_rate": 7.667737915655538e-05, + "loss": 0.0078, + "step": 295100 + }, + { + "epoch": 1.49, + "learning_rate": 7.666981146354136e-05, + "loss": 0.0063, + "step": 295110 + }, + { + "epoch": 1.49, + "learning_rate": 7.666224377052736e-05, + "loss": 0.0061, + "step": 295120 + }, + { + "epoch": 1.49, + "learning_rate": 7.665467607751334e-05, + "loss": 0.0099, + "step": 295130 + }, + { + "epoch": 1.49, + "learning_rate": 7.664710838449933e-05, + "loss": 0.0072, + "step": 295140 + }, + { + "epoch": 1.49, + "learning_rate": 7.663954069148533e-05, + "loss": 0.0074, + "step": 295150 + }, + { + "epoch": 1.49, + "learning_rate": 7.663197299847131e-05, + "loss": 0.0067, + "step": 295160 + }, + { + "epoch": 1.49, + "learning_rate": 7.66244053054573e-05, + "loss": 0.0086, + "step": 295170 + }, + { + "epoch": 1.49, + "learning_rate": 7.66168376124433e-05, + "loss": 0.0072, + "step": 295180 + }, + { + "epoch": 1.49, + "learning_rate": 7.660926991942928e-05, + "loss": 0.0104, + "step": 295190 + }, + { + "epoch": 1.49, + "learning_rate": 7.660170222641528e-05, + "loss": 0.0069, + "step": 295200 + }, + { + "epoch": 1.49, + "learning_rate": 7.659413453340126e-05, + "loss": 0.0116, + "step": 295210 + }, + { + "epoch": 1.49, + "learning_rate": 7.658656684038725e-05, + "loss": 0.0061, + "step": 295220 + }, + { + "epoch": 1.49, + "learning_rate": 7.657899914737325e-05, + "loss": 0.0082, + "step": 295230 + }, + { + "epoch": 1.49, + "learning_rate": 7.657143145435923e-05, + "loss": 0.0071, + "step": 295240 + }, + { + "epoch": 1.49, + "learning_rate": 7.656386376134522e-05, + "loss": 0.0071, + "step": 295250 + }, + { + "epoch": 1.49, + "learning_rate": 7.655629606833122e-05, + "loss": 0.0068, + "step": 295260 + }, + { + "epoch": 1.49, + "learning_rate": 7.65487283753172e-05, + "loss": 0.0085, + "step": 295270 + }, + { + "epoch": 1.49, + "learning_rate": 7.65411606823032e-05, + "loss": 0.0096, + "step": 295280 + }, + { + "epoch": 1.49, + "learning_rate": 7.653359298928918e-05, + "loss": 0.0075, + "step": 295290 + }, + { + "epoch": 1.49, + "learning_rate": 7.652602529627517e-05, + "loss": 0.0094, + "step": 295300 + }, + { + "epoch": 1.49, + "learning_rate": 7.651845760326117e-05, + "loss": 0.0071, + "step": 295310 + }, + { + "epoch": 1.49, + "learning_rate": 7.651088991024715e-05, + "loss": 0.0076, + "step": 295320 + }, + { + "epoch": 1.49, + "learning_rate": 7.650332221723314e-05, + "loss": 0.0115, + "step": 295330 + }, + { + "epoch": 1.49, + "learning_rate": 7.649575452421914e-05, + "loss": 0.0063, + "step": 295340 + }, + { + "epoch": 1.49, + "learning_rate": 7.648818683120512e-05, + "loss": 0.0067, + "step": 295350 + }, + { + "epoch": 1.49, + "learning_rate": 7.648061913819111e-05, + "loss": 0.0072, + "step": 295360 + }, + { + "epoch": 1.49, + "learning_rate": 7.647305144517711e-05, + "loss": 0.0073, + "step": 295370 + }, + { + "epoch": 1.49, + "learning_rate": 7.646548375216309e-05, + "loss": 0.0067, + "step": 295380 + }, + { + "epoch": 1.49, + "learning_rate": 7.645791605914909e-05, + "loss": 0.0086, + "step": 295390 + }, + { + "epoch": 1.49, + "learning_rate": 7.645034836613507e-05, + "loss": 0.004, + "step": 295400 + }, + { + "epoch": 1.49, + "learning_rate": 7.644278067312106e-05, + "loss": 0.0078, + "step": 295410 + }, + { + "epoch": 1.49, + "learning_rate": 7.643521298010706e-05, + "loss": 0.0082, + "step": 295420 + }, + { + "epoch": 1.49, + "learning_rate": 7.642764528709304e-05, + "loss": 0.0074, + "step": 295430 + }, + { + "epoch": 1.49, + "learning_rate": 7.642007759407903e-05, + "loss": 0.0063, + "step": 295440 + }, + { + "epoch": 1.49, + "learning_rate": 7.641250990106503e-05, + "loss": 0.0112, + "step": 295450 + }, + { + "epoch": 1.49, + "learning_rate": 7.640494220805101e-05, + "loss": 0.0077, + "step": 295460 + }, + { + "epoch": 1.49, + "learning_rate": 7.6397374515037e-05, + "loss": 0.0088, + "step": 295470 + }, + { + "epoch": 1.49, + "learning_rate": 7.638980682202299e-05, + "loss": 0.0057, + "step": 295480 + }, + { + "epoch": 1.49, + "learning_rate": 7.638223912900898e-05, + "loss": 0.0069, + "step": 295490 + }, + { + "epoch": 1.49, + "learning_rate": 7.637467143599498e-05, + "loss": 0.0092, + "step": 295500 + }, + { + "epoch": 1.49, + "learning_rate": 7.636710374298096e-05, + "loss": 0.0058, + "step": 295510 + }, + { + "epoch": 1.49, + "learning_rate": 7.635953604996695e-05, + "loss": 0.0087, + "step": 295520 + }, + { + "epoch": 1.49, + "learning_rate": 7.635196835695295e-05, + "loss": 0.0067, + "step": 295530 + }, + { + "epoch": 1.49, + "learning_rate": 7.634440066393893e-05, + "loss": 0.0073, + "step": 295540 + }, + { + "epoch": 1.49, + "learning_rate": 7.633683297092492e-05, + "loss": 0.0063, + "step": 295550 + }, + { + "epoch": 1.49, + "learning_rate": 7.63292652779109e-05, + "loss": 0.0087, + "step": 295560 + }, + { + "epoch": 1.49, + "learning_rate": 7.63216975848969e-05, + "loss": 0.0076, + "step": 295570 + }, + { + "epoch": 1.49, + "learning_rate": 7.63141298918829e-05, + "loss": 0.007, + "step": 295580 + }, + { + "epoch": 1.49, + "learning_rate": 7.630656219886888e-05, + "loss": 0.0091, + "step": 295590 + }, + { + "epoch": 1.49, + "learning_rate": 7.629899450585487e-05, + "loss": 0.0062, + "step": 295600 + }, + { + "epoch": 1.49, + "learning_rate": 7.629142681284087e-05, + "loss": 0.0067, + "step": 295610 + }, + { + "epoch": 1.49, + "learning_rate": 7.628385911982685e-05, + "loss": 0.0065, + "step": 295620 + }, + { + "epoch": 1.49, + "learning_rate": 7.627629142681284e-05, + "loss": 0.007, + "step": 295630 + }, + { + "epoch": 1.49, + "learning_rate": 7.626872373379882e-05, + "loss": 0.0077, + "step": 295640 + }, + { + "epoch": 1.49, + "learning_rate": 7.626115604078482e-05, + "loss": 0.0068, + "step": 295650 + }, + { + "epoch": 1.49, + "learning_rate": 7.625358834777081e-05, + "loss": 0.0072, + "step": 295660 + }, + { + "epoch": 1.49, + "learning_rate": 7.62460206547568e-05, + "loss": 0.0048, + "step": 295670 + }, + { + "epoch": 1.49, + "learning_rate": 7.623845296174279e-05, + "loss": 0.0106, + "step": 295680 + }, + { + "epoch": 1.49, + "learning_rate": 7.623088526872876e-05, + "loss": 0.0065, + "step": 295690 + }, + { + "epoch": 1.49, + "learning_rate": 7.622331757571475e-05, + "loss": 0.0078, + "step": 295700 + }, + { + "epoch": 1.49, + "learning_rate": 7.621574988270075e-05, + "loss": 0.0067, + "step": 295710 + }, + { + "epoch": 1.49, + "learning_rate": 7.620818218968673e-05, + "loss": 0.007, + "step": 295720 + }, + { + "epoch": 1.49, + "learning_rate": 7.620061449667273e-05, + "loss": 0.0092, + "step": 295730 + }, + { + "epoch": 1.49, + "learning_rate": 7.619304680365871e-05, + "loss": 0.0069, + "step": 295740 + }, + { + "epoch": 1.49, + "learning_rate": 7.61854791106447e-05, + "loss": 0.0068, + "step": 295750 + }, + { + "epoch": 1.49, + "learning_rate": 7.61779114176307e-05, + "loss": 0.0075, + "step": 295760 + }, + { + "epoch": 1.49, + "learning_rate": 7.617034372461668e-05, + "loss": 0.0059, + "step": 295770 + }, + { + "epoch": 1.49, + "learning_rate": 7.616277603160267e-05, + "loss": 0.008, + "step": 295780 + }, + { + "epoch": 1.49, + "learning_rate": 7.615520833858867e-05, + "loss": 0.0061, + "step": 295790 + }, + { + "epoch": 1.49, + "learning_rate": 7.614764064557465e-05, + "loss": 0.0073, + "step": 295800 + }, + { + "epoch": 1.49, + "learning_rate": 7.614007295256064e-05, + "loss": 0.0059, + "step": 295810 + }, + { + "epoch": 1.49, + "learning_rate": 7.613250525954664e-05, + "loss": 0.0083, + "step": 295820 + }, + { + "epoch": 1.49, + "learning_rate": 7.612493756653262e-05, + "loss": 0.0059, + "step": 295830 + }, + { + "epoch": 1.49, + "learning_rate": 7.611736987351862e-05, + "loss": 0.008, + "step": 295840 + }, + { + "epoch": 1.49, + "learning_rate": 7.61098021805046e-05, + "loss": 0.0081, + "step": 295850 + }, + { + "epoch": 1.49, + "learning_rate": 7.610223448749059e-05, + "loss": 0.0067, + "step": 295860 + }, + { + "epoch": 1.49, + "learning_rate": 7.609466679447659e-05, + "loss": 0.0074, + "step": 295870 + }, + { + "epoch": 1.49, + "learning_rate": 7.608709910146257e-05, + "loss": 0.0079, + "step": 295880 + }, + { + "epoch": 1.49, + "learning_rate": 7.607953140844856e-05, + "loss": 0.0084, + "step": 295890 + }, + { + "epoch": 1.49, + "learning_rate": 7.607196371543456e-05, + "loss": 0.0095, + "step": 295900 + }, + { + "epoch": 1.49, + "learning_rate": 7.606439602242054e-05, + "loss": 0.0072, + "step": 295910 + }, + { + "epoch": 1.49, + "learning_rate": 7.605682832940654e-05, + "loss": 0.0082, + "step": 295920 + }, + { + "epoch": 1.49, + "learning_rate": 7.604926063639252e-05, + "loss": 0.0078, + "step": 295930 + }, + { + "epoch": 1.49, + "learning_rate": 7.604169294337851e-05, + "loss": 0.0071, + "step": 295940 + }, + { + "epoch": 1.49, + "learning_rate": 7.603412525036451e-05, + "loss": 0.0079, + "step": 295950 + }, + { + "epoch": 1.49, + "learning_rate": 7.602655755735049e-05, + "loss": 0.007, + "step": 295960 + }, + { + "epoch": 1.49, + "learning_rate": 7.601898986433648e-05, + "loss": 0.0079, + "step": 295970 + }, + { + "epoch": 1.49, + "learning_rate": 7.601142217132248e-05, + "loss": 0.0076, + "step": 295980 + }, + { + "epoch": 1.49, + "learning_rate": 7.600385447830846e-05, + "loss": 0.0069, + "step": 295990 + }, + { + "epoch": 1.49, + "learning_rate": 7.599628678529446e-05, + "loss": 0.0075, + "step": 296000 + }, + { + "epoch": 1.49, + "eval_cer": 0.9144605519419082, + "eval_loss": 0.005476477090269327, + "eval_runtime": 116.6265, + "eval_samples_per_second": 17.149, + "eval_steps_per_second": 4.287, + "step": 296000 + }, + { + "epoch": 1.49, + "learning_rate": 7.598871909228044e-05, + "loss": 0.0067, + "step": 296010 + }, + { + "epoch": 1.49, + "learning_rate": 7.598115139926643e-05, + "loss": 0.0109, + "step": 296020 + }, + { + "epoch": 1.49, + "learning_rate": 7.597358370625243e-05, + "loss": 0.012, + "step": 296030 + }, + { + "epoch": 1.49, + "learning_rate": 7.596601601323841e-05, + "loss": 0.0069, + "step": 296040 + }, + { + "epoch": 1.49, + "learning_rate": 7.59584483202244e-05, + "loss": 0.0075, + "step": 296050 + }, + { + "epoch": 1.49, + "learning_rate": 7.59508806272104e-05, + "loss": 0.0074, + "step": 296060 + }, + { + "epoch": 1.49, + "learning_rate": 7.594331293419638e-05, + "loss": 0.0083, + "step": 296070 + }, + { + "epoch": 1.49, + "learning_rate": 7.593574524118237e-05, + "loss": 0.0084, + "step": 296080 + }, + { + "epoch": 1.49, + "learning_rate": 7.592817754816836e-05, + "loss": 0.0063, + "step": 296090 + }, + { + "epoch": 1.49, + "learning_rate": 7.592060985515435e-05, + "loss": 0.0066, + "step": 296100 + }, + { + "epoch": 1.49, + "learning_rate": 7.591304216214035e-05, + "loss": 0.0106, + "step": 296110 + }, + { + "epoch": 1.49, + "learning_rate": 7.590547446912633e-05, + "loss": 0.0067, + "step": 296120 + }, + { + "epoch": 1.49, + "learning_rate": 7.589790677611232e-05, + "loss": 0.0062, + "step": 296130 + }, + { + "epoch": 1.49, + "learning_rate": 7.589033908309832e-05, + "loss": 0.0064, + "step": 296140 + }, + { + "epoch": 1.49, + "learning_rate": 7.58827713900843e-05, + "loss": 0.0087, + "step": 296150 + }, + { + "epoch": 1.49, + "learning_rate": 7.58752036970703e-05, + "loss": 0.006, + "step": 296160 + }, + { + "epoch": 1.49, + "learning_rate": 7.586763600405628e-05, + "loss": 0.0072, + "step": 296170 + }, + { + "epoch": 1.49, + "learning_rate": 7.586006831104227e-05, + "loss": 0.0075, + "step": 296180 + }, + { + "epoch": 1.49, + "learning_rate": 7.585250061802827e-05, + "loss": 0.008, + "step": 296190 + }, + { + "epoch": 1.49, + "learning_rate": 7.584493292501425e-05, + "loss": 0.0083, + "step": 296200 + }, + { + "epoch": 1.49, + "learning_rate": 7.583736523200024e-05, + "loss": 0.0053, + "step": 296210 + }, + { + "epoch": 1.49, + "learning_rate": 7.582979753898624e-05, + "loss": 0.0075, + "step": 296220 + }, + { + "epoch": 1.49, + "learning_rate": 7.582222984597222e-05, + "loss": 0.0063, + "step": 296230 + }, + { + "epoch": 1.49, + "learning_rate": 7.581466215295821e-05, + "loss": 0.0067, + "step": 296240 + }, + { + "epoch": 1.49, + "learning_rate": 7.58070944599442e-05, + "loss": 0.0102, + "step": 296250 + }, + { + "epoch": 1.49, + "learning_rate": 7.579952676693019e-05, + "loss": 0.0076, + "step": 296260 + }, + { + "epoch": 1.49, + "learning_rate": 7.579195907391618e-05, + "loss": 0.0065, + "step": 296270 + }, + { + "epoch": 1.49, + "learning_rate": 7.578439138090217e-05, + "loss": 0.009, + "step": 296280 + }, + { + "epoch": 1.49, + "learning_rate": 7.577682368788816e-05, + "loss": 0.0084, + "step": 296290 + }, + { + "epoch": 1.49, + "learning_rate": 7.576925599487416e-05, + "loss": 0.0066, + "step": 296300 + }, + { + "epoch": 1.49, + "learning_rate": 7.576168830186014e-05, + "loss": 0.0067, + "step": 296310 + }, + { + "epoch": 1.49, + "learning_rate": 7.575412060884612e-05, + "loss": 0.0096, + "step": 296320 + }, + { + "epoch": 1.5, + "learning_rate": 7.57465529158321e-05, + "loss": 0.007, + "step": 296330 + }, + { + "epoch": 1.5, + "learning_rate": 7.57389852228181e-05, + "loss": 0.0068, + "step": 296340 + }, + { + "epoch": 1.5, + "learning_rate": 7.573141752980409e-05, + "loss": 0.0079, + "step": 296350 + }, + { + "epoch": 1.5, + "learning_rate": 7.572384983679007e-05, + "loss": 0.0074, + "step": 296360 + }, + { + "epoch": 1.5, + "learning_rate": 7.571628214377607e-05, + "loss": 0.0084, + "step": 296370 + }, + { + "epoch": 1.5, + "learning_rate": 7.570871445076205e-05, + "loss": 0.0067, + "step": 296380 + }, + { + "epoch": 1.5, + "learning_rate": 7.570114675774804e-05, + "loss": 0.0066, + "step": 296390 + }, + { + "epoch": 1.5, + "learning_rate": 7.569357906473404e-05, + "loss": 0.0061, + "step": 296400 + }, + { + "epoch": 1.5, + "learning_rate": 7.568601137172002e-05, + "loss": 0.0053, + "step": 296410 + }, + { + "epoch": 1.5, + "learning_rate": 7.567844367870601e-05, + "loss": 0.0078, + "step": 296420 + }, + { + "epoch": 1.5, + "learning_rate": 7.567087598569201e-05, + "loss": 0.0101, + "step": 296430 + }, + { + "epoch": 1.5, + "learning_rate": 7.566330829267799e-05, + "loss": 0.0074, + "step": 296440 + }, + { + "epoch": 1.5, + "learning_rate": 7.565574059966399e-05, + "loss": 0.0083, + "step": 296450 + }, + { + "epoch": 1.5, + "learning_rate": 7.564817290664997e-05, + "loss": 0.0067, + "step": 296460 + }, + { + "epoch": 1.5, + "learning_rate": 7.564060521363596e-05, + "loss": 0.0077, + "step": 296470 + }, + { + "epoch": 1.5, + "learning_rate": 7.563303752062196e-05, + "loss": 0.0074, + "step": 296480 + }, + { + "epoch": 1.5, + "learning_rate": 7.562546982760794e-05, + "loss": 0.0094, + "step": 296490 + }, + { + "epoch": 1.5, + "learning_rate": 7.561790213459393e-05, + "loss": 0.0064, + "step": 296500 + }, + { + "epoch": 1.5, + "learning_rate": 7.561033444157993e-05, + "loss": 0.0056, + "step": 296510 + }, + { + "epoch": 1.5, + "learning_rate": 7.560276674856591e-05, + "loss": 0.0052, + "step": 296520 + }, + { + "epoch": 1.5, + "learning_rate": 7.55951990555519e-05, + "loss": 0.008, + "step": 296530 + }, + { + "epoch": 1.5, + "learning_rate": 7.558763136253789e-05, + "loss": 0.0072, + "step": 296540 + }, + { + "epoch": 1.5, + "learning_rate": 7.558006366952388e-05, + "loss": 0.0074, + "step": 296550 + }, + { + "epoch": 1.5, + "learning_rate": 7.557249597650988e-05, + "loss": 0.0062, + "step": 296560 + }, + { + "epoch": 1.5, + "learning_rate": 7.556492828349586e-05, + "loss": 0.0085, + "step": 296570 + }, + { + "epoch": 1.5, + "learning_rate": 7.555736059048185e-05, + "loss": 0.0082, + "step": 296580 + }, + { + "epoch": 1.5, + "learning_rate": 7.554979289746785e-05, + "loss": 0.006, + "step": 296590 + }, + { + "epoch": 1.5, + "learning_rate": 7.554222520445383e-05, + "loss": 0.0112, + "step": 296600 + }, + { + "epoch": 1.5, + "learning_rate": 7.553465751143982e-05, + "loss": 0.0074, + "step": 296610 + }, + { + "epoch": 1.5, + "learning_rate": 7.55270898184258e-05, + "loss": 0.0069, + "step": 296620 + }, + { + "epoch": 1.5, + "learning_rate": 7.55195221254118e-05, + "loss": 0.0064, + "step": 296630 + }, + { + "epoch": 1.5, + "learning_rate": 7.55119544323978e-05, + "loss": 0.0059, + "step": 296640 + }, + { + "epoch": 1.5, + "learning_rate": 7.550438673938378e-05, + "loss": 0.0065, + "step": 296650 + }, + { + "epoch": 1.5, + "learning_rate": 7.549681904636977e-05, + "loss": 0.0082, + "step": 296660 + }, + { + "epoch": 1.5, + "learning_rate": 7.548925135335577e-05, + "loss": 0.0066, + "step": 296670 + }, + { + "epoch": 1.5, + "learning_rate": 7.548168366034175e-05, + "loss": 0.0083, + "step": 296680 + }, + { + "epoch": 1.5, + "learning_rate": 7.547411596732774e-05, + "loss": 0.0079, + "step": 296690 + }, + { + "epoch": 1.5, + "learning_rate": 7.546654827431373e-05, + "loss": 0.0067, + "step": 296700 + }, + { + "epoch": 1.5, + "learning_rate": 7.545898058129972e-05, + "loss": 0.0068, + "step": 296710 + }, + { + "epoch": 1.5, + "learning_rate": 7.545141288828572e-05, + "loss": 0.0063, + "step": 296720 + }, + { + "epoch": 1.5, + "learning_rate": 7.54438451952717e-05, + "loss": 0.009, + "step": 296730 + }, + { + "epoch": 1.5, + "learning_rate": 7.543627750225769e-05, + "loss": 0.0069, + "step": 296740 + }, + { + "epoch": 1.5, + "learning_rate": 7.542870980924369e-05, + "loss": 0.0089, + "step": 296750 + }, + { + "epoch": 1.5, + "learning_rate": 7.542114211622967e-05, + "loss": 0.0067, + "step": 296760 + }, + { + "epoch": 1.5, + "learning_rate": 7.541357442321566e-05, + "loss": 0.0095, + "step": 296770 + }, + { + "epoch": 1.5, + "learning_rate": 7.540600673020164e-05, + "loss": 0.0113, + "step": 296780 + }, + { + "epoch": 1.5, + "learning_rate": 7.539843903718764e-05, + "loss": 0.0072, + "step": 296790 + }, + { + "epoch": 1.5, + "learning_rate": 7.539087134417363e-05, + "loss": 0.008, + "step": 296800 + }, + { + "epoch": 1.5, + "learning_rate": 7.538330365115962e-05, + "loss": 0.0073, + "step": 296810 + }, + { + "epoch": 1.5, + "learning_rate": 7.537573595814561e-05, + "loss": 0.0085, + "step": 296820 + }, + { + "epoch": 1.5, + "learning_rate": 7.53681682651316e-05, + "loss": 0.006, + "step": 296830 + }, + { + "epoch": 1.5, + "learning_rate": 7.536060057211759e-05, + "loss": 0.0074, + "step": 296840 + }, + { + "epoch": 1.5, + "learning_rate": 7.535303287910358e-05, + "loss": 0.006, + "step": 296850 + }, + { + "epoch": 1.5, + "learning_rate": 7.534546518608958e-05, + "loss": 0.0063, + "step": 296860 + }, + { + "epoch": 1.5, + "learning_rate": 7.533789749307556e-05, + "loss": 0.0105, + "step": 296870 + }, + { + "epoch": 1.5, + "learning_rate": 7.533032980006155e-05, + "loss": 0.0072, + "step": 296880 + }, + { + "epoch": 1.5, + "learning_rate": 7.532276210704754e-05, + "loss": 0.0072, + "step": 296890 + }, + { + "epoch": 1.5, + "learning_rate": 7.531519441403353e-05, + "loss": 0.0061, + "step": 296900 + }, + { + "epoch": 1.5, + "learning_rate": 7.530762672101953e-05, + "loss": 0.0054, + "step": 296910 + }, + { + "epoch": 1.5, + "learning_rate": 7.53000590280055e-05, + "loss": 0.0065, + "step": 296920 + }, + { + "epoch": 1.5, + "learning_rate": 7.52924913349915e-05, + "loss": 0.0061, + "step": 296930 + }, + { + "epoch": 1.5, + "learning_rate": 7.528492364197747e-05, + "loss": 0.0098, + "step": 296940 + }, + { + "epoch": 1.5, + "learning_rate": 7.527735594896346e-05, + "loss": 0.0078, + "step": 296950 + }, + { + "epoch": 1.5, + "learning_rate": 7.526978825594946e-05, + "loss": 0.0071, + "step": 296960 + }, + { + "epoch": 1.5, + "learning_rate": 7.526222056293544e-05, + "loss": 0.007, + "step": 296970 + }, + { + "epoch": 1.5, + "learning_rate": 7.525465286992144e-05, + "loss": 0.0074, + "step": 296980 + }, + { + "epoch": 1.5, + "learning_rate": 7.524708517690742e-05, + "loss": 0.0057, + "step": 296990 + }, + { + "epoch": 1.5, + "learning_rate": 7.523951748389341e-05, + "loss": 0.0049, + "step": 297000 + }, + { + "epoch": 1.5, + "eval_cer": 0.9144440552077764, + "eval_loss": 0.005415515974164009, + "eval_runtime": 116.5765, + "eval_samples_per_second": 17.156, + "eval_steps_per_second": 4.289, + "step": 297000 + }, + { + "epoch": 1.5, + "learning_rate": 7.523194979087941e-05, + "loss": 0.0068, + "step": 297010 + }, + { + "epoch": 1.5, + "learning_rate": 7.522438209786539e-05, + "loss": 0.0077, + "step": 297020 + }, + { + "epoch": 1.5, + "learning_rate": 7.521681440485138e-05, + "loss": 0.0068, + "step": 297030 + }, + { + "epoch": 1.5, + "learning_rate": 7.520924671183738e-05, + "loss": 0.0065, + "step": 297040 + }, + { + "epoch": 1.5, + "learning_rate": 7.520167901882336e-05, + "loss": 0.0071, + "step": 297050 + }, + { + "epoch": 1.5, + "learning_rate": 7.519411132580936e-05, + "loss": 0.0077, + "step": 297060 + }, + { + "epoch": 1.5, + "learning_rate": 7.518654363279534e-05, + "loss": 0.0067, + "step": 297070 + }, + { + "epoch": 1.5, + "learning_rate": 7.517897593978133e-05, + "loss": 0.0072, + "step": 297080 + }, + { + "epoch": 1.5, + "learning_rate": 7.517140824676733e-05, + "loss": 0.0087, + "step": 297090 + }, + { + "epoch": 1.5, + "learning_rate": 7.516384055375331e-05, + "loss": 0.008, + "step": 297100 + }, + { + "epoch": 1.5, + "learning_rate": 7.51562728607393e-05, + "loss": 0.0071, + "step": 297110 + }, + { + "epoch": 1.5, + "learning_rate": 7.51487051677253e-05, + "loss": 0.0082, + "step": 297120 + }, + { + "epoch": 1.5, + "learning_rate": 7.514113747471128e-05, + "loss": 0.0081, + "step": 297130 + }, + { + "epoch": 1.5, + "learning_rate": 7.513356978169727e-05, + "loss": 0.0062, + "step": 297140 + }, + { + "epoch": 1.5, + "learning_rate": 7.512600208868326e-05, + "loss": 0.0102, + "step": 297150 + }, + { + "epoch": 1.5, + "learning_rate": 7.511843439566925e-05, + "loss": 0.005, + "step": 297160 + }, + { + "epoch": 1.5, + "learning_rate": 7.511086670265525e-05, + "loss": 0.0073, + "step": 297170 + }, + { + "epoch": 1.5, + "learning_rate": 7.510329900964123e-05, + "loss": 0.0075, + "step": 297180 + }, + { + "epoch": 1.5, + "learning_rate": 7.509573131662722e-05, + "loss": 0.0075, + "step": 297190 + }, + { + "epoch": 1.5, + "learning_rate": 7.508816362361322e-05, + "loss": 0.0079, + "step": 297200 + }, + { + "epoch": 1.5, + "learning_rate": 7.50805959305992e-05, + "loss": 0.0083, + "step": 297210 + }, + { + "epoch": 1.5, + "learning_rate": 7.50730282375852e-05, + "loss": 0.0067, + "step": 297220 + }, + { + "epoch": 1.5, + "learning_rate": 7.506546054457118e-05, + "loss": 0.0081, + "step": 297230 + }, + { + "epoch": 1.5, + "learning_rate": 7.505789285155717e-05, + "loss": 0.0052, + "step": 297240 + }, + { + "epoch": 1.5, + "learning_rate": 7.505032515854317e-05, + "loss": 0.0071, + "step": 297250 + }, + { + "epoch": 1.5, + "learning_rate": 7.504275746552915e-05, + "loss": 0.0063, + "step": 297260 + }, + { + "epoch": 1.5, + "learning_rate": 7.503518977251514e-05, + "loss": 0.0069, + "step": 297270 + }, + { + "epoch": 1.5, + "learning_rate": 7.502762207950114e-05, + "loss": 0.0098, + "step": 297280 + }, + { + "epoch": 1.5, + "learning_rate": 7.502005438648712e-05, + "loss": 0.0068, + "step": 297290 + }, + { + "epoch": 1.5, + "learning_rate": 7.501248669347311e-05, + "loss": 0.008, + "step": 297300 + }, + { + "epoch": 1.5, + "learning_rate": 7.500491900045911e-05, + "loss": 0.0093, + "step": 297310 + }, + { + "epoch": 1.5, + "learning_rate": 7.499735130744509e-05, + "loss": 0.0074, + "step": 297320 + }, + { + "epoch": 1.5, + "learning_rate": 7.498978361443108e-05, + "loss": 0.0066, + "step": 297330 + }, + { + "epoch": 1.5, + "learning_rate": 7.498221592141707e-05, + "loss": 0.0072, + "step": 297340 + }, + { + "epoch": 1.5, + "learning_rate": 7.497464822840306e-05, + "loss": 0.0057, + "step": 297350 + }, + { + "epoch": 1.5, + "learning_rate": 7.496708053538906e-05, + "loss": 0.0068, + "step": 297360 + }, + { + "epoch": 1.5, + "learning_rate": 7.495951284237504e-05, + "loss": 0.0062, + "step": 297370 + }, + { + "epoch": 1.5, + "learning_rate": 7.495194514936103e-05, + "loss": 0.0081, + "step": 297380 + }, + { + "epoch": 1.5, + "learning_rate": 7.494437745634703e-05, + "loss": 0.0072, + "step": 297390 + }, + { + "epoch": 1.5, + "learning_rate": 7.493680976333301e-05, + "loss": 0.0083, + "step": 297400 + }, + { + "epoch": 1.5, + "learning_rate": 7.4929242070319e-05, + "loss": 0.0105, + "step": 297410 + }, + { + "epoch": 1.5, + "learning_rate": 7.492167437730499e-05, + "loss": 0.0089, + "step": 297420 + }, + { + "epoch": 1.5, + "learning_rate": 7.491410668429097e-05, + "loss": 0.0091, + "step": 297430 + }, + { + "epoch": 1.5, + "learning_rate": 7.490653899127696e-05, + "loss": 0.0073, + "step": 297440 + }, + { + "epoch": 1.5, + "learning_rate": 7.489897129826296e-05, + "loss": 0.0078, + "step": 297450 + }, + { + "epoch": 1.5, + "learning_rate": 7.489140360524894e-05, + "loss": 0.0072, + "step": 297460 + }, + { + "epoch": 1.5, + "learning_rate": 7.488383591223493e-05, + "loss": 0.012, + "step": 297470 + }, + { + "epoch": 1.5, + "learning_rate": 7.487626821922093e-05, + "loss": 0.0064, + "step": 297480 + }, + { + "epoch": 1.5, + "learning_rate": 7.486870052620691e-05, + "loss": 0.0061, + "step": 297490 + }, + { + "epoch": 1.5, + "learning_rate": 7.48611328331929e-05, + "loss": 0.0076, + "step": 297500 + }, + { + "epoch": 1.5, + "learning_rate": 7.485356514017889e-05, + "loss": 0.0074, + "step": 297510 + }, + { + "epoch": 1.5, + "learning_rate": 7.484599744716488e-05, + "loss": 0.0064, + "step": 297520 + }, + { + "epoch": 1.5, + "learning_rate": 7.483842975415088e-05, + "loss": 0.0083, + "step": 297530 + }, + { + "epoch": 1.5, + "learning_rate": 7.483086206113686e-05, + "loss": 0.0057, + "step": 297540 + }, + { + "epoch": 1.5, + "learning_rate": 7.482329436812285e-05, + "loss": 0.0084, + "step": 297550 + }, + { + "epoch": 1.5, + "learning_rate": 7.481572667510885e-05, + "loss": 0.0094, + "step": 297560 + }, + { + "epoch": 1.5, + "learning_rate": 7.480815898209483e-05, + "loss": 0.0076, + "step": 297570 + }, + { + "epoch": 1.5, + "learning_rate": 7.480059128908082e-05, + "loss": 0.0096, + "step": 297580 + }, + { + "epoch": 1.5, + "learning_rate": 7.47930235960668e-05, + "loss": 0.0073, + "step": 297590 + }, + { + "epoch": 1.5, + "learning_rate": 7.47854559030528e-05, + "loss": 0.0095, + "step": 297600 + }, + { + "epoch": 1.5, + "learning_rate": 7.47778882100388e-05, + "loss": 0.0075, + "step": 297610 + }, + { + "epoch": 1.5, + "learning_rate": 7.477032051702478e-05, + "loss": 0.0059, + "step": 297620 + }, + { + "epoch": 1.5, + "learning_rate": 7.476275282401077e-05, + "loss": 0.0076, + "step": 297630 + }, + { + "epoch": 1.5, + "learning_rate": 7.475518513099677e-05, + "loss": 0.006, + "step": 297640 + }, + { + "epoch": 1.5, + "learning_rate": 7.474761743798275e-05, + "loss": 0.0071, + "step": 297650 + }, + { + "epoch": 1.5, + "learning_rate": 7.474004974496874e-05, + "loss": 0.0083, + "step": 297660 + }, + { + "epoch": 1.5, + "learning_rate": 7.473248205195472e-05, + "loss": 0.0084, + "step": 297670 + }, + { + "epoch": 1.5, + "learning_rate": 7.472491435894072e-05, + "loss": 0.0069, + "step": 297680 + }, + { + "epoch": 1.5, + "learning_rate": 7.471734666592671e-05, + "loss": 0.0066, + "step": 297690 + }, + { + "epoch": 1.5, + "learning_rate": 7.47097789729127e-05, + "loss": 0.0071, + "step": 297700 + }, + { + "epoch": 1.5, + "learning_rate": 7.470221127989869e-05, + "loss": 0.006, + "step": 297710 + }, + { + "epoch": 1.5, + "learning_rate": 7.469464358688469e-05, + "loss": 0.0086, + "step": 297720 + }, + { + "epoch": 1.5, + "learning_rate": 7.468707589387067e-05, + "loss": 0.0093, + "step": 297730 + }, + { + "epoch": 1.5, + "learning_rate": 7.467950820085665e-05, + "loss": 0.0127, + "step": 297740 + }, + { + "epoch": 1.5, + "learning_rate": 7.467194050784264e-05, + "loss": 0.0075, + "step": 297750 + }, + { + "epoch": 1.5, + "learning_rate": 7.466437281482864e-05, + "loss": 0.0071, + "step": 297760 + }, + { + "epoch": 1.5, + "learning_rate": 7.465680512181462e-05, + "loss": 0.0071, + "step": 297770 + }, + { + "epoch": 1.5, + "learning_rate": 7.464923742880062e-05, + "loss": 0.0073, + "step": 297780 + }, + { + "epoch": 1.5, + "learning_rate": 7.46416697357866e-05, + "loss": 0.0066, + "step": 297790 + }, + { + "epoch": 1.5, + "learning_rate": 7.463410204277259e-05, + "loss": 0.0081, + "step": 297800 + }, + { + "epoch": 1.5, + "learning_rate": 7.462653434975859e-05, + "loss": 0.0099, + "step": 297810 + }, + { + "epoch": 1.5, + "learning_rate": 7.461896665674457e-05, + "loss": 0.008, + "step": 297820 + }, + { + "epoch": 1.5, + "learning_rate": 7.461139896373056e-05, + "loss": 0.0078, + "step": 297830 + }, + { + "epoch": 1.5, + "learning_rate": 7.460383127071656e-05, + "loss": 0.0083, + "step": 297840 + }, + { + "epoch": 1.5, + "learning_rate": 7.459626357770254e-05, + "loss": 0.0074, + "step": 297850 + }, + { + "epoch": 1.5, + "learning_rate": 7.458869588468853e-05, + "loss": 0.008, + "step": 297860 + }, + { + "epoch": 1.5, + "learning_rate": 7.458112819167452e-05, + "loss": 0.008, + "step": 297870 + }, + { + "epoch": 1.5, + "learning_rate": 7.457356049866051e-05, + "loss": 0.0074, + "step": 297880 + }, + { + "epoch": 1.5, + "learning_rate": 7.45659928056465e-05, + "loss": 0.0077, + "step": 297890 + }, + { + "epoch": 1.5, + "learning_rate": 7.455842511263249e-05, + "loss": 0.0058, + "step": 297900 + }, + { + "epoch": 1.5, + "learning_rate": 7.455085741961848e-05, + "loss": 0.0062, + "step": 297910 + }, + { + "epoch": 1.5, + "learning_rate": 7.454328972660448e-05, + "loss": 0.0077, + "step": 297920 + }, + { + "epoch": 1.5, + "learning_rate": 7.453572203359046e-05, + "loss": 0.007, + "step": 297930 + }, + { + "epoch": 1.5, + "learning_rate": 7.452815434057645e-05, + "loss": 0.0075, + "step": 297940 + }, + { + "epoch": 1.5, + "learning_rate": 7.452058664756244e-05, + "loss": 0.0095, + "step": 297950 + }, + { + "epoch": 1.5, + "learning_rate": 7.451301895454843e-05, + "loss": 0.0078, + "step": 297960 + }, + { + "epoch": 1.5, + "learning_rate": 7.450545126153443e-05, + "loss": 0.0082, + "step": 297970 + }, + { + "epoch": 1.5, + "learning_rate": 7.449788356852041e-05, + "loss": 0.0068, + "step": 297980 + }, + { + "epoch": 1.5, + "learning_rate": 7.44903158755064e-05, + "loss": 0.0064, + "step": 297990 + }, + { + "epoch": 1.5, + "learning_rate": 7.44827481824924e-05, + "loss": 0.006, + "step": 298000 + }, + { + "epoch": 1.5, + "eval_cer": 0.9144489071884033, + "eval_loss": 0.0054661910980939865, + "eval_runtime": 116.6326, + "eval_samples_per_second": 17.148, + "eval_steps_per_second": 4.287, + "step": 298000 + }, + { + "epoch": 1.5, + "learning_rate": 7.447518048947838e-05, + "loss": 0.007, + "step": 298010 + }, + { + "epoch": 1.5, + "learning_rate": 7.446761279646437e-05, + "loss": 0.0068, + "step": 298020 + }, + { + "epoch": 1.5, + "learning_rate": 7.446004510345035e-05, + "loss": 0.0082, + "step": 298030 + }, + { + "epoch": 1.5, + "learning_rate": 7.445247741043634e-05, + "loss": 0.0062, + "step": 298040 + }, + { + "epoch": 1.5, + "learning_rate": 7.444490971742233e-05, + "loss": 0.0069, + "step": 298050 + }, + { + "epoch": 1.5, + "learning_rate": 7.443734202440833e-05, + "loss": 0.007, + "step": 298060 + }, + { + "epoch": 1.5, + "learning_rate": 7.442977433139431e-05, + "loss": 0.0066, + "step": 298070 + }, + { + "epoch": 1.5, + "learning_rate": 7.44222066383803e-05, + "loss": 0.0067, + "step": 298080 + }, + { + "epoch": 1.5, + "learning_rate": 7.44146389453663e-05, + "loss": 0.0055, + "step": 298090 + }, + { + "epoch": 1.5, + "learning_rate": 7.440707125235228e-05, + "loss": 0.0058, + "step": 298100 + }, + { + "epoch": 1.5, + "learning_rate": 7.439950355933827e-05, + "loss": 0.0085, + "step": 298110 + }, + { + "epoch": 1.5, + "learning_rate": 7.439193586632426e-05, + "loss": 0.0068, + "step": 298120 + }, + { + "epoch": 1.5, + "learning_rate": 7.438436817331025e-05, + "loss": 0.0085, + "step": 298130 + }, + { + "epoch": 1.5, + "learning_rate": 7.437680048029625e-05, + "loss": 0.008, + "step": 298140 + }, + { + "epoch": 1.5, + "learning_rate": 7.436923278728223e-05, + "loss": 0.0079, + "step": 298150 + }, + { + "epoch": 1.5, + "learning_rate": 7.436166509426822e-05, + "loss": 0.007, + "step": 298160 + }, + { + "epoch": 1.5, + "learning_rate": 7.435409740125422e-05, + "loss": 0.0096, + "step": 298170 + }, + { + "epoch": 1.5, + "learning_rate": 7.43465297082402e-05, + "loss": 0.006, + "step": 298180 + }, + { + "epoch": 1.5, + "learning_rate": 7.43389620152262e-05, + "loss": 0.0064, + "step": 298190 + }, + { + "epoch": 1.5, + "learning_rate": 7.433139432221217e-05, + "loss": 0.0068, + "step": 298200 + }, + { + "epoch": 1.5, + "learning_rate": 7.432382662919817e-05, + "loss": 0.0062, + "step": 298210 + }, + { + "epoch": 1.5, + "learning_rate": 7.431625893618416e-05, + "loss": 0.0065, + "step": 298220 + }, + { + "epoch": 1.5, + "learning_rate": 7.430869124317015e-05, + "loss": 0.0086, + "step": 298230 + }, + { + "epoch": 1.5, + "learning_rate": 7.430112355015614e-05, + "loss": 0.0076, + "step": 298240 + }, + { + "epoch": 1.5, + "learning_rate": 7.429355585714214e-05, + "loss": 0.0069, + "step": 298250 + }, + { + "epoch": 1.5, + "learning_rate": 7.428598816412812e-05, + "loss": 0.0074, + "step": 298260 + }, + { + "epoch": 1.5, + "learning_rate": 7.427842047111411e-05, + "loss": 0.0106, + "step": 298270 + }, + { + "epoch": 1.5, + "learning_rate": 7.427085277810011e-05, + "loss": 0.0063, + "step": 298280 + }, + { + "epoch": 1.5, + "learning_rate": 7.426328508508609e-05, + "loss": 0.0075, + "step": 298290 + }, + { + "epoch": 1.5, + "learning_rate": 7.425571739207208e-05, + "loss": 0.0089, + "step": 298300 + }, + { + "epoch": 1.51, + "learning_rate": 7.424814969905807e-05, + "loss": 0.0078, + "step": 298310 + }, + { + "epoch": 1.51, + "learning_rate": 7.424058200604406e-05, + "loss": 0.0061, + "step": 298320 + }, + { + "epoch": 1.51, + "learning_rate": 7.423301431303006e-05, + "loss": 0.008, + "step": 298330 + }, + { + "epoch": 1.51, + "learning_rate": 7.422544662001604e-05, + "loss": 0.0078, + "step": 298340 + }, + { + "epoch": 1.51, + "learning_rate": 7.421787892700203e-05, + "loss": 0.0063, + "step": 298350 + }, + { + "epoch": 1.51, + "learning_rate": 7.421031123398801e-05, + "loss": 0.0066, + "step": 298360 + }, + { + "epoch": 1.51, + "learning_rate": 7.420274354097401e-05, + "loss": 0.0061, + "step": 298370 + }, + { + "epoch": 1.51, + "learning_rate": 7.419517584795999e-05, + "loss": 0.0082, + "step": 298380 + }, + { + "epoch": 1.51, + "learning_rate": 7.418760815494598e-05, + "loss": 0.0134, + "step": 298390 + }, + { + "epoch": 1.51, + "learning_rate": 7.418004046193197e-05, + "loss": 0.0077, + "step": 298400 + }, + { + "epoch": 1.51, + "learning_rate": 7.417247276891796e-05, + "loss": 0.006, + "step": 298410 + }, + { + "epoch": 1.51, + "learning_rate": 7.416490507590396e-05, + "loss": 0.0077, + "step": 298420 + }, + { + "epoch": 1.51, + "learning_rate": 7.415733738288994e-05, + "loss": 0.006, + "step": 298430 + }, + { + "epoch": 1.51, + "learning_rate": 7.414976968987593e-05, + "loss": 0.0089, + "step": 298440 + }, + { + "epoch": 1.51, + "learning_rate": 7.414220199686193e-05, + "loss": 0.0081, + "step": 298450 + }, + { + "epoch": 1.51, + "learning_rate": 7.413463430384791e-05, + "loss": 0.0078, + "step": 298460 + }, + { + "epoch": 1.51, + "learning_rate": 7.41270666108339e-05, + "loss": 0.0075, + "step": 298470 + }, + { + "epoch": 1.51, + "learning_rate": 7.411949891781989e-05, + "loss": 0.0088, + "step": 298480 + }, + { + "epoch": 1.51, + "learning_rate": 7.411193122480588e-05, + "loss": 0.0061, + "step": 298490 + }, + { + "epoch": 1.51, + "learning_rate": 7.410436353179188e-05, + "loss": 0.0078, + "step": 298500 + }, + { + "epoch": 1.51, + "learning_rate": 7.409679583877786e-05, + "loss": 0.0046, + "step": 298510 + }, + { + "epoch": 1.51, + "learning_rate": 7.408922814576385e-05, + "loss": 0.0084, + "step": 298520 + }, + { + "epoch": 1.51, + "learning_rate": 7.408166045274985e-05, + "loss": 0.0057, + "step": 298530 + }, + { + "epoch": 1.51, + "learning_rate": 7.407409275973583e-05, + "loss": 0.0056, + "step": 298540 + }, + { + "epoch": 1.51, + "learning_rate": 7.406652506672182e-05, + "loss": 0.0077, + "step": 298550 + }, + { + "epoch": 1.51, + "learning_rate": 7.40589573737078e-05, + "loss": 0.007, + "step": 298560 + }, + { + "epoch": 1.51, + "learning_rate": 7.40513896806938e-05, + "loss": 0.0072, + "step": 298570 + }, + { + "epoch": 1.51, + "learning_rate": 7.40438219876798e-05, + "loss": 0.0076, + "step": 298580 + }, + { + "epoch": 1.51, + "learning_rate": 7.403625429466578e-05, + "loss": 0.0083, + "step": 298590 + }, + { + "epoch": 1.51, + "learning_rate": 7.402868660165177e-05, + "loss": 0.0087, + "step": 298600 + }, + { + "epoch": 1.51, + "learning_rate": 7.402111890863777e-05, + "loss": 0.008, + "step": 298610 + }, + { + "epoch": 1.51, + "learning_rate": 7.401355121562375e-05, + "loss": 0.0082, + "step": 298620 + }, + { + "epoch": 1.51, + "learning_rate": 7.400598352260974e-05, + "loss": 0.0056, + "step": 298630 + }, + { + "epoch": 1.51, + "learning_rate": 7.399841582959572e-05, + "loss": 0.0064, + "step": 298640 + }, + { + "epoch": 1.51, + "learning_rate": 7.399084813658172e-05, + "loss": 0.0064, + "step": 298650 + }, + { + "epoch": 1.51, + "learning_rate": 7.398328044356771e-05, + "loss": 0.0062, + "step": 298660 + }, + { + "epoch": 1.51, + "learning_rate": 7.39757127505537e-05, + "loss": 0.0065, + "step": 298670 + }, + { + "epoch": 1.51, + "learning_rate": 7.396814505753968e-05, + "loss": 0.0072, + "step": 298680 + }, + { + "epoch": 1.51, + "learning_rate": 7.396057736452567e-05, + "loss": 0.0092, + "step": 298690 + }, + { + "epoch": 1.51, + "learning_rate": 7.395300967151167e-05, + "loss": 0.0088, + "step": 298700 + }, + { + "epoch": 1.51, + "learning_rate": 7.394544197849765e-05, + "loss": 0.0065, + "step": 298710 + }, + { + "epoch": 1.51, + "learning_rate": 7.393787428548364e-05, + "loss": 0.0073, + "step": 298720 + }, + { + "epoch": 1.51, + "learning_rate": 7.393030659246964e-05, + "loss": 0.0068, + "step": 298730 + }, + { + "epoch": 1.51, + "learning_rate": 7.392273889945562e-05, + "loss": 0.0048, + "step": 298740 + }, + { + "epoch": 1.51, + "learning_rate": 7.391517120644161e-05, + "loss": 0.0064, + "step": 298750 + }, + { + "epoch": 1.51, + "learning_rate": 7.39076035134276e-05, + "loss": 0.0092, + "step": 298760 + }, + { + "epoch": 1.51, + "learning_rate": 7.390003582041359e-05, + "loss": 0.0059, + "step": 298770 + }, + { + "epoch": 1.51, + "learning_rate": 7.389246812739959e-05, + "loss": 0.0068, + "step": 298780 + }, + { + "epoch": 1.51, + "learning_rate": 7.388490043438557e-05, + "loss": 0.0073, + "step": 298790 + }, + { + "epoch": 1.51, + "learning_rate": 7.387733274137156e-05, + "loss": 0.0067, + "step": 298800 + }, + { + "epoch": 1.51, + "learning_rate": 7.386976504835756e-05, + "loss": 0.0064, + "step": 298810 + }, + { + "epoch": 1.51, + "learning_rate": 7.386219735534354e-05, + "loss": 0.0075, + "step": 298820 + }, + { + "epoch": 1.51, + "learning_rate": 7.385462966232953e-05, + "loss": 0.0071, + "step": 298830 + }, + { + "epoch": 1.51, + "learning_rate": 7.384706196931552e-05, + "loss": 0.0071, + "step": 298840 + }, + { + "epoch": 1.51, + "learning_rate": 7.383949427630151e-05, + "loss": 0.0055, + "step": 298850 + }, + { + "epoch": 1.51, + "learning_rate": 7.38319265832875e-05, + "loss": 0.0074, + "step": 298860 + }, + { + "epoch": 1.51, + "learning_rate": 7.382435889027349e-05, + "loss": 0.0062, + "step": 298870 + }, + { + "epoch": 1.51, + "learning_rate": 7.381679119725948e-05, + "loss": 0.0074, + "step": 298880 + }, + { + "epoch": 1.51, + "learning_rate": 7.380922350424548e-05, + "loss": 0.0067, + "step": 298890 + }, + { + "epoch": 1.51, + "learning_rate": 7.380165581123146e-05, + "loss": 0.007, + "step": 298900 + }, + { + "epoch": 1.51, + "learning_rate": 7.379408811821745e-05, + "loss": 0.0056, + "step": 298910 + }, + { + "epoch": 1.51, + "learning_rate": 7.378652042520344e-05, + "loss": 0.0082, + "step": 298920 + }, + { + "epoch": 1.51, + "learning_rate": 7.377895273218943e-05, + "loss": 0.0061, + "step": 298930 + }, + { + "epoch": 1.51, + "learning_rate": 7.377138503917543e-05, + "loss": 0.0068, + "step": 298940 + }, + { + "epoch": 1.51, + "learning_rate": 7.37638173461614e-05, + "loss": 0.0071, + "step": 298950 + }, + { + "epoch": 1.51, + "learning_rate": 7.37562496531474e-05, + "loss": 0.006, + "step": 298960 + }, + { + "epoch": 1.51, + "learning_rate": 7.37486819601334e-05, + "loss": 0.0085, + "step": 298970 + }, + { + "epoch": 1.51, + "learning_rate": 7.374111426711938e-05, + "loss": 0.0067, + "step": 298980 + }, + { + "epoch": 1.51, + "learning_rate": 7.373354657410536e-05, + "loss": 0.0072, + "step": 298990 + }, + { + "epoch": 1.51, + "learning_rate": 7.372597888109135e-05, + "loss": 0.0058, + "step": 299000 + }, + { + "epoch": 1.51, + "eval_cer": 0.9144362920387732, + "eval_loss": 0.005306443199515343, + "eval_runtime": 116.5784, + "eval_samples_per_second": 17.156, + "eval_steps_per_second": 4.289, + "step": 299000 + }, + { + "epoch": 1.51, + "learning_rate": 7.371841118807734e-05, + "loss": 0.0063, + "step": 299010 + }, + { + "epoch": 1.51, + "learning_rate": 7.371084349506333e-05, + "loss": 0.0097, + "step": 299020 + }, + { + "epoch": 1.51, + "learning_rate": 7.370327580204933e-05, + "loss": 0.0081, + "step": 299030 + }, + { + "epoch": 1.51, + "learning_rate": 7.369570810903531e-05, + "loss": 0.0069, + "step": 299040 + }, + { + "epoch": 1.51, + "learning_rate": 7.36881404160213e-05, + "loss": 0.0084, + "step": 299050 + }, + { + "epoch": 1.51, + "learning_rate": 7.36805727230073e-05, + "loss": 0.0088, + "step": 299060 + }, + { + "epoch": 1.51, + "learning_rate": 7.367300502999328e-05, + "loss": 0.0067, + "step": 299070 + }, + { + "epoch": 1.51, + "learning_rate": 7.366543733697927e-05, + "loss": 0.0069, + "step": 299080 + }, + { + "epoch": 1.51, + "learning_rate": 7.365786964396526e-05, + "loss": 0.007, + "step": 299090 + }, + { + "epoch": 1.51, + "learning_rate": 7.365030195095125e-05, + "loss": 0.0075, + "step": 299100 + }, + { + "epoch": 1.51, + "learning_rate": 7.364273425793725e-05, + "loss": 0.0069, + "step": 299110 + }, + { + "epoch": 1.51, + "learning_rate": 7.363516656492323e-05, + "loss": 0.0071, + "step": 299120 + }, + { + "epoch": 1.51, + "learning_rate": 7.362759887190922e-05, + "loss": 0.0091, + "step": 299130 + }, + { + "epoch": 1.51, + "learning_rate": 7.362003117889522e-05, + "loss": 0.0067, + "step": 299140 + }, + { + "epoch": 1.51, + "learning_rate": 7.36124634858812e-05, + "loss": 0.0079, + "step": 299150 + }, + { + "epoch": 1.51, + "learning_rate": 7.360489579286719e-05, + "loss": 0.0072, + "step": 299160 + }, + { + "epoch": 1.51, + "learning_rate": 7.359732809985317e-05, + "loss": 0.007, + "step": 299170 + }, + { + "epoch": 1.51, + "learning_rate": 7.358976040683917e-05, + "loss": 0.0054, + "step": 299180 + }, + { + "epoch": 1.51, + "learning_rate": 7.358219271382516e-05, + "loss": 0.0063, + "step": 299190 + }, + { + "epoch": 1.51, + "learning_rate": 7.357462502081115e-05, + "loss": 0.006, + "step": 299200 + }, + { + "epoch": 1.51, + "learning_rate": 7.356705732779714e-05, + "loss": 0.0068, + "step": 299210 + }, + { + "epoch": 1.51, + "learning_rate": 7.355948963478314e-05, + "loss": 0.0071, + "step": 299220 + }, + { + "epoch": 1.51, + "learning_rate": 7.355192194176912e-05, + "loss": 0.0076, + "step": 299230 + }, + { + "epoch": 1.51, + "learning_rate": 7.354435424875511e-05, + "loss": 0.0075, + "step": 299240 + }, + { + "epoch": 1.51, + "learning_rate": 7.353678655574111e-05, + "loss": 0.0082, + "step": 299250 + }, + { + "epoch": 1.51, + "learning_rate": 7.352921886272709e-05, + "loss": 0.008, + "step": 299260 + }, + { + "epoch": 1.51, + "learning_rate": 7.352165116971308e-05, + "loss": 0.0087, + "step": 299270 + }, + { + "epoch": 1.51, + "learning_rate": 7.351408347669907e-05, + "loss": 0.0056, + "step": 299280 + }, + { + "epoch": 1.51, + "learning_rate": 7.350651578368506e-05, + "loss": 0.0062, + "step": 299290 + }, + { + "epoch": 1.51, + "learning_rate": 7.349894809067104e-05, + "loss": 0.0081, + "step": 299300 + }, + { + "epoch": 1.51, + "learning_rate": 7.349138039765704e-05, + "loss": 0.0067, + "step": 299310 + }, + { + "epoch": 1.51, + "learning_rate": 7.348381270464302e-05, + "loss": 0.0076, + "step": 299320 + }, + { + "epoch": 1.51, + "learning_rate": 7.347624501162901e-05, + "loss": 0.0065, + "step": 299330 + }, + { + "epoch": 1.51, + "learning_rate": 7.346867731861501e-05, + "loss": 0.0069, + "step": 299340 + }, + { + "epoch": 1.51, + "learning_rate": 7.346110962560099e-05, + "loss": 0.0052, + "step": 299350 + }, + { + "epoch": 1.51, + "learning_rate": 7.345354193258698e-05, + "loss": 0.0068, + "step": 299360 + }, + { + "epoch": 1.51, + "learning_rate": 7.344597423957297e-05, + "loss": 0.0075, + "step": 299370 + }, + { + "epoch": 1.51, + "learning_rate": 7.343840654655896e-05, + "loss": 0.0095, + "step": 299380 + }, + { + "epoch": 1.51, + "learning_rate": 7.343083885354496e-05, + "loss": 0.009, + "step": 299390 + }, + { + "epoch": 1.51, + "learning_rate": 7.342327116053094e-05, + "loss": 0.0075, + "step": 299400 + }, + { + "epoch": 1.51, + "learning_rate": 7.341570346751693e-05, + "loss": 0.0111, + "step": 299410 + }, + { + "epoch": 1.51, + "learning_rate": 7.340813577450293e-05, + "loss": 0.0064, + "step": 299420 + }, + { + "epoch": 1.51, + "learning_rate": 7.340056808148891e-05, + "loss": 0.0072, + "step": 299430 + }, + { + "epoch": 1.51, + "learning_rate": 7.33930003884749e-05, + "loss": 0.0084, + "step": 299440 + }, + { + "epoch": 1.51, + "learning_rate": 7.338543269546089e-05, + "loss": 0.0067, + "step": 299450 + }, + { + "epoch": 1.51, + "learning_rate": 7.337786500244688e-05, + "loss": 0.0071, + "step": 299460 + }, + { + "epoch": 1.51, + "learning_rate": 7.337029730943288e-05, + "loss": 0.0068, + "step": 299470 + }, + { + "epoch": 1.51, + "learning_rate": 7.336272961641886e-05, + "loss": 0.0053, + "step": 299480 + }, + { + "epoch": 1.51, + "learning_rate": 7.335516192340485e-05, + "loss": 0.008, + "step": 299490 + }, + { + "epoch": 1.51, + "learning_rate": 7.334759423039085e-05, + "loss": 0.0074, + "step": 299500 + }, + { + "epoch": 1.51, + "learning_rate": 7.334002653737683e-05, + "loss": 0.007, + "step": 299510 + }, + { + "epoch": 1.51, + "learning_rate": 7.333245884436282e-05, + "loss": 0.0062, + "step": 299520 + }, + { + "epoch": 1.51, + "learning_rate": 7.33248911513488e-05, + "loss": 0.0082, + "step": 299530 + }, + { + "epoch": 1.51, + "learning_rate": 7.33173234583348e-05, + "loss": 0.0089, + "step": 299540 + }, + { + "epoch": 1.51, + "learning_rate": 7.33097557653208e-05, + "loss": 0.0056, + "step": 299550 + }, + { + "epoch": 1.51, + "learning_rate": 7.330218807230678e-05, + "loss": 0.0068, + "step": 299560 + }, + { + "epoch": 1.51, + "learning_rate": 7.329462037929277e-05, + "loss": 0.0046, + "step": 299570 + }, + { + "epoch": 1.51, + "learning_rate": 7.328705268627877e-05, + "loss": 0.0085, + "step": 299580 + }, + { + "epoch": 1.51, + "learning_rate": 7.327948499326475e-05, + "loss": 0.0064, + "step": 299590 + }, + { + "epoch": 1.51, + "learning_rate": 7.327191730025074e-05, + "loss": 0.0059, + "step": 299600 + }, + { + "epoch": 1.51, + "learning_rate": 7.326434960723672e-05, + "loss": 0.0089, + "step": 299610 + }, + { + "epoch": 1.51, + "learning_rate": 7.32567819142227e-05, + "loss": 0.0097, + "step": 299620 + }, + { + "epoch": 1.51, + "learning_rate": 7.32492142212087e-05, + "loss": 0.0079, + "step": 299630 + }, + { + "epoch": 1.51, + "learning_rate": 7.32416465281947e-05, + "loss": 0.0056, + "step": 299640 + }, + { + "epoch": 1.51, + "learning_rate": 7.323407883518068e-05, + "loss": 0.006, + "step": 299650 + }, + { + "epoch": 1.51, + "learning_rate": 7.322651114216667e-05, + "loss": 0.0078, + "step": 299660 + }, + { + "epoch": 1.51, + "learning_rate": 7.321894344915267e-05, + "loss": 0.0058, + "step": 299670 + }, + { + "epoch": 1.51, + "learning_rate": 7.321137575613865e-05, + "loss": 0.0073, + "step": 299680 + }, + { + "epoch": 1.51, + "learning_rate": 7.320380806312464e-05, + "loss": 0.0075, + "step": 299690 + }, + { + "epoch": 1.51, + "learning_rate": 7.319624037011064e-05, + "loss": 0.008, + "step": 299700 + }, + { + "epoch": 1.51, + "learning_rate": 7.318867267709662e-05, + "loss": 0.0083, + "step": 299710 + }, + { + "epoch": 1.51, + "learning_rate": 7.318110498408261e-05, + "loss": 0.0076, + "step": 299720 + }, + { + "epoch": 1.51, + "learning_rate": 7.31735372910686e-05, + "loss": 0.0068, + "step": 299730 + }, + { + "epoch": 1.51, + "learning_rate": 7.316596959805459e-05, + "loss": 0.0071, + "step": 299740 + }, + { + "epoch": 1.51, + "learning_rate": 7.315840190504059e-05, + "loss": 0.0085, + "step": 299750 + }, + { + "epoch": 1.51, + "learning_rate": 7.315083421202657e-05, + "loss": 0.0082, + "step": 299760 + }, + { + "epoch": 1.51, + "learning_rate": 7.314326651901256e-05, + "loss": 0.0051, + "step": 299770 + }, + { + "epoch": 1.51, + "learning_rate": 7.313569882599856e-05, + "loss": 0.0086, + "step": 299780 + }, + { + "epoch": 1.51, + "learning_rate": 7.312813113298454e-05, + "loss": 0.0059, + "step": 299790 + }, + { + "epoch": 1.51, + "learning_rate": 7.312056343997053e-05, + "loss": 0.0081, + "step": 299800 + }, + { + "epoch": 1.51, + "learning_rate": 7.311299574695652e-05, + "loss": 0.0081, + "step": 299810 + }, + { + "epoch": 1.51, + "learning_rate": 7.310542805394251e-05, + "loss": 0.008, + "step": 299820 + }, + { + "epoch": 1.51, + "learning_rate": 7.30978603609285e-05, + "loss": 0.0073, + "step": 299830 + }, + { + "epoch": 1.51, + "learning_rate": 7.309029266791449e-05, + "loss": 0.0076, + "step": 299840 + }, + { + "epoch": 1.51, + "learning_rate": 7.308272497490048e-05, + "loss": 0.0091, + "step": 299850 + }, + { + "epoch": 1.51, + "learning_rate": 7.307515728188648e-05, + "loss": 0.0067, + "step": 299860 + }, + { + "epoch": 1.51, + "learning_rate": 7.306758958887246e-05, + "loss": 0.0073, + "step": 299870 + }, + { + "epoch": 1.51, + "learning_rate": 7.306002189585845e-05, + "loss": 0.0073, + "step": 299880 + }, + { + "epoch": 1.51, + "learning_rate": 7.305245420284443e-05, + "loss": 0.0062, + "step": 299890 + }, + { + "epoch": 1.51, + "learning_rate": 7.304488650983043e-05, + "loss": 0.0089, + "step": 299900 + }, + { + "epoch": 1.51, + "learning_rate": 7.303731881681642e-05, + "loss": 0.0049, + "step": 299910 + }, + { + "epoch": 1.51, + "learning_rate": 7.30297511238024e-05, + "loss": 0.0078, + "step": 299920 + }, + { + "epoch": 1.51, + "learning_rate": 7.302218343078839e-05, + "loss": 0.0064, + "step": 299930 + }, + { + "epoch": 1.51, + "learning_rate": 7.301461573777438e-05, + "loss": 0.007, + "step": 299940 + }, + { + "epoch": 1.51, + "learning_rate": 7.300704804476038e-05, + "loss": 0.0083, + "step": 299950 + }, + { + "epoch": 1.51, + "learning_rate": 7.299948035174636e-05, + "loss": 0.0068, + "step": 299960 + }, + { + "epoch": 1.51, + "learning_rate": 7.299191265873235e-05, + "loss": 0.0079, + "step": 299970 + }, + { + "epoch": 1.51, + "learning_rate": 7.298434496571834e-05, + "loss": 0.0082, + "step": 299980 + }, + { + "epoch": 1.51, + "learning_rate": 7.297677727270433e-05, + "loss": 0.0087, + "step": 299990 + }, + { + "epoch": 1.51, + "learning_rate": 7.296920957969033e-05, + "loss": 0.0079, + "step": 300000 + }, + { + "epoch": 1.51, + "eval_cer": 0.9144518183767796, + "eval_loss": 0.0054466393776237965, + "eval_runtime": 116.3507, + "eval_samples_per_second": 17.189, + "eval_steps_per_second": 4.297, + "step": 300000 + }, + { + "epoch": 1.51, + "learning_rate": 7.29616418866763e-05, + "loss": 0.0053, + "step": 300010 + }, + { + "epoch": 1.51, + "learning_rate": 7.29540741936623e-05, + "loss": 0.0059, + "step": 300020 + }, + { + "epoch": 1.51, + "learning_rate": 7.29465065006483e-05, + "loss": 0.0092, + "step": 300030 + }, + { + "epoch": 1.51, + "learning_rate": 7.293893880763428e-05, + "loss": 0.014, + "step": 300040 + }, + { + "epoch": 1.51, + "learning_rate": 7.293137111462027e-05, + "loss": 0.0071, + "step": 300050 + }, + { + "epoch": 1.51, + "learning_rate": 7.292380342160625e-05, + "loss": 0.008, + "step": 300060 + }, + { + "epoch": 1.51, + "learning_rate": 7.291623572859225e-05, + "loss": 0.0066, + "step": 300070 + }, + { + "epoch": 1.51, + "learning_rate": 7.290866803557824e-05, + "loss": 0.0085, + "step": 300080 + }, + { + "epoch": 1.51, + "learning_rate": 7.290110034256423e-05, + "loss": 0.0073, + "step": 300090 + }, + { + "epoch": 1.51, + "learning_rate": 7.289353264955022e-05, + "loss": 0.0087, + "step": 300100 + }, + { + "epoch": 1.51, + "learning_rate": 7.288596495653622e-05, + "loss": 0.0047, + "step": 300110 + }, + { + "epoch": 1.51, + "learning_rate": 7.28783972635222e-05, + "loss": 0.01, + "step": 300120 + }, + { + "epoch": 1.51, + "learning_rate": 7.287082957050819e-05, + "loss": 0.0071, + "step": 300130 + }, + { + "epoch": 1.51, + "learning_rate": 7.286326187749417e-05, + "loss": 0.0078, + "step": 300140 + }, + { + "epoch": 1.51, + "learning_rate": 7.285569418448017e-05, + "loss": 0.0104, + "step": 300150 + }, + { + "epoch": 1.51, + "learning_rate": 7.284812649146616e-05, + "loss": 0.0045, + "step": 300160 + }, + { + "epoch": 1.51, + "learning_rate": 7.284055879845215e-05, + "loss": 0.0074, + "step": 300170 + }, + { + "epoch": 1.51, + "learning_rate": 7.283299110543814e-05, + "loss": 0.0069, + "step": 300180 + }, + { + "epoch": 1.51, + "learning_rate": 7.282542341242414e-05, + "loss": 0.0084, + "step": 300190 + }, + { + "epoch": 1.51, + "learning_rate": 7.281785571941012e-05, + "loss": 0.007, + "step": 300200 + }, + { + "epoch": 1.51, + "learning_rate": 7.281028802639611e-05, + "loss": 0.0055, + "step": 300210 + }, + { + "epoch": 1.51, + "learning_rate": 7.28027203333821e-05, + "loss": 0.0085, + "step": 300220 + }, + { + "epoch": 1.51, + "learning_rate": 7.279515264036809e-05, + "loss": 0.0071, + "step": 300230 + }, + { + "epoch": 1.51, + "learning_rate": 7.278758494735407e-05, + "loss": 0.0068, + "step": 300240 + }, + { + "epoch": 1.51, + "learning_rate": 7.278001725434006e-05, + "loss": 0.0064, + "step": 300250 + }, + { + "epoch": 1.51, + "learning_rate": 7.277244956132605e-05, + "loss": 0.0061, + "step": 300260 + }, + { + "epoch": 1.51, + "learning_rate": 7.276488186831204e-05, + "loss": 0.0082, + "step": 300270 + }, + { + "epoch": 1.51, + "learning_rate": 7.275731417529804e-05, + "loss": 0.0063, + "step": 300280 + }, + { + "epoch": 1.51, + "learning_rate": 7.274974648228402e-05, + "loss": 0.0079, + "step": 300290 + }, + { + "epoch": 1.52, + "learning_rate": 7.274217878927001e-05, + "loss": 0.0097, + "step": 300300 + }, + { + "epoch": 1.52, + "learning_rate": 7.273461109625601e-05, + "loss": 0.0074, + "step": 300310 + }, + { + "epoch": 1.52, + "learning_rate": 7.272704340324199e-05, + "loss": 0.005, + "step": 300320 + }, + { + "epoch": 1.52, + "learning_rate": 7.271947571022798e-05, + "loss": 0.0068, + "step": 300330 + }, + { + "epoch": 1.52, + "learning_rate": 7.271190801721397e-05, + "loss": 0.0063, + "step": 300340 + }, + { + "epoch": 1.52, + "learning_rate": 7.270434032419996e-05, + "loss": 0.0092, + "step": 300350 + }, + { + "epoch": 1.52, + "learning_rate": 7.269677263118596e-05, + "loss": 0.0089, + "step": 300360 + }, + { + "epoch": 1.52, + "learning_rate": 7.268920493817194e-05, + "loss": 0.0102, + "step": 300370 + }, + { + "epoch": 1.52, + "learning_rate": 7.268163724515793e-05, + "loss": 0.0072, + "step": 300380 + }, + { + "epoch": 1.52, + "learning_rate": 7.267406955214393e-05, + "loss": 0.0042, + "step": 300390 + }, + { + "epoch": 1.52, + "learning_rate": 7.266650185912991e-05, + "loss": 0.0073, + "step": 300400 + }, + { + "epoch": 1.52, + "learning_rate": 7.26589341661159e-05, + "loss": 0.0056, + "step": 300410 + }, + { + "epoch": 1.52, + "learning_rate": 7.265136647310188e-05, + "loss": 0.0089, + "step": 300420 + }, + { + "epoch": 1.52, + "learning_rate": 7.264379878008788e-05, + "loss": 0.0074, + "step": 300430 + }, + { + "epoch": 1.52, + "learning_rate": 7.263623108707387e-05, + "loss": 0.0068, + "step": 300440 + }, + { + "epoch": 1.52, + "learning_rate": 7.262866339405986e-05, + "loss": 0.0075, + "step": 300450 + }, + { + "epoch": 1.52, + "learning_rate": 7.262109570104585e-05, + "loss": 0.0087, + "step": 300460 + }, + { + "epoch": 1.52, + "learning_rate": 7.261352800803185e-05, + "loss": 0.0055, + "step": 300470 + }, + { + "epoch": 1.52, + "learning_rate": 7.260596031501783e-05, + "loss": 0.0056, + "step": 300480 + }, + { + "epoch": 1.52, + "learning_rate": 7.259839262200382e-05, + "loss": 0.0067, + "step": 300490 + }, + { + "epoch": 1.52, + "learning_rate": 7.25908249289898e-05, + "loss": 0.0061, + "step": 300500 + }, + { + "epoch": 1.52, + "learning_rate": 7.25832572359758e-05, + "loss": 0.0073, + "step": 300510 + }, + { + "epoch": 1.52, + "learning_rate": 7.25756895429618e-05, + "loss": 0.0067, + "step": 300520 + }, + { + "epoch": 1.52, + "learning_rate": 7.256812184994778e-05, + "loss": 0.0076, + "step": 300530 + }, + { + "epoch": 1.52, + "learning_rate": 7.256055415693377e-05, + "loss": 0.0077, + "step": 300540 + }, + { + "epoch": 1.52, + "learning_rate": 7.255298646391977e-05, + "loss": 0.0078, + "step": 300550 + }, + { + "epoch": 1.52, + "learning_rate": 7.254541877090575e-05, + "loss": 0.0076, + "step": 300560 + }, + { + "epoch": 1.52, + "learning_rate": 7.253785107789173e-05, + "loss": 0.0073, + "step": 300570 + }, + { + "epoch": 1.52, + "learning_rate": 7.253028338487772e-05, + "loss": 0.0097, + "step": 300580 + }, + { + "epoch": 1.52, + "learning_rate": 7.25227156918637e-05, + "loss": 0.006, + "step": 300590 + }, + { + "epoch": 1.52, + "learning_rate": 7.25151479988497e-05, + "loss": 0.0063, + "step": 300600 + }, + { + "epoch": 1.52, + "learning_rate": 7.25075803058357e-05, + "loss": 0.0071, + "step": 300610 + }, + { + "epoch": 1.52, + "learning_rate": 7.250001261282168e-05, + "loss": 0.0064, + "step": 300620 + }, + { + "epoch": 1.52, + "learning_rate": 7.249244491980767e-05, + "loss": 0.0069, + "step": 300630 + }, + { + "epoch": 1.52, + "learning_rate": 7.248487722679367e-05, + "loss": 0.0053, + "step": 300640 + }, + { + "epoch": 1.52, + "learning_rate": 7.247730953377965e-05, + "loss": 0.0067, + "step": 300650 + }, + { + "epoch": 1.52, + "learning_rate": 7.246974184076564e-05, + "loss": 0.0069, + "step": 300660 + }, + { + "epoch": 1.52, + "learning_rate": 7.246217414775164e-05, + "loss": 0.0058, + "step": 300670 + }, + { + "epoch": 1.52, + "learning_rate": 7.245460645473762e-05, + "loss": 0.006, + "step": 300680 + }, + { + "epoch": 1.52, + "learning_rate": 7.244703876172361e-05, + "loss": 0.0074, + "step": 300690 + }, + { + "epoch": 1.52, + "learning_rate": 7.24394710687096e-05, + "loss": 0.0079, + "step": 300700 + }, + { + "epoch": 1.52, + "learning_rate": 7.243190337569559e-05, + "loss": 0.0064, + "step": 300710 + }, + { + "epoch": 1.52, + "learning_rate": 7.242433568268159e-05, + "loss": 0.007, + "step": 300720 + }, + { + "epoch": 1.52, + "learning_rate": 7.241676798966757e-05, + "loss": 0.0054, + "step": 300730 + }, + { + "epoch": 1.52, + "learning_rate": 7.240920029665356e-05, + "loss": 0.0078, + "step": 300740 + }, + { + "epoch": 1.52, + "learning_rate": 7.240163260363956e-05, + "loss": 0.006, + "step": 300750 + }, + { + "epoch": 1.52, + "learning_rate": 7.239406491062554e-05, + "loss": 0.0061, + "step": 300760 + }, + { + "epoch": 1.52, + "learning_rate": 7.238649721761153e-05, + "loss": 0.0049, + "step": 300770 + }, + { + "epoch": 1.52, + "learning_rate": 7.237892952459751e-05, + "loss": 0.0065, + "step": 300780 + }, + { + "epoch": 1.52, + "learning_rate": 7.237136183158351e-05, + "loss": 0.0072, + "step": 300790 + }, + { + "epoch": 1.52, + "learning_rate": 7.23637941385695e-05, + "loss": 0.0074, + "step": 300800 + }, + { + "epoch": 1.52, + "learning_rate": 7.235622644555549e-05, + "loss": 0.0064, + "step": 300810 + }, + { + "epoch": 1.52, + "learning_rate": 7.234865875254148e-05, + "loss": 0.0054, + "step": 300820 + }, + { + "epoch": 1.52, + "learning_rate": 7.234109105952748e-05, + "loss": 0.0069, + "step": 300830 + }, + { + "epoch": 1.52, + "learning_rate": 7.233352336651346e-05, + "loss": 0.0058, + "step": 300840 + }, + { + "epoch": 1.52, + "learning_rate": 7.232595567349945e-05, + "loss": 0.0074, + "step": 300850 + }, + { + "epoch": 1.52, + "learning_rate": 7.231838798048543e-05, + "loss": 0.0068, + "step": 300860 + }, + { + "epoch": 1.52, + "learning_rate": 7.231082028747142e-05, + "loss": 0.0062, + "step": 300870 + }, + { + "epoch": 1.52, + "learning_rate": 7.230325259445741e-05, + "loss": 0.0078, + "step": 300880 + }, + { + "epoch": 1.52, + "learning_rate": 7.22956849014434e-05, + "loss": 0.0069, + "step": 300890 + }, + { + "epoch": 1.52, + "learning_rate": 7.228811720842939e-05, + "loss": 0.0063, + "step": 300900 + }, + { + "epoch": 1.52, + "learning_rate": 7.228054951541538e-05, + "loss": 0.0072, + "step": 300910 + }, + { + "epoch": 1.52, + "learning_rate": 7.227298182240138e-05, + "loss": 0.0077, + "step": 300920 + }, + { + "epoch": 1.52, + "learning_rate": 7.226541412938736e-05, + "loss": 0.007, + "step": 300930 + }, + { + "epoch": 1.52, + "learning_rate": 7.225784643637335e-05, + "loss": 0.0064, + "step": 300940 + }, + { + "epoch": 1.52, + "learning_rate": 7.225027874335933e-05, + "loss": 0.0081, + "step": 300950 + }, + { + "epoch": 1.52, + "learning_rate": 7.224271105034533e-05, + "loss": 0.0075, + "step": 300960 + }, + { + "epoch": 1.52, + "learning_rate": 7.223514335733132e-05, + "loss": 0.0079, + "step": 300970 + }, + { + "epoch": 1.52, + "learning_rate": 7.22275756643173e-05, + "loss": 0.006, + "step": 300980 + }, + { + "epoch": 1.52, + "learning_rate": 7.22200079713033e-05, + "loss": 0.0083, + "step": 300990 + }, + { + "epoch": 1.52, + "learning_rate": 7.22124402782893e-05, + "loss": 0.0064, + "step": 301000 + }, + { + "epoch": 1.52, + "eval_cer": 0.9144430848116509, + "eval_loss": 0.00536463363096118, + "eval_runtime": 116.4459, + "eval_samples_per_second": 17.175, + "eval_steps_per_second": 4.294, + "step": 301000 + }, + { + "epoch": 1.52, + "learning_rate": 7.220487258527528e-05, + "loss": 0.0084, + "step": 301010 + }, + { + "epoch": 1.52, + "learning_rate": 7.219730489226127e-05, + "loss": 0.0061, + "step": 301020 + }, + { + "epoch": 1.52, + "learning_rate": 7.218973719924725e-05, + "loss": 0.0083, + "step": 301030 + }, + { + "epoch": 1.52, + "learning_rate": 7.218216950623325e-05, + "loss": 0.0093, + "step": 301040 + }, + { + "epoch": 1.52, + "learning_rate": 7.217460181321924e-05, + "loss": 0.0066, + "step": 301050 + }, + { + "epoch": 1.52, + "learning_rate": 7.216703412020523e-05, + "loss": 0.0059, + "step": 301060 + }, + { + "epoch": 1.52, + "learning_rate": 7.215946642719122e-05, + "loss": 0.0087, + "step": 301070 + }, + { + "epoch": 1.52, + "learning_rate": 7.215189873417722e-05, + "loss": 0.0063, + "step": 301080 + }, + { + "epoch": 1.52, + "learning_rate": 7.21443310411632e-05, + "loss": 0.0064, + "step": 301090 + }, + { + "epoch": 1.52, + "learning_rate": 7.213676334814919e-05, + "loss": 0.008, + "step": 301100 + }, + { + "epoch": 1.52, + "learning_rate": 7.212919565513517e-05, + "loss": 0.0081, + "step": 301110 + }, + { + "epoch": 1.52, + "learning_rate": 7.212162796212117e-05, + "loss": 0.006, + "step": 301120 + }, + { + "epoch": 1.52, + "learning_rate": 7.211406026910716e-05, + "loss": 0.0057, + "step": 301130 + }, + { + "epoch": 1.52, + "learning_rate": 7.210649257609314e-05, + "loss": 0.0065, + "step": 301140 + }, + { + "epoch": 1.52, + "learning_rate": 7.209892488307914e-05, + "loss": 0.0058, + "step": 301150 + }, + { + "epoch": 1.52, + "learning_rate": 7.209135719006513e-05, + "loss": 0.0071, + "step": 301160 + }, + { + "epoch": 1.52, + "learning_rate": 7.208378949705112e-05, + "loss": 0.0048, + "step": 301170 + }, + { + "epoch": 1.52, + "learning_rate": 7.207622180403711e-05, + "loss": 0.0074, + "step": 301180 + }, + { + "epoch": 1.52, + "learning_rate": 7.206865411102309e-05, + "loss": 0.007, + "step": 301190 + }, + { + "epoch": 1.52, + "learning_rate": 7.206108641800909e-05, + "loss": 0.0068, + "step": 301200 + }, + { + "epoch": 1.52, + "learning_rate": 7.205351872499507e-05, + "loss": 0.0054, + "step": 301210 + }, + { + "epoch": 1.52, + "learning_rate": 7.204595103198106e-05, + "loss": 0.0094, + "step": 301220 + }, + { + "epoch": 1.52, + "learning_rate": 7.203838333896705e-05, + "loss": 0.0072, + "step": 301230 + }, + { + "epoch": 1.52, + "learning_rate": 7.203081564595304e-05, + "loss": 0.0104, + "step": 301240 + }, + { + "epoch": 1.52, + "learning_rate": 7.202324795293904e-05, + "loss": 0.0098, + "step": 301250 + }, + { + "epoch": 1.52, + "learning_rate": 7.201568025992502e-05, + "loss": 0.0074, + "step": 301260 + }, + { + "epoch": 1.52, + "learning_rate": 7.200811256691101e-05, + "loss": 0.0081, + "step": 301270 + }, + { + "epoch": 1.52, + "learning_rate": 7.200054487389701e-05, + "loss": 0.0073, + "step": 301280 + }, + { + "epoch": 1.52, + "learning_rate": 7.199297718088299e-05, + "loss": 0.0073, + "step": 301290 + }, + { + "epoch": 1.52, + "learning_rate": 7.198540948786898e-05, + "loss": 0.0067, + "step": 301300 + }, + { + "epoch": 1.52, + "learning_rate": 7.197784179485496e-05, + "loss": 0.0071, + "step": 301310 + }, + { + "epoch": 1.52, + "learning_rate": 7.197027410184096e-05, + "loss": 0.0067, + "step": 301320 + }, + { + "epoch": 1.52, + "learning_rate": 7.196270640882695e-05, + "loss": 0.0071, + "step": 301330 + }, + { + "epoch": 1.52, + "learning_rate": 7.195513871581294e-05, + "loss": 0.0073, + "step": 301340 + }, + { + "epoch": 1.52, + "learning_rate": 7.194757102279893e-05, + "loss": 0.0074, + "step": 301350 + }, + { + "epoch": 1.52, + "learning_rate": 7.194000332978493e-05, + "loss": 0.0065, + "step": 301360 + }, + { + "epoch": 1.52, + "learning_rate": 7.193243563677091e-05, + "loss": 0.0068, + "step": 301370 + }, + { + "epoch": 1.52, + "learning_rate": 7.19248679437569e-05, + "loss": 0.0084, + "step": 301380 + }, + { + "epoch": 1.52, + "learning_rate": 7.191730025074288e-05, + "loss": 0.0068, + "step": 301390 + }, + { + "epoch": 1.52, + "learning_rate": 7.190973255772888e-05, + "loss": 0.0073, + "step": 301400 + }, + { + "epoch": 1.52, + "learning_rate": 7.190216486471487e-05, + "loss": 0.0097, + "step": 301410 + }, + { + "epoch": 1.52, + "learning_rate": 7.189459717170086e-05, + "loss": 0.0067, + "step": 301420 + }, + { + "epoch": 1.52, + "learning_rate": 7.188702947868685e-05, + "loss": 0.0055, + "step": 301430 + }, + { + "epoch": 1.52, + "learning_rate": 7.187946178567285e-05, + "loss": 0.0078, + "step": 301440 + }, + { + "epoch": 1.52, + "learning_rate": 7.187189409265883e-05, + "loss": 0.0055, + "step": 301450 + }, + { + "epoch": 1.52, + "learning_rate": 7.186432639964482e-05, + "loss": 0.0052, + "step": 301460 + }, + { + "epoch": 1.52, + "learning_rate": 7.18567587066308e-05, + "loss": 0.0062, + "step": 301470 + }, + { + "epoch": 1.52, + "learning_rate": 7.18491910136168e-05, + "loss": 0.0064, + "step": 301480 + }, + { + "epoch": 1.52, + "learning_rate": 7.18416233206028e-05, + "loss": 0.0075, + "step": 301490 + }, + { + "epoch": 1.52, + "learning_rate": 7.183405562758877e-05, + "loss": 0.0075, + "step": 301500 + }, + { + "epoch": 1.52, + "learning_rate": 7.182648793457476e-05, + "loss": 0.0069, + "step": 301510 + }, + { + "epoch": 1.52, + "learning_rate": 7.181892024156075e-05, + "loss": 0.0059, + "step": 301520 + }, + { + "epoch": 1.52, + "learning_rate": 7.181135254854675e-05, + "loss": 0.0064, + "step": 301530 + }, + { + "epoch": 1.52, + "learning_rate": 7.180378485553273e-05, + "loss": 0.0088, + "step": 301540 + }, + { + "epoch": 1.52, + "learning_rate": 7.179621716251872e-05, + "loss": 0.0068, + "step": 301550 + }, + { + "epoch": 1.52, + "learning_rate": 7.17886494695047e-05, + "loss": 0.0098, + "step": 301560 + }, + { + "epoch": 1.52, + "learning_rate": 7.17810817764907e-05, + "loss": 0.009, + "step": 301570 + }, + { + "epoch": 1.52, + "learning_rate": 7.17735140834767e-05, + "loss": 0.007, + "step": 301580 + }, + { + "epoch": 1.52, + "learning_rate": 7.176594639046268e-05, + "loss": 0.0057, + "step": 301590 + }, + { + "epoch": 1.52, + "learning_rate": 7.175837869744867e-05, + "loss": 0.0063, + "step": 301600 + }, + { + "epoch": 1.52, + "learning_rate": 7.175081100443467e-05, + "loss": 0.0084, + "step": 301610 + }, + { + "epoch": 1.52, + "learning_rate": 7.174324331142065e-05, + "loss": 0.0068, + "step": 301620 + }, + { + "epoch": 1.52, + "learning_rate": 7.173567561840664e-05, + "loss": 0.0066, + "step": 301630 + }, + { + "epoch": 1.52, + "learning_rate": 7.172810792539264e-05, + "loss": 0.0089, + "step": 301640 + }, + { + "epoch": 1.52, + "learning_rate": 7.172054023237862e-05, + "loss": 0.0055, + "step": 301650 + }, + { + "epoch": 1.52, + "learning_rate": 7.171297253936461e-05, + "loss": 0.0064, + "step": 301660 + }, + { + "epoch": 1.52, + "learning_rate": 7.17054048463506e-05, + "loss": 0.0062, + "step": 301670 + }, + { + "epoch": 1.52, + "learning_rate": 7.169783715333659e-05, + "loss": 0.006, + "step": 301680 + }, + { + "epoch": 1.52, + "learning_rate": 7.169026946032258e-05, + "loss": 0.0064, + "step": 301690 + }, + { + "epoch": 1.52, + "learning_rate": 7.168270176730857e-05, + "loss": 0.0056, + "step": 301700 + }, + { + "epoch": 1.52, + "learning_rate": 7.167513407429456e-05, + "loss": 0.0059, + "step": 301710 + }, + { + "epoch": 1.52, + "learning_rate": 7.166756638128056e-05, + "loss": 0.0081, + "step": 301720 + }, + { + "epoch": 1.52, + "learning_rate": 7.165999868826654e-05, + "loss": 0.0062, + "step": 301730 + }, + { + "epoch": 1.52, + "learning_rate": 7.165243099525253e-05, + "loss": 0.0075, + "step": 301740 + }, + { + "epoch": 1.52, + "learning_rate": 7.164486330223851e-05, + "loss": 0.01, + "step": 301750 + }, + { + "epoch": 1.52, + "learning_rate": 7.163729560922451e-05, + "loss": 0.0084, + "step": 301760 + }, + { + "epoch": 1.52, + "learning_rate": 7.16297279162105e-05, + "loss": 0.0058, + "step": 301770 + }, + { + "epoch": 1.52, + "learning_rate": 7.162216022319649e-05, + "loss": 0.0065, + "step": 301780 + }, + { + "epoch": 1.52, + "learning_rate": 7.161459253018248e-05, + "loss": 0.0057, + "step": 301790 + }, + { + "epoch": 1.52, + "learning_rate": 7.160702483716848e-05, + "loss": 0.0075, + "step": 301800 + }, + { + "epoch": 1.52, + "learning_rate": 7.159945714415446e-05, + "loss": 0.0072, + "step": 301810 + }, + { + "epoch": 1.52, + "learning_rate": 7.159188945114044e-05, + "loss": 0.0066, + "step": 301820 + }, + { + "epoch": 1.52, + "learning_rate": 7.158432175812643e-05, + "loss": 0.0066, + "step": 301830 + }, + { + "epoch": 1.52, + "learning_rate": 7.157675406511242e-05, + "loss": 0.0069, + "step": 301840 + }, + { + "epoch": 1.52, + "learning_rate": 7.156918637209841e-05, + "loss": 0.0069, + "step": 301850 + }, + { + "epoch": 1.52, + "learning_rate": 7.15616186790844e-05, + "loss": 0.0073, + "step": 301860 + }, + { + "epoch": 1.52, + "learning_rate": 7.155405098607039e-05, + "loss": 0.0066, + "step": 301870 + }, + { + "epoch": 1.52, + "learning_rate": 7.154648329305638e-05, + "loss": 0.0064, + "step": 301880 + }, + { + "epoch": 1.52, + "learning_rate": 7.153891560004238e-05, + "loss": 0.0075, + "step": 301890 + }, + { + "epoch": 1.52, + "learning_rate": 7.153134790702836e-05, + "loss": 0.0084, + "step": 301900 + }, + { + "epoch": 1.52, + "learning_rate": 7.152378021401435e-05, + "loss": 0.0063, + "step": 301910 + }, + { + "epoch": 1.52, + "learning_rate": 7.151621252100033e-05, + "loss": 0.0074, + "step": 301920 + }, + { + "epoch": 1.52, + "learning_rate": 7.150864482798633e-05, + "loss": 0.0056, + "step": 301930 + }, + { + "epoch": 1.52, + "learning_rate": 7.150107713497232e-05, + "loss": 0.0065, + "step": 301940 + }, + { + "epoch": 1.52, + "learning_rate": 7.14935094419583e-05, + "loss": 0.0057, + "step": 301950 + }, + { + "epoch": 1.52, + "learning_rate": 7.14859417489443e-05, + "loss": 0.0093, + "step": 301960 + }, + { + "epoch": 1.52, + "learning_rate": 7.14783740559303e-05, + "loss": 0.006, + "step": 301970 + }, + { + "epoch": 1.52, + "learning_rate": 7.147080636291628e-05, + "loss": 0.007, + "step": 301980 + }, + { + "epoch": 1.52, + "learning_rate": 7.146323866990227e-05, + "loss": 0.0069, + "step": 301990 + }, + { + "epoch": 1.52, + "learning_rate": 7.145567097688825e-05, + "loss": 0.008, + "step": 302000 + }, + { + "epoch": 1.52, + "eval_cer": 0.9144489071884033, + "eval_loss": 0.0054143439047038555, + "eval_runtime": 116.5206, + "eval_samples_per_second": 17.164, + "eval_steps_per_second": 4.291, + "step": 302000 + }, + { + "epoch": 1.52, + "learning_rate": 7.144810328387425e-05, + "loss": 0.0075, + "step": 302010 + }, + { + "epoch": 1.52, + "learning_rate": 7.144053559086024e-05, + "loss": 0.0073, + "step": 302020 + }, + { + "epoch": 1.52, + "learning_rate": 7.143296789784623e-05, + "loss": 0.007, + "step": 302030 + }, + { + "epoch": 1.52, + "learning_rate": 7.142540020483222e-05, + "loss": 0.0069, + "step": 302040 + }, + { + "epoch": 1.52, + "learning_rate": 7.141783251181822e-05, + "loss": 0.0078, + "step": 302050 + }, + { + "epoch": 1.52, + "learning_rate": 7.14102648188042e-05, + "loss": 0.0078, + "step": 302060 + }, + { + "epoch": 1.52, + "learning_rate": 7.140269712579019e-05, + "loss": 0.0089, + "step": 302070 + }, + { + "epoch": 1.52, + "learning_rate": 7.139512943277617e-05, + "loss": 0.0071, + "step": 302080 + }, + { + "epoch": 1.52, + "learning_rate": 7.138756173976217e-05, + "loss": 0.0062, + "step": 302090 + }, + { + "epoch": 1.52, + "learning_rate": 7.137999404674816e-05, + "loss": 0.0092, + "step": 302100 + }, + { + "epoch": 1.52, + "learning_rate": 7.137242635373414e-05, + "loss": 0.0076, + "step": 302110 + }, + { + "epoch": 1.52, + "learning_rate": 7.136485866072014e-05, + "loss": 0.0074, + "step": 302120 + }, + { + "epoch": 1.52, + "learning_rate": 7.135729096770612e-05, + "loss": 0.0078, + "step": 302130 + }, + { + "epoch": 1.52, + "learning_rate": 7.134972327469212e-05, + "loss": 0.0068, + "step": 302140 + }, + { + "epoch": 1.52, + "learning_rate": 7.13421555816781e-05, + "loss": 0.0097, + "step": 302150 + }, + { + "epoch": 1.52, + "learning_rate": 7.133458788866409e-05, + "loss": 0.0065, + "step": 302160 + }, + { + "epoch": 1.52, + "learning_rate": 7.132702019565009e-05, + "loss": 0.0067, + "step": 302170 + }, + { + "epoch": 1.52, + "learning_rate": 7.131945250263607e-05, + "loss": 0.0072, + "step": 302180 + }, + { + "epoch": 1.52, + "learning_rate": 7.131188480962206e-05, + "loss": 0.0072, + "step": 302190 + }, + { + "epoch": 1.52, + "learning_rate": 7.130431711660805e-05, + "loss": 0.0072, + "step": 302200 + }, + { + "epoch": 1.52, + "learning_rate": 7.129674942359404e-05, + "loss": 0.006, + "step": 302210 + }, + { + "epoch": 1.52, + "learning_rate": 7.128918173058004e-05, + "loss": 0.0081, + "step": 302220 + }, + { + "epoch": 1.52, + "learning_rate": 7.128161403756602e-05, + "loss": 0.0082, + "step": 302230 + }, + { + "epoch": 1.52, + "learning_rate": 7.127404634455201e-05, + "loss": 0.0083, + "step": 302240 + }, + { + "epoch": 1.52, + "learning_rate": 7.1266478651538e-05, + "loss": 0.0059, + "step": 302250 + }, + { + "epoch": 1.52, + "learning_rate": 7.125891095852399e-05, + "loss": 0.009, + "step": 302260 + }, + { + "epoch": 1.52, + "learning_rate": 7.125134326550998e-05, + "loss": 0.0063, + "step": 302270 + }, + { + "epoch": 1.53, + "learning_rate": 7.124377557249596e-05, + "loss": 0.0061, + "step": 302280 + }, + { + "epoch": 1.53, + "learning_rate": 7.123620787948196e-05, + "loss": 0.0075, + "step": 302290 + }, + { + "epoch": 1.53, + "learning_rate": 7.122864018646795e-05, + "loss": 0.0074, + "step": 302300 + }, + { + "epoch": 1.53, + "learning_rate": 7.122107249345394e-05, + "loss": 0.0064, + "step": 302310 + }, + { + "epoch": 1.53, + "learning_rate": 7.121350480043993e-05, + "loss": 0.0095, + "step": 302320 + }, + { + "epoch": 1.53, + "learning_rate": 7.120593710742593e-05, + "loss": 0.0054, + "step": 302330 + }, + { + "epoch": 1.53, + "learning_rate": 7.119836941441191e-05, + "loss": 0.0072, + "step": 302340 + }, + { + "epoch": 1.53, + "learning_rate": 7.11908017213979e-05, + "loss": 0.0077, + "step": 302350 + }, + { + "epoch": 1.53, + "learning_rate": 7.118323402838388e-05, + "loss": 0.006, + "step": 302360 + }, + { + "epoch": 1.53, + "learning_rate": 7.117566633536988e-05, + "loss": 0.0071, + "step": 302370 + }, + { + "epoch": 1.53, + "learning_rate": 7.116809864235587e-05, + "loss": 0.0073, + "step": 302380 + }, + { + "epoch": 1.53, + "learning_rate": 7.116053094934186e-05, + "loss": 0.0079, + "step": 302390 + }, + { + "epoch": 1.53, + "learning_rate": 7.115296325632785e-05, + "loss": 0.008, + "step": 302400 + }, + { + "epoch": 1.53, + "learning_rate": 7.114539556331385e-05, + "loss": 0.0082, + "step": 302410 + }, + { + "epoch": 1.53, + "learning_rate": 7.113782787029983e-05, + "loss": 0.0085, + "step": 302420 + }, + { + "epoch": 1.53, + "learning_rate": 7.113026017728582e-05, + "loss": 0.0088, + "step": 302430 + }, + { + "epoch": 1.53, + "learning_rate": 7.11226924842718e-05, + "loss": 0.0096, + "step": 302440 + }, + { + "epoch": 1.53, + "learning_rate": 7.111512479125778e-05, + "loss": 0.0068, + "step": 302450 + }, + { + "epoch": 1.53, + "learning_rate": 7.110755709824378e-05, + "loss": 0.0063, + "step": 302460 + }, + { + "epoch": 1.53, + "learning_rate": 7.109998940522977e-05, + "loss": 0.0062, + "step": 302470 + }, + { + "epoch": 1.53, + "learning_rate": 7.109242171221576e-05, + "loss": 0.007, + "step": 302480 + }, + { + "epoch": 1.53, + "learning_rate": 7.108485401920175e-05, + "loss": 0.0101, + "step": 302490 + }, + { + "epoch": 1.53, + "learning_rate": 7.107728632618775e-05, + "loss": 0.0096, + "step": 302500 + }, + { + "epoch": 1.53, + "learning_rate": 7.106971863317373e-05, + "loss": 0.0063, + "step": 302510 + }, + { + "epoch": 1.53, + "learning_rate": 7.106215094015972e-05, + "loss": 0.0061, + "step": 302520 + }, + { + "epoch": 1.53, + "learning_rate": 7.10545832471457e-05, + "loss": 0.0089, + "step": 302530 + }, + { + "epoch": 1.53, + "learning_rate": 7.10470155541317e-05, + "loss": 0.0049, + "step": 302540 + }, + { + "epoch": 1.53, + "learning_rate": 7.10394478611177e-05, + "loss": 0.008, + "step": 302550 + }, + { + "epoch": 1.53, + "learning_rate": 7.103188016810368e-05, + "loss": 0.008, + "step": 302560 + }, + { + "epoch": 1.53, + "learning_rate": 7.102431247508967e-05, + "loss": 0.0065, + "step": 302570 + }, + { + "epoch": 1.53, + "learning_rate": 7.101674478207567e-05, + "loss": 0.0072, + "step": 302580 + }, + { + "epoch": 1.53, + "learning_rate": 7.100917708906165e-05, + "loss": 0.0067, + "step": 302590 + }, + { + "epoch": 1.53, + "learning_rate": 7.100160939604764e-05, + "loss": 0.0093, + "step": 302600 + }, + { + "epoch": 1.53, + "learning_rate": 7.099404170303364e-05, + "loss": 0.0074, + "step": 302610 + }, + { + "epoch": 1.53, + "learning_rate": 7.098647401001962e-05, + "loss": 0.0062, + "step": 302620 + }, + { + "epoch": 1.53, + "learning_rate": 7.097890631700561e-05, + "loss": 0.0067, + "step": 302630 + }, + { + "epoch": 1.53, + "learning_rate": 7.09713386239916e-05, + "loss": 0.0081, + "step": 302640 + }, + { + "epoch": 1.53, + "learning_rate": 7.096377093097759e-05, + "loss": 0.0096, + "step": 302650 + }, + { + "epoch": 1.53, + "learning_rate": 7.095620323796358e-05, + "loss": 0.0079, + "step": 302660 + }, + { + "epoch": 1.53, + "learning_rate": 7.094863554494957e-05, + "loss": 0.007, + "step": 302670 + }, + { + "epoch": 1.53, + "learning_rate": 7.094106785193556e-05, + "loss": 0.0068, + "step": 302680 + }, + { + "epoch": 1.53, + "learning_rate": 7.093350015892156e-05, + "loss": 0.006, + "step": 302690 + }, + { + "epoch": 1.53, + "learning_rate": 7.092593246590754e-05, + "loss": 0.0064, + "step": 302700 + }, + { + "epoch": 1.53, + "learning_rate": 7.091836477289353e-05, + "loss": 0.007, + "step": 302710 + }, + { + "epoch": 1.53, + "learning_rate": 7.091079707987951e-05, + "loss": 0.0063, + "step": 302720 + }, + { + "epoch": 1.53, + "learning_rate": 7.090322938686551e-05, + "loss": 0.0093, + "step": 302730 + }, + { + "epoch": 1.53, + "learning_rate": 7.08956616938515e-05, + "loss": 0.0096, + "step": 302740 + }, + { + "epoch": 1.53, + "learning_rate": 7.088809400083749e-05, + "loss": 0.0067, + "step": 302750 + }, + { + "epoch": 1.53, + "learning_rate": 7.088052630782347e-05, + "loss": 0.0074, + "step": 302760 + }, + { + "epoch": 1.53, + "learning_rate": 7.087295861480946e-05, + "loss": 0.0087, + "step": 302770 + }, + { + "epoch": 1.53, + "learning_rate": 7.086539092179546e-05, + "loss": 0.0074, + "step": 302780 + }, + { + "epoch": 1.53, + "learning_rate": 7.085782322878144e-05, + "loss": 0.0058, + "step": 302790 + }, + { + "epoch": 1.53, + "learning_rate": 7.085025553576743e-05, + "loss": 0.008, + "step": 302800 + }, + { + "epoch": 1.53, + "learning_rate": 7.084268784275341e-05, + "loss": 0.0074, + "step": 302810 + }, + { + "epoch": 1.53, + "learning_rate": 7.083512014973941e-05, + "loss": 0.0066, + "step": 302820 + }, + { + "epoch": 1.53, + "learning_rate": 7.08275524567254e-05, + "loss": 0.0078, + "step": 302830 + }, + { + "epoch": 1.53, + "learning_rate": 7.081998476371139e-05, + "loss": 0.007, + "step": 302840 + }, + { + "epoch": 1.53, + "learning_rate": 7.081241707069738e-05, + "loss": 0.0062, + "step": 302850 + }, + { + "epoch": 1.53, + "learning_rate": 7.080484937768338e-05, + "loss": 0.0077, + "step": 302860 + }, + { + "epoch": 1.53, + "learning_rate": 7.079728168466936e-05, + "loss": 0.0072, + "step": 302870 + }, + { + "epoch": 1.53, + "learning_rate": 7.078971399165535e-05, + "loss": 0.0065, + "step": 302880 + }, + { + "epoch": 1.53, + "learning_rate": 7.078214629864133e-05, + "loss": 0.0054, + "step": 302890 + }, + { + "epoch": 1.53, + "learning_rate": 7.077457860562733e-05, + "loss": 0.0096, + "step": 302900 + }, + { + "epoch": 1.53, + "learning_rate": 7.076701091261332e-05, + "loss": 0.0075, + "step": 302910 + }, + { + "epoch": 1.53, + "learning_rate": 7.07594432195993e-05, + "loss": 0.008, + "step": 302920 + }, + { + "epoch": 1.53, + "learning_rate": 7.07518755265853e-05, + "loss": 0.0098, + "step": 302930 + }, + { + "epoch": 1.53, + "learning_rate": 7.07443078335713e-05, + "loss": 0.0062, + "step": 302940 + }, + { + "epoch": 1.53, + "learning_rate": 7.073674014055728e-05, + "loss": 0.0063, + "step": 302950 + }, + { + "epoch": 1.53, + "learning_rate": 7.072917244754327e-05, + "loss": 0.0054, + "step": 302960 + }, + { + "epoch": 1.53, + "learning_rate": 7.072160475452925e-05, + "loss": 0.0065, + "step": 302970 + }, + { + "epoch": 1.53, + "learning_rate": 7.071403706151525e-05, + "loss": 0.0086, + "step": 302980 + }, + { + "epoch": 1.53, + "learning_rate": 7.070646936850124e-05, + "loss": 0.0093, + "step": 302990 + }, + { + "epoch": 1.53, + "learning_rate": 7.069890167548722e-05, + "loss": 0.0051, + "step": 303000 + }, + { + "epoch": 1.53, + "eval_cer": 0.9144556999612812, + "eval_loss": 0.00549934571608901, + "eval_runtime": 116.3379, + "eval_samples_per_second": 17.191, + "eval_steps_per_second": 4.298, + "step": 303000 + }, + { + "epoch": 1.53, + "learning_rate": 7.069133398247322e-05, + "loss": 0.0096, + "step": 303010 + }, + { + "epoch": 1.53, + "learning_rate": 7.068376628945921e-05, + "loss": 0.0077, + "step": 303020 + }, + { + "epoch": 1.53, + "learning_rate": 7.06761985964452e-05, + "loss": 0.0057, + "step": 303030 + }, + { + "epoch": 1.53, + "learning_rate": 7.066863090343119e-05, + "loss": 0.0071, + "step": 303040 + }, + { + "epoch": 1.53, + "learning_rate": 7.066106321041717e-05, + "loss": 0.0069, + "step": 303050 + }, + { + "epoch": 1.53, + "learning_rate": 7.065349551740317e-05, + "loss": 0.0091, + "step": 303060 + }, + { + "epoch": 1.53, + "learning_rate": 7.064592782438915e-05, + "loss": 0.0078, + "step": 303070 + }, + { + "epoch": 1.53, + "learning_rate": 7.063836013137514e-05, + "loss": 0.0095, + "step": 303080 + }, + { + "epoch": 1.53, + "learning_rate": 7.063079243836113e-05, + "loss": 0.006, + "step": 303090 + }, + { + "epoch": 1.53, + "learning_rate": 7.062322474534712e-05, + "loss": 0.0077, + "step": 303100 + }, + { + "epoch": 1.53, + "learning_rate": 7.061565705233312e-05, + "loss": 0.0072, + "step": 303110 + }, + { + "epoch": 1.53, + "learning_rate": 7.06080893593191e-05, + "loss": 0.0081, + "step": 303120 + }, + { + "epoch": 1.53, + "learning_rate": 7.060052166630509e-05, + "loss": 0.0073, + "step": 303130 + }, + { + "epoch": 1.53, + "learning_rate": 7.059295397329109e-05, + "loss": 0.0089, + "step": 303140 + }, + { + "epoch": 1.53, + "learning_rate": 7.058538628027707e-05, + "loss": 0.0067, + "step": 303150 + }, + { + "epoch": 1.53, + "learning_rate": 7.057781858726306e-05, + "loss": 0.0056, + "step": 303160 + }, + { + "epoch": 1.53, + "learning_rate": 7.057025089424904e-05, + "loss": 0.0055, + "step": 303170 + }, + { + "epoch": 1.53, + "learning_rate": 7.056268320123504e-05, + "loss": 0.0075, + "step": 303180 + }, + { + "epoch": 1.53, + "learning_rate": 7.055511550822103e-05, + "loss": 0.0068, + "step": 303190 + }, + { + "epoch": 1.53, + "learning_rate": 7.054754781520702e-05, + "loss": 0.008, + "step": 303200 + }, + { + "epoch": 1.53, + "learning_rate": 7.053998012219301e-05, + "loss": 0.0089, + "step": 303210 + }, + { + "epoch": 1.53, + "learning_rate": 7.0532412429179e-05, + "loss": 0.0065, + "step": 303220 + }, + { + "epoch": 1.53, + "learning_rate": 7.052484473616499e-05, + "loss": 0.0073, + "step": 303230 + }, + { + "epoch": 1.53, + "learning_rate": 7.051727704315098e-05, + "loss": 0.0082, + "step": 303240 + }, + { + "epoch": 1.53, + "learning_rate": 7.050970935013696e-05, + "loss": 0.0073, + "step": 303250 + }, + { + "epoch": 1.53, + "learning_rate": 7.050214165712296e-05, + "loss": 0.007, + "step": 303260 + }, + { + "epoch": 1.53, + "learning_rate": 7.049457396410895e-05, + "loss": 0.0088, + "step": 303270 + }, + { + "epoch": 1.53, + "learning_rate": 7.048700627109494e-05, + "loss": 0.0083, + "step": 303280 + }, + { + "epoch": 1.53, + "learning_rate": 7.047943857808093e-05, + "loss": 0.006, + "step": 303290 + }, + { + "epoch": 1.53, + "learning_rate": 7.047187088506693e-05, + "loss": 0.0064, + "step": 303300 + }, + { + "epoch": 1.53, + "learning_rate": 7.046430319205291e-05, + "loss": 0.0067, + "step": 303310 + }, + { + "epoch": 1.53, + "learning_rate": 7.04567354990389e-05, + "loss": 0.0073, + "step": 303320 + }, + { + "epoch": 1.53, + "learning_rate": 7.044916780602488e-05, + "loss": 0.0047, + "step": 303330 + }, + { + "epoch": 1.53, + "learning_rate": 7.044160011301088e-05, + "loss": 0.0075, + "step": 303340 + }, + { + "epoch": 1.53, + "learning_rate": 7.043403241999687e-05, + "loss": 0.0067, + "step": 303350 + }, + { + "epoch": 1.53, + "learning_rate": 7.042646472698285e-05, + "loss": 0.0064, + "step": 303360 + }, + { + "epoch": 1.53, + "learning_rate": 7.041889703396885e-05, + "loss": 0.0077, + "step": 303370 + }, + { + "epoch": 1.53, + "learning_rate": 7.041132934095484e-05, + "loss": 0.009, + "step": 303380 + }, + { + "epoch": 1.53, + "learning_rate": 7.040376164794083e-05, + "loss": 0.0069, + "step": 303390 + }, + { + "epoch": 1.53, + "learning_rate": 7.039619395492681e-05, + "loss": 0.0076, + "step": 303400 + }, + { + "epoch": 1.53, + "learning_rate": 7.03886262619128e-05, + "loss": 0.0062, + "step": 303410 + }, + { + "epoch": 1.53, + "learning_rate": 7.038105856889878e-05, + "loss": 0.0063, + "step": 303420 + }, + { + "epoch": 1.53, + "learning_rate": 7.037349087588478e-05, + "loss": 0.0075, + "step": 303430 + }, + { + "epoch": 1.53, + "learning_rate": 7.036592318287077e-05, + "loss": 0.0072, + "step": 303440 + }, + { + "epoch": 1.53, + "learning_rate": 7.035835548985676e-05, + "loss": 0.0051, + "step": 303450 + }, + { + "epoch": 1.53, + "learning_rate": 7.035078779684275e-05, + "loss": 0.0079, + "step": 303460 + }, + { + "epoch": 1.53, + "learning_rate": 7.034322010382875e-05, + "loss": 0.006, + "step": 303470 + }, + { + "epoch": 1.53, + "learning_rate": 7.033565241081473e-05, + "loss": 0.0071, + "step": 303480 + }, + { + "epoch": 1.53, + "learning_rate": 7.032808471780072e-05, + "loss": 0.0067, + "step": 303490 + }, + { + "epoch": 1.53, + "learning_rate": 7.03205170247867e-05, + "loss": 0.0072, + "step": 303500 + }, + { + "epoch": 1.53, + "learning_rate": 7.03129493317727e-05, + "loss": 0.0088, + "step": 303510 + }, + { + "epoch": 1.53, + "learning_rate": 7.03053816387587e-05, + "loss": 0.0078, + "step": 303520 + }, + { + "epoch": 1.53, + "learning_rate": 7.029781394574467e-05, + "loss": 0.0072, + "step": 303530 + }, + { + "epoch": 1.53, + "learning_rate": 7.029024625273067e-05, + "loss": 0.011, + "step": 303540 + }, + { + "epoch": 1.53, + "learning_rate": 7.028267855971666e-05, + "loss": 0.0076, + "step": 303550 + }, + { + "epoch": 1.53, + "learning_rate": 7.027511086670265e-05, + "loss": 0.008, + "step": 303560 + }, + { + "epoch": 1.53, + "learning_rate": 7.026754317368864e-05, + "loss": 0.0067, + "step": 303570 + }, + { + "epoch": 1.53, + "learning_rate": 7.025997548067464e-05, + "loss": 0.0056, + "step": 303580 + }, + { + "epoch": 1.53, + "learning_rate": 7.025240778766062e-05, + "loss": 0.0051, + "step": 303590 + }, + { + "epoch": 1.53, + "learning_rate": 7.024484009464661e-05, + "loss": 0.0074, + "step": 303600 + }, + { + "epoch": 1.53, + "learning_rate": 7.02372724016326e-05, + "loss": 0.0107, + "step": 303610 + }, + { + "epoch": 1.53, + "learning_rate": 7.022970470861859e-05, + "loss": 0.0066, + "step": 303620 + }, + { + "epoch": 1.53, + "learning_rate": 7.022213701560458e-05, + "loss": 0.0066, + "step": 303630 + }, + { + "epoch": 1.53, + "learning_rate": 7.021456932259057e-05, + "loss": 0.0059, + "step": 303640 + }, + { + "epoch": 1.53, + "learning_rate": 7.020700162957656e-05, + "loss": 0.0058, + "step": 303650 + }, + { + "epoch": 1.53, + "learning_rate": 7.019943393656256e-05, + "loss": 0.0054, + "step": 303660 + }, + { + "epoch": 1.53, + "learning_rate": 7.019186624354854e-05, + "loss": 0.0069, + "step": 303670 + }, + { + "epoch": 1.53, + "learning_rate": 7.018429855053453e-05, + "loss": 0.0056, + "step": 303680 + }, + { + "epoch": 1.53, + "learning_rate": 7.017673085752051e-05, + "loss": 0.0067, + "step": 303690 + }, + { + "epoch": 1.53, + "learning_rate": 7.01691631645065e-05, + "loss": 0.0097, + "step": 303700 + }, + { + "epoch": 1.53, + "learning_rate": 7.016159547149249e-05, + "loss": 0.0091, + "step": 303710 + }, + { + "epoch": 1.53, + "learning_rate": 7.015402777847848e-05, + "loss": 0.0069, + "step": 303720 + }, + { + "epoch": 1.53, + "learning_rate": 7.014646008546447e-05, + "loss": 0.0083, + "step": 303730 + }, + { + "epoch": 1.53, + "learning_rate": 7.013889239245046e-05, + "loss": 0.0072, + "step": 303740 + }, + { + "epoch": 1.53, + "learning_rate": 7.013132469943646e-05, + "loss": 0.0057, + "step": 303750 + }, + { + "epoch": 1.53, + "learning_rate": 7.012375700642244e-05, + "loss": 0.0057, + "step": 303760 + }, + { + "epoch": 1.53, + "learning_rate": 7.011618931340843e-05, + "loss": 0.0078, + "step": 303770 + }, + { + "epoch": 1.53, + "learning_rate": 7.010862162039441e-05, + "loss": 0.0086, + "step": 303780 + }, + { + "epoch": 1.53, + "learning_rate": 7.010105392738041e-05, + "loss": 0.0063, + "step": 303790 + }, + { + "epoch": 1.53, + "learning_rate": 7.00934862343664e-05, + "loss": 0.0054, + "step": 303800 + }, + { + "epoch": 1.53, + "learning_rate": 7.008591854135239e-05, + "loss": 0.0068, + "step": 303810 + }, + { + "epoch": 1.53, + "learning_rate": 7.007835084833838e-05, + "loss": 0.0075, + "step": 303820 + }, + { + "epoch": 1.53, + "learning_rate": 7.007078315532438e-05, + "loss": 0.0051, + "step": 303830 + }, + { + "epoch": 1.53, + "learning_rate": 7.006321546231036e-05, + "loss": 0.0055, + "step": 303840 + }, + { + "epoch": 1.53, + "learning_rate": 7.005564776929635e-05, + "loss": 0.004, + "step": 303850 + }, + { + "epoch": 1.53, + "learning_rate": 7.004808007628233e-05, + "loss": 0.0081, + "step": 303860 + }, + { + "epoch": 1.53, + "learning_rate": 7.004051238326833e-05, + "loss": 0.0083, + "step": 303870 + }, + { + "epoch": 1.53, + "learning_rate": 7.003294469025432e-05, + "loss": 0.0058, + "step": 303880 + }, + { + "epoch": 1.53, + "learning_rate": 7.00253769972403e-05, + "loss": 0.0081, + "step": 303890 + }, + { + "epoch": 1.53, + "learning_rate": 7.00178093042263e-05, + "loss": 0.0089, + "step": 303900 + }, + { + "epoch": 1.53, + "learning_rate": 7.00102416112123e-05, + "loss": 0.0087, + "step": 303910 + }, + { + "epoch": 1.53, + "learning_rate": 7.000267391819828e-05, + "loss": 0.0066, + "step": 303920 + }, + { + "epoch": 1.53, + "learning_rate": 6.999510622518427e-05, + "loss": 0.0092, + "step": 303930 + }, + { + "epoch": 1.53, + "learning_rate": 6.998753853217025e-05, + "loss": 0.0053, + "step": 303940 + }, + { + "epoch": 1.53, + "learning_rate": 6.997997083915625e-05, + "loss": 0.0073, + "step": 303950 + }, + { + "epoch": 1.53, + "learning_rate": 6.997240314614224e-05, + "loss": 0.0078, + "step": 303960 + }, + { + "epoch": 1.53, + "learning_rate": 6.996483545312822e-05, + "loss": 0.0074, + "step": 303970 + }, + { + "epoch": 1.53, + "learning_rate": 6.995726776011422e-05, + "loss": 0.0089, + "step": 303980 + }, + { + "epoch": 1.53, + "learning_rate": 6.994970006710021e-05, + "loss": 0.01, + "step": 303990 + }, + { + "epoch": 1.53, + "learning_rate": 6.99421323740862e-05, + "loss": 0.0086, + "step": 304000 + }, + { + "epoch": 1.53, + "eval_cer": 0.9144459960000272, + "eval_loss": 0.005344762932509184, + "eval_runtime": 116.3874, + "eval_samples_per_second": 17.184, + "eval_steps_per_second": 4.296, + "step": 304000 + }, + { + "epoch": 1.53, + "learning_rate": 6.993456468107218e-05, + "loss": 0.0104, + "step": 304010 + }, + { + "epoch": 1.53, + "learning_rate": 6.992699698805817e-05, + "loss": 0.0061, + "step": 304020 + }, + { + "epoch": 1.53, + "learning_rate": 6.991942929504417e-05, + "loss": 0.0075, + "step": 304030 + }, + { + "epoch": 1.53, + "learning_rate": 6.991186160203015e-05, + "loss": 0.0075, + "step": 304040 + }, + { + "epoch": 1.53, + "learning_rate": 6.990429390901614e-05, + "loss": 0.0103, + "step": 304050 + }, + { + "epoch": 1.53, + "learning_rate": 6.989672621600212e-05, + "loss": 0.009, + "step": 304060 + }, + { + "epoch": 1.53, + "learning_rate": 6.988915852298812e-05, + "loss": 0.0096, + "step": 304070 + }, + { + "epoch": 1.53, + "learning_rate": 6.988159082997411e-05, + "loss": 0.0083, + "step": 304080 + }, + { + "epoch": 1.53, + "learning_rate": 6.98740231369601e-05, + "loss": 0.0059, + "step": 304090 + }, + { + "epoch": 1.53, + "learning_rate": 6.986645544394609e-05, + "loss": 0.0074, + "step": 304100 + }, + { + "epoch": 1.53, + "learning_rate": 6.985888775093209e-05, + "loss": 0.0088, + "step": 304110 + }, + { + "epoch": 1.53, + "learning_rate": 6.985132005791807e-05, + "loss": 0.009, + "step": 304120 + }, + { + "epoch": 1.53, + "learning_rate": 6.984375236490406e-05, + "loss": 0.006, + "step": 304130 + }, + { + "epoch": 1.53, + "learning_rate": 6.983618467189004e-05, + "loss": 0.0071, + "step": 304140 + }, + { + "epoch": 1.53, + "learning_rate": 6.982861697887604e-05, + "loss": 0.0086, + "step": 304150 + }, + { + "epoch": 1.53, + "learning_rate": 6.982104928586203e-05, + "loss": 0.0077, + "step": 304160 + }, + { + "epoch": 1.53, + "learning_rate": 6.981348159284802e-05, + "loss": 0.0076, + "step": 304170 + }, + { + "epoch": 1.53, + "learning_rate": 6.980591389983401e-05, + "loss": 0.0059, + "step": 304180 + }, + { + "epoch": 1.53, + "learning_rate": 6.979834620682e-05, + "loss": 0.008, + "step": 304190 + }, + { + "epoch": 1.53, + "learning_rate": 6.979077851380599e-05, + "loss": 0.0072, + "step": 304200 + }, + { + "epoch": 1.53, + "learning_rate": 6.978321082079198e-05, + "loss": 0.0058, + "step": 304210 + }, + { + "epoch": 1.53, + "learning_rate": 6.977564312777796e-05, + "loss": 0.0063, + "step": 304220 + }, + { + "epoch": 1.53, + "learning_rate": 6.976807543476396e-05, + "loss": 0.0078, + "step": 304230 + }, + { + "epoch": 1.53, + "learning_rate": 6.976050774174995e-05, + "loss": 0.0091, + "step": 304240 + }, + { + "epoch": 1.53, + "learning_rate": 6.975294004873593e-05, + "loss": 0.0068, + "step": 304250 + }, + { + "epoch": 1.54, + "learning_rate": 6.974537235572193e-05, + "loss": 0.0074, + "step": 304260 + }, + { + "epoch": 1.54, + "learning_rate": 6.973780466270792e-05, + "loss": 0.0067, + "step": 304270 + }, + { + "epoch": 1.54, + "learning_rate": 6.97302369696939e-05, + "loss": 0.0097, + "step": 304280 + }, + { + "epoch": 1.54, + "learning_rate": 6.97226692766799e-05, + "loss": 0.0082, + "step": 304290 + }, + { + "epoch": 1.54, + "learning_rate": 6.971510158366588e-05, + "loss": 0.0078, + "step": 304300 + }, + { + "epoch": 1.54, + "learning_rate": 6.970753389065188e-05, + "loss": 0.0093, + "step": 304310 + }, + { + "epoch": 1.54, + "learning_rate": 6.969996619763787e-05, + "loss": 0.0068, + "step": 304320 + }, + { + "epoch": 1.54, + "learning_rate": 6.969239850462385e-05, + "loss": 0.0098, + "step": 304330 + }, + { + "epoch": 1.54, + "learning_rate": 6.968483081160984e-05, + "loss": 0.01, + "step": 304340 + }, + { + "epoch": 1.54, + "learning_rate": 6.967726311859583e-05, + "loss": 0.0062, + "step": 304350 + }, + { + "epoch": 1.54, + "learning_rate": 6.966969542558183e-05, + "loss": 0.0081, + "step": 304360 + }, + { + "epoch": 1.54, + "learning_rate": 6.966212773256781e-05, + "loss": 0.0085, + "step": 304370 + }, + { + "epoch": 1.54, + "learning_rate": 6.96545600395538e-05, + "loss": 0.0072, + "step": 304380 + }, + { + "epoch": 1.54, + "learning_rate": 6.964699234653978e-05, + "loss": 0.0075, + "step": 304390 + }, + { + "epoch": 1.54, + "learning_rate": 6.963942465352578e-05, + "loss": 0.0048, + "step": 304400 + }, + { + "epoch": 1.54, + "learning_rate": 6.963185696051177e-05, + "loss": 0.0064, + "step": 304410 + }, + { + "epoch": 1.54, + "learning_rate": 6.962428926749775e-05, + "loss": 0.0057, + "step": 304420 + }, + { + "epoch": 1.54, + "learning_rate": 6.961672157448375e-05, + "loss": 0.0063, + "step": 304430 + }, + { + "epoch": 1.54, + "learning_rate": 6.960915388146974e-05, + "loss": 0.0069, + "step": 304440 + }, + { + "epoch": 1.54, + "learning_rate": 6.960158618845573e-05, + "loss": 0.0072, + "step": 304450 + }, + { + "epoch": 1.54, + "learning_rate": 6.959401849544172e-05, + "loss": 0.0065, + "step": 304460 + }, + { + "epoch": 1.54, + "learning_rate": 6.95864508024277e-05, + "loss": 0.0063, + "step": 304470 + }, + { + "epoch": 1.54, + "learning_rate": 6.95788831094137e-05, + "loss": 0.009, + "step": 304480 + }, + { + "epoch": 1.54, + "learning_rate": 6.957131541639969e-05, + "loss": 0.0058, + "step": 304490 + }, + { + "epoch": 1.54, + "learning_rate": 6.956374772338567e-05, + "loss": 0.0067, + "step": 304500 + }, + { + "epoch": 1.54, + "learning_rate": 6.955618003037167e-05, + "loss": 0.0064, + "step": 304510 + }, + { + "epoch": 1.54, + "learning_rate": 6.954861233735766e-05, + "loss": 0.0096, + "step": 304520 + }, + { + "epoch": 1.54, + "learning_rate": 6.954104464434365e-05, + "loss": 0.0095, + "step": 304530 + }, + { + "epoch": 1.54, + "learning_rate": 6.953347695132964e-05, + "loss": 0.0055, + "step": 304540 + }, + { + "epoch": 1.54, + "learning_rate": 6.952590925831564e-05, + "loss": 0.0069, + "step": 304550 + }, + { + "epoch": 1.54, + "learning_rate": 6.951834156530162e-05, + "loss": 0.0061, + "step": 304560 + }, + { + "epoch": 1.54, + "learning_rate": 6.951077387228761e-05, + "loss": 0.0067, + "step": 304570 + }, + { + "epoch": 1.54, + "learning_rate": 6.95032061792736e-05, + "loss": 0.0065, + "step": 304580 + }, + { + "epoch": 1.54, + "learning_rate": 6.949563848625959e-05, + "loss": 0.0052, + "step": 304590 + }, + { + "epoch": 1.54, + "learning_rate": 6.948807079324558e-05, + "loss": 0.0079, + "step": 304600 + }, + { + "epoch": 1.54, + "learning_rate": 6.948050310023157e-05, + "loss": 0.0062, + "step": 304610 + }, + { + "epoch": 1.54, + "learning_rate": 6.947293540721756e-05, + "loss": 0.0096, + "step": 304620 + }, + { + "epoch": 1.54, + "learning_rate": 6.946536771420355e-05, + "loss": 0.0075, + "step": 304630 + }, + { + "epoch": 1.54, + "learning_rate": 6.945780002118954e-05, + "loss": 0.0071, + "step": 304640 + }, + { + "epoch": 1.54, + "learning_rate": 6.945023232817552e-05, + "loss": 0.0062, + "step": 304650 + }, + { + "epoch": 1.54, + "learning_rate": 6.944266463516151e-05, + "loss": 0.0061, + "step": 304660 + }, + { + "epoch": 1.54, + "learning_rate": 6.94350969421475e-05, + "loss": 0.0064, + "step": 304670 + }, + { + "epoch": 1.54, + "learning_rate": 6.942752924913349e-05, + "loss": 0.0068, + "step": 304680 + }, + { + "epoch": 1.54, + "learning_rate": 6.941996155611948e-05, + "loss": 0.0057, + "step": 304690 + }, + { + "epoch": 1.54, + "learning_rate": 6.941239386310547e-05, + "loss": 0.0057, + "step": 304700 + }, + { + "epoch": 1.54, + "learning_rate": 6.940482617009146e-05, + "loss": 0.0083, + "step": 304710 + }, + { + "epoch": 1.54, + "learning_rate": 6.939725847707746e-05, + "loss": 0.0068, + "step": 304720 + }, + { + "epoch": 1.54, + "learning_rate": 6.938969078406344e-05, + "loss": 0.0071, + "step": 304730 + }, + { + "epoch": 1.54, + "learning_rate": 6.938212309104943e-05, + "loss": 0.0071, + "step": 304740 + }, + { + "epoch": 1.54, + "learning_rate": 6.937455539803541e-05, + "loss": 0.0073, + "step": 304750 + }, + { + "epoch": 1.54, + "learning_rate": 6.936698770502141e-05, + "loss": 0.0086, + "step": 304760 + }, + { + "epoch": 1.54, + "learning_rate": 6.93594200120074e-05, + "loss": 0.0068, + "step": 304770 + }, + { + "epoch": 1.54, + "learning_rate": 6.935185231899339e-05, + "loss": 0.0077, + "step": 304780 + }, + { + "epoch": 1.54, + "learning_rate": 6.934428462597938e-05, + "loss": 0.0075, + "step": 304790 + }, + { + "epoch": 1.54, + "learning_rate": 6.933671693296538e-05, + "loss": 0.0065, + "step": 304800 + }, + { + "epoch": 1.54, + "learning_rate": 6.932914923995136e-05, + "loss": 0.0065, + "step": 304810 + }, + { + "epoch": 1.54, + "learning_rate": 6.932158154693735e-05, + "loss": 0.009, + "step": 304820 + }, + { + "epoch": 1.54, + "learning_rate": 6.931401385392333e-05, + "loss": 0.006, + "step": 304830 + }, + { + "epoch": 1.54, + "learning_rate": 6.930644616090933e-05, + "loss": 0.005, + "step": 304840 + }, + { + "epoch": 1.54, + "learning_rate": 6.929887846789532e-05, + "loss": 0.0064, + "step": 304850 + }, + { + "epoch": 1.54, + "learning_rate": 6.92913107748813e-05, + "loss": 0.0072, + "step": 304860 + }, + { + "epoch": 1.54, + "learning_rate": 6.92837430818673e-05, + "loss": 0.0061, + "step": 304870 + }, + { + "epoch": 1.54, + "learning_rate": 6.92761753888533e-05, + "loss": 0.0061, + "step": 304880 + }, + { + "epoch": 1.54, + "learning_rate": 6.926860769583928e-05, + "loss": 0.007, + "step": 304890 + }, + { + "epoch": 1.54, + "learning_rate": 6.926104000282527e-05, + "loss": 0.0063, + "step": 304900 + }, + { + "epoch": 1.54, + "learning_rate": 6.925347230981125e-05, + "loss": 0.0073, + "step": 304910 + }, + { + "epoch": 1.54, + "learning_rate": 6.924590461679725e-05, + "loss": 0.007, + "step": 304920 + }, + { + "epoch": 1.54, + "learning_rate": 6.923833692378324e-05, + "loss": 0.006, + "step": 304930 + }, + { + "epoch": 1.54, + "learning_rate": 6.923076923076922e-05, + "loss": 0.0057, + "step": 304940 + }, + { + "epoch": 1.54, + "learning_rate": 6.922320153775522e-05, + "loss": 0.0056, + "step": 304950 + }, + { + "epoch": 1.54, + "learning_rate": 6.92156338447412e-05, + "loss": 0.0055, + "step": 304960 + }, + { + "epoch": 1.54, + "learning_rate": 6.92080661517272e-05, + "loss": 0.0077, + "step": 304970 + }, + { + "epoch": 1.54, + "learning_rate": 6.920049845871318e-05, + "loss": 0.0074, + "step": 304980 + }, + { + "epoch": 1.54, + "learning_rate": 6.919293076569917e-05, + "loss": 0.0056, + "step": 304990 + }, + { + "epoch": 1.54, + "learning_rate": 6.918536307268517e-05, + "loss": 0.0072, + "step": 305000 + }, + { + "epoch": 1.54, + "eval_cer": 0.9144392032271493, + "eval_loss": 0.0054320478811860085, + "eval_runtime": 116.39, + "eval_samples_per_second": 17.184, + "eval_steps_per_second": 4.296, + "step": 305000 + }, + { + "epoch": 1.54, + "learning_rate": 6.917779537967115e-05, + "loss": 0.0077, + "step": 305010 + }, + { + "epoch": 1.54, + "learning_rate": 6.917022768665714e-05, + "loss": 0.0075, + "step": 305020 + }, + { + "epoch": 1.54, + "learning_rate": 6.916265999364312e-05, + "loss": 0.0113, + "step": 305030 + }, + { + "epoch": 1.54, + "learning_rate": 6.915509230062912e-05, + "loss": 0.0112, + "step": 305040 + }, + { + "epoch": 1.54, + "learning_rate": 6.914752460761511e-05, + "loss": 0.0063, + "step": 305050 + }, + { + "epoch": 1.54, + "learning_rate": 6.91399569146011e-05, + "loss": 0.0066, + "step": 305060 + }, + { + "epoch": 1.54, + "learning_rate": 6.913238922158709e-05, + "loss": 0.0076, + "step": 305070 + }, + { + "epoch": 1.54, + "learning_rate": 6.912482152857309e-05, + "loss": 0.0063, + "step": 305080 + }, + { + "epoch": 1.54, + "learning_rate": 6.911725383555907e-05, + "loss": 0.0071, + "step": 305090 + }, + { + "epoch": 1.54, + "learning_rate": 6.910968614254506e-05, + "loss": 0.0077, + "step": 305100 + }, + { + "epoch": 1.54, + "learning_rate": 6.910211844953104e-05, + "loss": 0.0052, + "step": 305110 + }, + { + "epoch": 1.54, + "learning_rate": 6.909455075651704e-05, + "loss": 0.0065, + "step": 305120 + }, + { + "epoch": 1.54, + "learning_rate": 6.908698306350303e-05, + "loss": 0.0074, + "step": 305130 + }, + { + "epoch": 1.54, + "learning_rate": 6.907941537048902e-05, + "loss": 0.0073, + "step": 305140 + }, + { + "epoch": 1.54, + "learning_rate": 6.907184767747501e-05, + "loss": 0.0064, + "step": 305150 + }, + { + "epoch": 1.54, + "learning_rate": 6.9064279984461e-05, + "loss": 0.0052, + "step": 305160 + }, + { + "epoch": 1.54, + "learning_rate": 6.905671229144699e-05, + "loss": 0.0068, + "step": 305170 + }, + { + "epoch": 1.54, + "learning_rate": 6.904914459843298e-05, + "loss": 0.0085, + "step": 305180 + }, + { + "epoch": 1.54, + "learning_rate": 6.904157690541896e-05, + "loss": 0.0084, + "step": 305190 + }, + { + "epoch": 1.54, + "learning_rate": 6.903400921240496e-05, + "loss": 0.0076, + "step": 305200 + }, + { + "epoch": 1.54, + "learning_rate": 6.902644151939095e-05, + "loss": 0.0077, + "step": 305210 + }, + { + "epoch": 1.54, + "learning_rate": 6.901887382637693e-05, + "loss": 0.0082, + "step": 305220 + }, + { + "epoch": 1.54, + "learning_rate": 6.901130613336293e-05, + "loss": 0.007, + "step": 305230 + }, + { + "epoch": 1.54, + "learning_rate": 6.900373844034892e-05, + "loss": 0.0057, + "step": 305240 + }, + { + "epoch": 1.54, + "learning_rate": 6.89961707473349e-05, + "loss": 0.0061, + "step": 305250 + }, + { + "epoch": 1.54, + "learning_rate": 6.89886030543209e-05, + "loss": 0.0083, + "step": 305260 + }, + { + "epoch": 1.54, + "learning_rate": 6.898103536130688e-05, + "loss": 0.007, + "step": 305270 + }, + { + "epoch": 1.54, + "learning_rate": 6.897346766829286e-05, + "loss": 0.0073, + "step": 305280 + }, + { + "epoch": 1.54, + "learning_rate": 6.896589997527886e-05, + "loss": 0.0125, + "step": 305290 + }, + { + "epoch": 1.54, + "learning_rate": 6.895833228226485e-05, + "loss": 0.0074, + "step": 305300 + }, + { + "epoch": 1.54, + "learning_rate": 6.895076458925084e-05, + "loss": 0.0065, + "step": 305310 + }, + { + "epoch": 1.54, + "learning_rate": 6.894319689623683e-05, + "loss": 0.0071, + "step": 305320 + }, + { + "epoch": 1.54, + "learning_rate": 6.893562920322283e-05, + "loss": 0.008, + "step": 305330 + }, + { + "epoch": 1.54, + "learning_rate": 6.89280615102088e-05, + "loss": 0.0071, + "step": 305340 + }, + { + "epoch": 1.54, + "learning_rate": 6.89204938171948e-05, + "loss": 0.0078, + "step": 305350 + }, + { + "epoch": 1.54, + "learning_rate": 6.891292612418078e-05, + "loss": 0.0078, + "step": 305360 + }, + { + "epoch": 1.54, + "learning_rate": 6.890535843116678e-05, + "loss": 0.0088, + "step": 305370 + }, + { + "epoch": 1.54, + "learning_rate": 6.889779073815277e-05, + "loss": 0.0065, + "step": 305380 + }, + { + "epoch": 1.54, + "learning_rate": 6.889022304513875e-05, + "loss": 0.0063, + "step": 305390 + }, + { + "epoch": 1.54, + "learning_rate": 6.888265535212475e-05, + "loss": 0.0081, + "step": 305400 + }, + { + "epoch": 1.54, + "learning_rate": 6.887508765911074e-05, + "loss": 0.0076, + "step": 305410 + }, + { + "epoch": 1.54, + "learning_rate": 6.886751996609673e-05, + "loss": 0.0055, + "step": 305420 + }, + { + "epoch": 1.54, + "learning_rate": 6.885995227308272e-05, + "loss": 0.0075, + "step": 305430 + }, + { + "epoch": 1.54, + "learning_rate": 6.88523845800687e-05, + "loss": 0.0064, + "step": 305440 + }, + { + "epoch": 1.54, + "learning_rate": 6.88448168870547e-05, + "loss": 0.008, + "step": 305450 + }, + { + "epoch": 1.54, + "learning_rate": 6.883724919404069e-05, + "loss": 0.0097, + "step": 305460 + }, + { + "epoch": 1.54, + "learning_rate": 6.882968150102667e-05, + "loss": 0.0075, + "step": 305470 + }, + { + "epoch": 1.54, + "learning_rate": 6.882211380801267e-05, + "loss": 0.0073, + "step": 305480 + }, + { + "epoch": 1.54, + "learning_rate": 6.881454611499866e-05, + "loss": 0.0097, + "step": 305490 + }, + { + "epoch": 1.54, + "learning_rate": 6.880697842198465e-05, + "loss": 0.0072, + "step": 305500 + }, + { + "epoch": 1.54, + "learning_rate": 6.879941072897064e-05, + "loss": 0.0097, + "step": 305510 + }, + { + "epoch": 1.54, + "learning_rate": 6.879184303595664e-05, + "loss": 0.0062, + "step": 305520 + }, + { + "epoch": 1.54, + "learning_rate": 6.878427534294262e-05, + "loss": 0.0083, + "step": 305530 + }, + { + "epoch": 1.54, + "learning_rate": 6.877670764992861e-05, + "loss": 0.0087, + "step": 305540 + }, + { + "epoch": 1.54, + "learning_rate": 6.876913995691459e-05, + "loss": 0.0063, + "step": 305550 + }, + { + "epoch": 1.54, + "learning_rate": 6.876157226390059e-05, + "loss": 0.0082, + "step": 305560 + }, + { + "epoch": 1.54, + "learning_rate": 6.875400457088658e-05, + "loss": 0.0079, + "step": 305570 + }, + { + "epoch": 1.54, + "learning_rate": 6.874643687787256e-05, + "loss": 0.0066, + "step": 305580 + }, + { + "epoch": 1.54, + "learning_rate": 6.873886918485855e-05, + "loss": 0.0066, + "step": 305590 + }, + { + "epoch": 1.54, + "learning_rate": 6.873130149184454e-05, + "loss": 0.0063, + "step": 305600 + }, + { + "epoch": 1.54, + "learning_rate": 6.872373379883054e-05, + "loss": 0.0062, + "step": 305610 + }, + { + "epoch": 1.54, + "learning_rate": 6.871616610581652e-05, + "loss": 0.0075, + "step": 305620 + }, + { + "epoch": 1.54, + "learning_rate": 6.870859841280251e-05, + "loss": 0.0075, + "step": 305630 + }, + { + "epoch": 1.54, + "learning_rate": 6.87010307197885e-05, + "loss": 0.0067, + "step": 305640 + }, + { + "epoch": 1.54, + "learning_rate": 6.869346302677449e-05, + "loss": 0.0067, + "step": 305650 + }, + { + "epoch": 1.54, + "learning_rate": 6.868589533376048e-05, + "loss": 0.0052, + "step": 305660 + }, + { + "epoch": 1.54, + "learning_rate": 6.867832764074647e-05, + "loss": 0.007, + "step": 305670 + }, + { + "epoch": 1.54, + "learning_rate": 6.867075994773246e-05, + "loss": 0.0059, + "step": 305680 + }, + { + "epoch": 1.54, + "learning_rate": 6.866319225471846e-05, + "loss": 0.0081, + "step": 305690 + }, + { + "epoch": 1.54, + "learning_rate": 6.865562456170444e-05, + "loss": 0.0098, + "step": 305700 + }, + { + "epoch": 1.54, + "learning_rate": 6.864805686869043e-05, + "loss": 0.0078, + "step": 305710 + }, + { + "epoch": 1.54, + "learning_rate": 6.864048917567641e-05, + "loss": 0.0078, + "step": 305720 + }, + { + "epoch": 1.54, + "learning_rate": 6.863292148266241e-05, + "loss": 0.0102, + "step": 305730 + }, + { + "epoch": 1.54, + "learning_rate": 6.86253537896484e-05, + "loss": 0.0075, + "step": 305740 + }, + { + "epoch": 1.54, + "learning_rate": 6.861778609663438e-05, + "loss": 0.01, + "step": 305750 + }, + { + "epoch": 1.54, + "learning_rate": 6.861021840362038e-05, + "loss": 0.0059, + "step": 305760 + }, + { + "epoch": 1.54, + "learning_rate": 6.860265071060637e-05, + "loss": 0.0093, + "step": 305770 + }, + { + "epoch": 1.54, + "learning_rate": 6.859508301759236e-05, + "loss": 0.0073, + "step": 305780 + }, + { + "epoch": 1.54, + "learning_rate": 6.858751532457835e-05, + "loss": 0.0054, + "step": 305790 + }, + { + "epoch": 1.54, + "learning_rate": 6.857994763156433e-05, + "loss": 0.0063, + "step": 305800 + }, + { + "epoch": 1.54, + "learning_rate": 6.857237993855033e-05, + "loss": 0.0071, + "step": 305810 + }, + { + "epoch": 1.54, + "learning_rate": 6.856481224553632e-05, + "loss": 0.0067, + "step": 305820 + }, + { + "epoch": 1.54, + "learning_rate": 6.85572445525223e-05, + "loss": 0.0083, + "step": 305830 + }, + { + "epoch": 1.54, + "learning_rate": 6.85496768595083e-05, + "loss": 0.0068, + "step": 305840 + }, + { + "epoch": 1.54, + "learning_rate": 6.85421091664943e-05, + "loss": 0.0068, + "step": 305850 + }, + { + "epoch": 1.54, + "learning_rate": 6.853454147348028e-05, + "loss": 0.0065, + "step": 305860 + }, + { + "epoch": 1.54, + "learning_rate": 6.852697378046627e-05, + "loss": 0.0068, + "step": 305870 + }, + { + "epoch": 1.54, + "learning_rate": 6.851940608745225e-05, + "loss": 0.0063, + "step": 305880 + }, + { + "epoch": 1.54, + "learning_rate": 6.851183839443825e-05, + "loss": 0.0102, + "step": 305890 + }, + { + "epoch": 1.54, + "learning_rate": 6.850427070142423e-05, + "loss": 0.0069, + "step": 305900 + }, + { + "epoch": 1.54, + "learning_rate": 6.849670300841022e-05, + "loss": 0.0071, + "step": 305910 + }, + { + "epoch": 1.54, + "learning_rate": 6.84891353153962e-05, + "loss": 0.0068, + "step": 305920 + }, + { + "epoch": 1.54, + "learning_rate": 6.84815676223822e-05, + "loss": 0.0069, + "step": 305930 + }, + { + "epoch": 1.54, + "learning_rate": 6.84739999293682e-05, + "loss": 0.0066, + "step": 305940 + }, + { + "epoch": 1.54, + "learning_rate": 6.846643223635418e-05, + "loss": 0.0081, + "step": 305950 + }, + { + "epoch": 1.54, + "learning_rate": 6.845886454334017e-05, + "loss": 0.0058, + "step": 305960 + }, + { + "epoch": 1.54, + "learning_rate": 6.845129685032617e-05, + "loss": 0.0064, + "step": 305970 + }, + { + "epoch": 1.54, + "learning_rate": 6.844372915731215e-05, + "loss": 0.0072, + "step": 305980 + }, + { + "epoch": 1.54, + "learning_rate": 6.843616146429814e-05, + "loss": 0.0072, + "step": 305990 + }, + { + "epoch": 1.54, + "learning_rate": 6.842859377128412e-05, + "loss": 0.0088, + "step": 306000 + }, + { + "epoch": 1.54, + "eval_cer": 0.9144450256039017, + "eval_loss": 0.00540526770055294, + "eval_runtime": 116.2539, + "eval_samples_per_second": 17.204, + "eval_steps_per_second": 4.301, + "step": 306000 + }, + { + "epoch": 1.54, + "learning_rate": 6.842102607827012e-05, + "loss": 0.0125, + "step": 306010 + }, + { + "epoch": 1.54, + "learning_rate": 6.841345838525611e-05, + "loss": 0.0056, + "step": 306020 + }, + { + "epoch": 1.54, + "learning_rate": 6.84058906922421e-05, + "loss": 0.0085, + "step": 306030 + }, + { + "epoch": 1.54, + "learning_rate": 6.839832299922809e-05, + "loss": 0.0083, + "step": 306040 + }, + { + "epoch": 1.54, + "learning_rate": 6.839075530621409e-05, + "loss": 0.0074, + "step": 306050 + }, + { + "epoch": 1.54, + "learning_rate": 6.838318761320007e-05, + "loss": 0.005, + "step": 306060 + }, + { + "epoch": 1.54, + "learning_rate": 6.837561992018606e-05, + "loss": 0.0062, + "step": 306070 + }, + { + "epoch": 1.54, + "learning_rate": 6.836805222717204e-05, + "loss": 0.0113, + "step": 306080 + }, + { + "epoch": 1.54, + "learning_rate": 6.836048453415804e-05, + "loss": 0.0057, + "step": 306090 + }, + { + "epoch": 1.54, + "learning_rate": 6.835291684114403e-05, + "loss": 0.0053, + "step": 306100 + }, + { + "epoch": 1.54, + "learning_rate": 6.834534914813001e-05, + "loss": 0.0088, + "step": 306110 + }, + { + "epoch": 1.54, + "learning_rate": 6.833778145511601e-05, + "loss": 0.0087, + "step": 306120 + }, + { + "epoch": 1.54, + "learning_rate": 6.8330213762102e-05, + "loss": 0.01, + "step": 306130 + }, + { + "epoch": 1.54, + "learning_rate": 6.832264606908799e-05, + "loss": 0.0061, + "step": 306140 + }, + { + "epoch": 1.54, + "learning_rate": 6.831507837607398e-05, + "loss": 0.0076, + "step": 306150 + }, + { + "epoch": 1.54, + "learning_rate": 6.830751068305996e-05, + "loss": 0.0066, + "step": 306160 + }, + { + "epoch": 1.54, + "learning_rate": 6.829994299004596e-05, + "loss": 0.0066, + "step": 306170 + }, + { + "epoch": 1.54, + "learning_rate": 6.829237529703195e-05, + "loss": 0.0064, + "step": 306180 + }, + { + "epoch": 1.54, + "learning_rate": 6.828480760401793e-05, + "loss": 0.0071, + "step": 306190 + }, + { + "epoch": 1.54, + "learning_rate": 6.827723991100393e-05, + "loss": 0.0068, + "step": 306200 + }, + { + "epoch": 1.54, + "learning_rate": 6.826967221798991e-05, + "loss": 0.0074, + "step": 306210 + }, + { + "epoch": 1.54, + "learning_rate": 6.82621045249759e-05, + "loss": 0.0069, + "step": 306220 + }, + { + "epoch": 1.54, + "learning_rate": 6.825453683196189e-05, + "loss": 0.0043, + "step": 306230 + }, + { + "epoch": 1.55, + "learning_rate": 6.824696913894788e-05, + "loss": 0.0071, + "step": 306240 + }, + { + "epoch": 1.55, + "learning_rate": 6.823940144593386e-05, + "loss": 0.0071, + "step": 306250 + }, + { + "epoch": 1.55, + "learning_rate": 6.823183375291986e-05, + "loss": 0.0093, + "step": 306260 + }, + { + "epoch": 1.55, + "learning_rate": 6.822426605990585e-05, + "loss": 0.0074, + "step": 306270 + }, + { + "epoch": 1.55, + "learning_rate": 6.821669836689183e-05, + "loss": 0.008, + "step": 306280 + }, + { + "epoch": 1.55, + "learning_rate": 6.820913067387783e-05, + "loss": 0.0068, + "step": 306290 + }, + { + "epoch": 1.55, + "learning_rate": 6.820156298086382e-05, + "loss": 0.0068, + "step": 306300 + }, + { + "epoch": 1.55, + "learning_rate": 6.81939952878498e-05, + "loss": 0.0055, + "step": 306310 + }, + { + "epoch": 1.55, + "learning_rate": 6.81864275948358e-05, + "loss": 0.0073, + "step": 306320 + }, + { + "epoch": 1.55, + "learning_rate": 6.817885990182178e-05, + "loss": 0.0097, + "step": 306330 + }, + { + "epoch": 1.55, + "learning_rate": 6.817129220880778e-05, + "loss": 0.007, + "step": 306340 + }, + { + "epoch": 1.55, + "learning_rate": 6.816372451579377e-05, + "loss": 0.0064, + "step": 306350 + }, + { + "epoch": 1.55, + "learning_rate": 6.815615682277975e-05, + "loss": 0.0081, + "step": 306360 + }, + { + "epoch": 1.55, + "learning_rate": 6.814858912976575e-05, + "loss": 0.0076, + "step": 306370 + }, + { + "epoch": 1.55, + "learning_rate": 6.814102143675174e-05, + "loss": 0.0065, + "step": 306380 + }, + { + "epoch": 1.55, + "learning_rate": 6.813345374373773e-05, + "loss": 0.0073, + "step": 306390 + }, + { + "epoch": 1.55, + "learning_rate": 6.812588605072372e-05, + "loss": 0.0066, + "step": 306400 + }, + { + "epoch": 1.55, + "learning_rate": 6.81183183577097e-05, + "loss": 0.0068, + "step": 306410 + }, + { + "epoch": 1.55, + "learning_rate": 6.81107506646957e-05, + "loss": 0.0067, + "step": 306420 + }, + { + "epoch": 1.55, + "learning_rate": 6.810318297168169e-05, + "loss": 0.0062, + "step": 306430 + }, + { + "epoch": 1.55, + "learning_rate": 6.809561527866767e-05, + "loss": 0.0067, + "step": 306440 + }, + { + "epoch": 1.55, + "learning_rate": 6.808804758565367e-05, + "loss": 0.0063, + "step": 306450 + }, + { + "epoch": 1.55, + "learning_rate": 6.808047989263966e-05, + "loss": 0.0082, + "step": 306460 + }, + { + "epoch": 1.55, + "learning_rate": 6.807291219962564e-05, + "loss": 0.0057, + "step": 306470 + }, + { + "epoch": 1.55, + "learning_rate": 6.806534450661164e-05, + "loss": 0.0066, + "step": 306480 + }, + { + "epoch": 1.55, + "learning_rate": 6.805777681359763e-05, + "loss": 0.0072, + "step": 306490 + }, + { + "epoch": 1.55, + "learning_rate": 6.805020912058362e-05, + "loss": 0.0057, + "step": 306500 + }, + { + "epoch": 1.55, + "learning_rate": 6.804264142756961e-05, + "loss": 0.0081, + "step": 306510 + }, + { + "epoch": 1.55, + "learning_rate": 6.803507373455559e-05, + "loss": 0.0069, + "step": 306520 + }, + { + "epoch": 1.55, + "learning_rate": 6.802750604154157e-05, + "loss": 0.0066, + "step": 306530 + }, + { + "epoch": 1.55, + "learning_rate": 6.801993834852757e-05, + "loss": 0.0049, + "step": 306540 + }, + { + "epoch": 1.55, + "learning_rate": 6.801237065551356e-05, + "loss": 0.0082, + "step": 306550 + }, + { + "epoch": 1.55, + "learning_rate": 6.800480296249955e-05, + "loss": 0.0088, + "step": 306560 + }, + { + "epoch": 1.55, + "learning_rate": 6.799723526948554e-05, + "loss": 0.0056, + "step": 306570 + }, + { + "epoch": 1.55, + "learning_rate": 6.798966757647154e-05, + "loss": 0.0099, + "step": 306580 + }, + { + "epoch": 1.55, + "learning_rate": 6.798209988345752e-05, + "loss": 0.0051, + "step": 306590 + }, + { + "epoch": 1.55, + "learning_rate": 6.797453219044351e-05, + "loss": 0.0076, + "step": 306600 + }, + { + "epoch": 1.55, + "learning_rate": 6.79669644974295e-05, + "loss": 0.0061, + "step": 306610 + }, + { + "epoch": 1.55, + "learning_rate": 6.795939680441549e-05, + "loss": 0.0079, + "step": 306620 + }, + { + "epoch": 1.55, + "learning_rate": 6.795182911140148e-05, + "loss": 0.006, + "step": 306630 + }, + { + "epoch": 1.55, + "learning_rate": 6.794426141838746e-05, + "loss": 0.013, + "step": 306640 + }, + { + "epoch": 1.55, + "learning_rate": 6.793669372537346e-05, + "loss": 0.0068, + "step": 306650 + }, + { + "epoch": 1.55, + "learning_rate": 6.792912603235945e-05, + "loss": 0.0089, + "step": 306660 + }, + { + "epoch": 1.55, + "learning_rate": 6.792155833934544e-05, + "loss": 0.0074, + "step": 306670 + }, + { + "epoch": 1.55, + "learning_rate": 6.791399064633143e-05, + "loss": 0.0064, + "step": 306680 + }, + { + "epoch": 1.55, + "learning_rate": 6.790642295331741e-05, + "loss": 0.0063, + "step": 306690 + }, + { + "epoch": 1.55, + "learning_rate": 6.789885526030341e-05, + "loss": 0.008, + "step": 306700 + }, + { + "epoch": 1.55, + "learning_rate": 6.78912875672894e-05, + "loss": 0.0067, + "step": 306710 + }, + { + "epoch": 1.55, + "learning_rate": 6.788371987427538e-05, + "loss": 0.0059, + "step": 306720 + }, + { + "epoch": 1.55, + "learning_rate": 6.787615218126138e-05, + "loss": 0.0082, + "step": 306730 + }, + { + "epoch": 1.55, + "learning_rate": 6.786858448824737e-05, + "loss": 0.0068, + "step": 306740 + }, + { + "epoch": 1.55, + "learning_rate": 6.786101679523336e-05, + "loss": 0.007, + "step": 306750 + }, + { + "epoch": 1.55, + "learning_rate": 6.785344910221935e-05, + "loss": 0.0094, + "step": 306760 + }, + { + "epoch": 1.55, + "learning_rate": 6.784588140920533e-05, + "loss": 0.0067, + "step": 306770 + }, + { + "epoch": 1.55, + "learning_rate": 6.783831371619133e-05, + "loss": 0.0062, + "step": 306780 + }, + { + "epoch": 1.55, + "learning_rate": 6.783074602317732e-05, + "loss": 0.0094, + "step": 306790 + }, + { + "epoch": 1.55, + "learning_rate": 6.78231783301633e-05, + "loss": 0.0059, + "step": 306800 + }, + { + "epoch": 1.55, + "learning_rate": 6.78156106371493e-05, + "loss": 0.0077, + "step": 306810 + }, + { + "epoch": 1.55, + "learning_rate": 6.78080429441353e-05, + "loss": 0.0076, + "step": 306820 + }, + { + "epoch": 1.55, + "learning_rate": 6.780047525112127e-05, + "loss": 0.0093, + "step": 306830 + }, + { + "epoch": 1.55, + "learning_rate": 6.779290755810726e-05, + "loss": 0.0072, + "step": 306840 + }, + { + "epoch": 1.55, + "learning_rate": 6.778533986509325e-05, + "loss": 0.008, + "step": 306850 + }, + { + "epoch": 1.55, + "learning_rate": 6.777777217207923e-05, + "loss": 0.0065, + "step": 306860 + }, + { + "epoch": 1.55, + "learning_rate": 6.777020447906523e-05, + "loss": 0.0074, + "step": 306870 + }, + { + "epoch": 1.55, + "learning_rate": 6.776263678605122e-05, + "loss": 0.0068, + "step": 306880 + }, + { + "epoch": 1.55, + "learning_rate": 6.77550690930372e-05, + "loss": 0.0058, + "step": 306890 + }, + { + "epoch": 1.55, + "learning_rate": 6.77475014000232e-05, + "loss": 0.0067, + "step": 306900 + }, + { + "epoch": 1.55, + "learning_rate": 6.77399337070092e-05, + "loss": 0.0065, + "step": 306910 + }, + { + "epoch": 1.55, + "learning_rate": 6.773236601399518e-05, + "loss": 0.0066, + "step": 306920 + }, + { + "epoch": 1.55, + "learning_rate": 6.772479832098117e-05, + "loss": 0.0066, + "step": 306930 + }, + { + "epoch": 1.55, + "learning_rate": 6.771723062796717e-05, + "loss": 0.0056, + "step": 306940 + }, + { + "epoch": 1.55, + "learning_rate": 6.770966293495315e-05, + "loss": 0.0055, + "step": 306950 + }, + { + "epoch": 1.55, + "learning_rate": 6.770209524193914e-05, + "loss": 0.0072, + "step": 306960 + }, + { + "epoch": 1.55, + "learning_rate": 6.769452754892512e-05, + "loss": 0.0055, + "step": 306970 + }, + { + "epoch": 1.55, + "learning_rate": 6.768695985591112e-05, + "loss": 0.0095, + "step": 306980 + }, + { + "epoch": 1.55, + "learning_rate": 6.767939216289711e-05, + "loss": 0.0047, + "step": 306990 + }, + { + "epoch": 1.55, + "learning_rate": 6.76718244698831e-05, + "loss": 0.0055, + "step": 307000 + }, + { + "epoch": 1.55, + "eval_cer": 0.9144605519419082, + "eval_loss": 0.005416039377450943, + "eval_runtime": 116.4069, + "eval_samples_per_second": 17.181, + "eval_steps_per_second": 4.295, + "step": 307000 + }, + { + "epoch": 1.55, + "learning_rate": 6.766425677686909e-05, + "loss": 0.0072, + "step": 307010 + }, + { + "epoch": 1.55, + "learning_rate": 6.765668908385508e-05, + "loss": 0.0061, + "step": 307020 + }, + { + "epoch": 1.55, + "learning_rate": 6.764912139084107e-05, + "loss": 0.0074, + "step": 307030 + }, + { + "epoch": 1.55, + "learning_rate": 6.764155369782706e-05, + "loss": 0.0077, + "step": 307040 + }, + { + "epoch": 1.55, + "learning_rate": 6.763398600481304e-05, + "loss": 0.009, + "step": 307050 + }, + { + "epoch": 1.55, + "learning_rate": 6.762641831179904e-05, + "loss": 0.0073, + "step": 307060 + }, + { + "epoch": 1.55, + "learning_rate": 6.761885061878503e-05, + "loss": 0.0068, + "step": 307070 + }, + { + "epoch": 1.55, + "learning_rate": 6.761128292577101e-05, + "loss": 0.0065, + "step": 307080 + }, + { + "epoch": 1.55, + "learning_rate": 6.760371523275701e-05, + "loss": 0.0078, + "step": 307090 + }, + { + "epoch": 1.55, + "learning_rate": 6.7596147539743e-05, + "loss": 0.0068, + "step": 307100 + }, + { + "epoch": 1.55, + "learning_rate": 6.758857984672899e-05, + "loss": 0.0069, + "step": 307110 + }, + { + "epoch": 1.55, + "learning_rate": 6.758101215371498e-05, + "loss": 0.0059, + "step": 307120 + }, + { + "epoch": 1.55, + "learning_rate": 6.757344446070096e-05, + "loss": 0.0061, + "step": 307130 + }, + { + "epoch": 1.55, + "learning_rate": 6.756587676768696e-05, + "loss": 0.0079, + "step": 307140 + }, + { + "epoch": 1.55, + "learning_rate": 6.755830907467295e-05, + "loss": 0.0074, + "step": 307150 + }, + { + "epoch": 1.55, + "learning_rate": 6.755074138165893e-05, + "loss": 0.0074, + "step": 307160 + }, + { + "epoch": 1.55, + "learning_rate": 6.754317368864491e-05, + "loss": 0.0064, + "step": 307170 + }, + { + "epoch": 1.55, + "learning_rate": 6.753560599563091e-05, + "loss": 0.0069, + "step": 307180 + }, + { + "epoch": 1.55, + "learning_rate": 6.75280383026169e-05, + "loss": 0.0056, + "step": 307190 + }, + { + "epoch": 1.55, + "learning_rate": 6.752047060960289e-05, + "loss": 0.0062, + "step": 307200 + }, + { + "epoch": 1.55, + "learning_rate": 6.751290291658888e-05, + "loss": 0.0093, + "step": 307210 + }, + { + "epoch": 1.55, + "learning_rate": 6.750533522357486e-05, + "loss": 0.0079, + "step": 307220 + }, + { + "epoch": 1.55, + "learning_rate": 6.749776753056086e-05, + "loss": 0.006, + "step": 307230 + }, + { + "epoch": 1.55, + "learning_rate": 6.749019983754685e-05, + "loss": 0.0075, + "step": 307240 + }, + { + "epoch": 1.55, + "learning_rate": 6.748263214453283e-05, + "loss": 0.0054, + "step": 307250 + }, + { + "epoch": 1.55, + "learning_rate": 6.747506445151883e-05, + "loss": 0.0066, + "step": 307260 + }, + { + "epoch": 1.55, + "learning_rate": 6.746749675850482e-05, + "loss": 0.0086, + "step": 307270 + }, + { + "epoch": 1.55, + "learning_rate": 6.74599290654908e-05, + "loss": 0.0054, + "step": 307280 + }, + { + "epoch": 1.55, + "learning_rate": 6.74523613724768e-05, + "loss": 0.0071, + "step": 307290 + }, + { + "epoch": 1.55, + "learning_rate": 6.744479367946278e-05, + "loss": 0.007, + "step": 307300 + }, + { + "epoch": 1.55, + "learning_rate": 6.743722598644878e-05, + "loss": 0.0066, + "step": 307310 + }, + { + "epoch": 1.55, + "learning_rate": 6.742965829343477e-05, + "loss": 0.0073, + "step": 307320 + }, + { + "epoch": 1.55, + "learning_rate": 6.742209060042075e-05, + "loss": 0.006, + "step": 307330 + }, + { + "epoch": 1.55, + "learning_rate": 6.741452290740675e-05, + "loss": 0.0069, + "step": 307340 + }, + { + "epoch": 1.55, + "learning_rate": 6.740695521439274e-05, + "loss": 0.0068, + "step": 307350 + }, + { + "epoch": 1.55, + "learning_rate": 6.739938752137872e-05, + "loss": 0.0062, + "step": 307360 + }, + { + "epoch": 1.55, + "learning_rate": 6.739181982836472e-05, + "loss": 0.0045, + "step": 307370 + }, + { + "epoch": 1.55, + "learning_rate": 6.73842521353507e-05, + "loss": 0.006, + "step": 307380 + }, + { + "epoch": 1.55, + "learning_rate": 6.73766844423367e-05, + "loss": 0.0059, + "step": 307390 + }, + { + "epoch": 1.55, + "learning_rate": 6.736911674932269e-05, + "loss": 0.0059, + "step": 307400 + }, + { + "epoch": 1.55, + "learning_rate": 6.736154905630867e-05, + "loss": 0.0067, + "step": 307410 + }, + { + "epoch": 1.55, + "learning_rate": 6.735398136329467e-05, + "loss": 0.0072, + "step": 307420 + }, + { + "epoch": 1.55, + "learning_rate": 6.734641367028066e-05, + "loss": 0.0053, + "step": 307430 + }, + { + "epoch": 1.55, + "learning_rate": 6.733884597726664e-05, + "loss": 0.0061, + "step": 307440 + }, + { + "epoch": 1.55, + "learning_rate": 6.733127828425264e-05, + "loss": 0.0079, + "step": 307450 + }, + { + "epoch": 1.55, + "learning_rate": 6.732371059123863e-05, + "loss": 0.0144, + "step": 307460 + }, + { + "epoch": 1.55, + "learning_rate": 6.731614289822462e-05, + "loss": 0.0054, + "step": 307470 + }, + { + "epoch": 1.55, + "learning_rate": 6.73085752052106e-05, + "loss": 0.0063, + "step": 307480 + }, + { + "epoch": 1.55, + "learning_rate": 6.730100751219659e-05, + "loss": 0.0064, + "step": 307490 + }, + { + "epoch": 1.55, + "learning_rate": 6.729343981918257e-05, + "loss": 0.0069, + "step": 307500 + }, + { + "epoch": 1.55, + "learning_rate": 6.728587212616857e-05, + "loss": 0.0077, + "step": 307510 + }, + { + "epoch": 1.55, + "learning_rate": 6.727830443315456e-05, + "loss": 0.0096, + "step": 307520 + }, + { + "epoch": 1.55, + "learning_rate": 6.727073674014055e-05, + "loss": 0.0054, + "step": 307530 + }, + { + "epoch": 1.55, + "learning_rate": 6.726316904712654e-05, + "loss": 0.0062, + "step": 307540 + }, + { + "epoch": 1.55, + "learning_rate": 6.725560135411254e-05, + "loss": 0.0076, + "step": 307550 + }, + { + "epoch": 1.55, + "learning_rate": 6.724803366109852e-05, + "loss": 0.0062, + "step": 307560 + }, + { + "epoch": 1.55, + "learning_rate": 6.724046596808451e-05, + "loss": 0.0057, + "step": 307570 + }, + { + "epoch": 1.55, + "learning_rate": 6.723289827507049e-05, + "loss": 0.011, + "step": 307580 + }, + { + "epoch": 1.55, + "learning_rate": 6.722533058205649e-05, + "loss": 0.0045, + "step": 307590 + }, + { + "epoch": 1.55, + "learning_rate": 6.721776288904248e-05, + "loss": 0.0067, + "step": 307600 + }, + { + "epoch": 1.55, + "learning_rate": 6.721019519602846e-05, + "loss": 0.0079, + "step": 307610 + }, + { + "epoch": 1.55, + "learning_rate": 6.720262750301446e-05, + "loss": 0.0064, + "step": 307620 + }, + { + "epoch": 1.55, + "learning_rate": 6.719505981000045e-05, + "loss": 0.0074, + "step": 307630 + }, + { + "epoch": 1.55, + "learning_rate": 6.718749211698644e-05, + "loss": 0.0046, + "step": 307640 + }, + { + "epoch": 1.55, + "learning_rate": 6.717992442397243e-05, + "loss": 0.0071, + "step": 307650 + }, + { + "epoch": 1.55, + "learning_rate": 6.717235673095841e-05, + "loss": 0.0054, + "step": 307660 + }, + { + "epoch": 1.55, + "learning_rate": 6.716478903794441e-05, + "loss": 0.0056, + "step": 307670 + }, + { + "epoch": 1.55, + "learning_rate": 6.71572213449304e-05, + "loss": 0.0076, + "step": 307680 + }, + { + "epoch": 1.55, + "learning_rate": 6.714965365191638e-05, + "loss": 0.0085, + "step": 307690 + }, + { + "epoch": 1.55, + "learning_rate": 6.714208595890238e-05, + "loss": 0.007, + "step": 307700 + }, + { + "epoch": 1.55, + "learning_rate": 6.713451826588837e-05, + "loss": 0.0072, + "step": 307710 + }, + { + "epoch": 1.55, + "learning_rate": 6.712695057287436e-05, + "loss": 0.0068, + "step": 307720 + }, + { + "epoch": 1.55, + "learning_rate": 6.711938287986035e-05, + "loss": 0.0056, + "step": 307730 + }, + { + "epoch": 1.55, + "learning_rate": 6.711181518684633e-05, + "loss": 0.0065, + "step": 307740 + }, + { + "epoch": 1.55, + "learning_rate": 6.710424749383233e-05, + "loss": 0.0054, + "step": 307750 + }, + { + "epoch": 1.55, + "learning_rate": 6.709667980081832e-05, + "loss": 0.0056, + "step": 307760 + }, + { + "epoch": 1.55, + "learning_rate": 6.70891121078043e-05, + "loss": 0.0088, + "step": 307770 + }, + { + "epoch": 1.55, + "learning_rate": 6.70815444147903e-05, + "loss": 0.0073, + "step": 307780 + }, + { + "epoch": 1.55, + "learning_rate": 6.707397672177628e-05, + "loss": 0.008, + "step": 307790 + }, + { + "epoch": 1.55, + "learning_rate": 6.706640902876227e-05, + "loss": 0.0063, + "step": 307800 + }, + { + "epoch": 1.55, + "learning_rate": 6.705884133574826e-05, + "loss": 0.0079, + "step": 307810 + }, + { + "epoch": 1.55, + "learning_rate": 6.705127364273425e-05, + "loss": 0.0056, + "step": 307820 + }, + { + "epoch": 1.55, + "learning_rate": 6.704370594972023e-05, + "loss": 0.0079, + "step": 307830 + }, + { + "epoch": 1.55, + "learning_rate": 6.703613825670623e-05, + "loss": 0.007, + "step": 307840 + }, + { + "epoch": 1.55, + "learning_rate": 6.702857056369222e-05, + "loss": 0.0076, + "step": 307850 + }, + { + "epoch": 1.55, + "learning_rate": 6.70210028706782e-05, + "loss": 0.0084, + "step": 307860 + }, + { + "epoch": 1.55, + "learning_rate": 6.70134351776642e-05, + "loss": 0.0082, + "step": 307870 + }, + { + "epoch": 1.55, + "learning_rate": 6.70058674846502e-05, + "loss": 0.0076, + "step": 307880 + }, + { + "epoch": 1.55, + "learning_rate": 6.699829979163618e-05, + "loss": 0.0079, + "step": 307890 + }, + { + "epoch": 1.55, + "learning_rate": 6.699073209862217e-05, + "loss": 0.0054, + "step": 307900 + }, + { + "epoch": 1.55, + "learning_rate": 6.698316440560817e-05, + "loss": 0.0069, + "step": 307910 + }, + { + "epoch": 1.55, + "learning_rate": 6.697559671259415e-05, + "loss": 0.0058, + "step": 307920 + }, + { + "epoch": 1.55, + "learning_rate": 6.696802901958014e-05, + "loss": 0.0079, + "step": 307930 + }, + { + "epoch": 1.55, + "learning_rate": 6.696046132656612e-05, + "loss": 0.0084, + "step": 307940 + }, + { + "epoch": 1.55, + "learning_rate": 6.695289363355212e-05, + "loss": 0.0076, + "step": 307950 + }, + { + "epoch": 1.55, + "learning_rate": 6.694532594053811e-05, + "loss": 0.006, + "step": 307960 + }, + { + "epoch": 1.55, + "learning_rate": 6.69377582475241e-05, + "loss": 0.0067, + "step": 307970 + }, + { + "epoch": 1.55, + "learning_rate": 6.693019055451009e-05, + "loss": 0.0098, + "step": 307980 + }, + { + "epoch": 1.55, + "learning_rate": 6.692262286149608e-05, + "loss": 0.0056, + "step": 307990 + }, + { + "epoch": 1.55, + "learning_rate": 6.691505516848207e-05, + "loss": 0.0078, + "step": 308000 + }, + { + "epoch": 1.55, + "eval_cer": 0.9144828710527925, + "eval_loss": 0.005395396146923304, + "eval_runtime": 116.4162, + "eval_samples_per_second": 17.18, + "eval_steps_per_second": 4.295, + "step": 308000 + }, + { + "epoch": 1.55, + "learning_rate": 6.690748747546806e-05, + "loss": 0.006, + "step": 308010 + }, + { + "epoch": 1.55, + "learning_rate": 6.689991978245404e-05, + "loss": 0.0053, + "step": 308020 + }, + { + "epoch": 1.55, + "learning_rate": 6.689235208944004e-05, + "loss": 0.0059, + "step": 308030 + }, + { + "epoch": 1.55, + "learning_rate": 6.688478439642603e-05, + "loss": 0.0071, + "step": 308040 + }, + { + "epoch": 1.55, + "learning_rate": 6.687721670341201e-05, + "loss": 0.0075, + "step": 308050 + }, + { + "epoch": 1.55, + "learning_rate": 6.686964901039801e-05, + "loss": 0.0048, + "step": 308060 + }, + { + "epoch": 1.55, + "learning_rate": 6.6862081317384e-05, + "loss": 0.0096, + "step": 308070 + }, + { + "epoch": 1.55, + "learning_rate": 6.685451362436999e-05, + "loss": 0.0086, + "step": 308080 + }, + { + "epoch": 1.55, + "learning_rate": 6.684694593135598e-05, + "loss": 0.0062, + "step": 308090 + }, + { + "epoch": 1.55, + "learning_rate": 6.683937823834196e-05, + "loss": 0.0048, + "step": 308100 + }, + { + "epoch": 1.55, + "learning_rate": 6.683181054532794e-05, + "loss": 0.0063, + "step": 308110 + }, + { + "epoch": 1.55, + "learning_rate": 6.682424285231394e-05, + "loss": 0.0091, + "step": 308120 + }, + { + "epoch": 1.55, + "learning_rate": 6.681667515929993e-05, + "loss": 0.006, + "step": 308130 + }, + { + "epoch": 1.55, + "learning_rate": 6.680910746628591e-05, + "loss": 0.0075, + "step": 308140 + }, + { + "epoch": 1.55, + "learning_rate": 6.680153977327191e-05, + "loss": 0.0061, + "step": 308150 + }, + { + "epoch": 1.55, + "learning_rate": 6.67939720802579e-05, + "loss": 0.0084, + "step": 308160 + }, + { + "epoch": 1.55, + "learning_rate": 6.678640438724389e-05, + "loss": 0.0074, + "step": 308170 + }, + { + "epoch": 1.55, + "learning_rate": 6.677883669422988e-05, + "loss": 0.0083, + "step": 308180 + }, + { + "epoch": 1.55, + "learning_rate": 6.677126900121586e-05, + "loss": 0.0069, + "step": 308190 + }, + { + "epoch": 1.55, + "learning_rate": 6.676370130820186e-05, + "loss": 0.0066, + "step": 308200 + }, + { + "epoch": 1.55, + "learning_rate": 6.675613361518785e-05, + "loss": 0.007, + "step": 308210 + }, + { + "epoch": 1.56, + "learning_rate": 6.674856592217383e-05, + "loss": 0.0074, + "step": 308220 + }, + { + "epoch": 1.56, + "learning_rate": 6.674099822915983e-05, + "loss": 0.0068, + "step": 308230 + }, + { + "epoch": 1.56, + "learning_rate": 6.673343053614582e-05, + "loss": 0.0075, + "step": 308240 + }, + { + "epoch": 1.56, + "learning_rate": 6.67258628431318e-05, + "loss": 0.0067, + "step": 308250 + }, + { + "epoch": 1.56, + "learning_rate": 6.67182951501178e-05, + "loss": 0.0096, + "step": 308260 + }, + { + "epoch": 1.56, + "learning_rate": 6.671072745710378e-05, + "loss": 0.0067, + "step": 308270 + }, + { + "epoch": 1.56, + "learning_rate": 6.670315976408978e-05, + "loss": 0.0069, + "step": 308280 + }, + { + "epoch": 1.56, + "learning_rate": 6.669559207107577e-05, + "loss": 0.0078, + "step": 308290 + }, + { + "epoch": 1.56, + "learning_rate": 6.668802437806175e-05, + "loss": 0.0092, + "step": 308300 + }, + { + "epoch": 1.56, + "learning_rate": 6.668045668504775e-05, + "loss": 0.0076, + "step": 308310 + }, + { + "epoch": 1.56, + "learning_rate": 6.667288899203374e-05, + "loss": 0.0076, + "step": 308320 + }, + { + "epoch": 1.56, + "learning_rate": 6.666532129901972e-05, + "loss": 0.0058, + "step": 308330 + }, + { + "epoch": 1.56, + "learning_rate": 6.665775360600572e-05, + "loss": 0.0059, + "step": 308340 + }, + { + "epoch": 1.56, + "learning_rate": 6.66501859129917e-05, + "loss": 0.0076, + "step": 308350 + }, + { + "epoch": 1.56, + "learning_rate": 6.66426182199777e-05, + "loss": 0.0062, + "step": 308360 + }, + { + "epoch": 1.56, + "learning_rate": 6.663505052696369e-05, + "loss": 0.0086, + "step": 308370 + }, + { + "epoch": 1.56, + "learning_rate": 6.662748283394967e-05, + "loss": 0.0079, + "step": 308380 + }, + { + "epoch": 1.56, + "learning_rate": 6.661991514093567e-05, + "loss": 0.0084, + "step": 308390 + }, + { + "epoch": 1.56, + "learning_rate": 6.661234744792166e-05, + "loss": 0.0066, + "step": 308400 + }, + { + "epoch": 1.56, + "learning_rate": 6.660477975490764e-05, + "loss": 0.0073, + "step": 308410 + }, + { + "epoch": 1.56, + "learning_rate": 6.659721206189363e-05, + "loss": 0.0106, + "step": 308420 + }, + { + "epoch": 1.56, + "learning_rate": 6.658964436887962e-05, + "loss": 0.0071, + "step": 308430 + }, + { + "epoch": 1.56, + "learning_rate": 6.658207667586562e-05, + "loss": 0.0098, + "step": 308440 + }, + { + "epoch": 1.56, + "learning_rate": 6.65745089828516e-05, + "loss": 0.0068, + "step": 308450 + }, + { + "epoch": 1.56, + "learning_rate": 6.656694128983759e-05, + "loss": 0.0061, + "step": 308460 + }, + { + "epoch": 1.56, + "learning_rate": 6.655937359682357e-05, + "loss": 0.0077, + "step": 308470 + }, + { + "epoch": 1.56, + "learning_rate": 6.655180590380957e-05, + "loss": 0.0062, + "step": 308480 + }, + { + "epoch": 1.56, + "learning_rate": 6.654423821079556e-05, + "loss": 0.0051, + "step": 308490 + }, + { + "epoch": 1.56, + "learning_rate": 6.653667051778154e-05, + "loss": 0.0074, + "step": 308500 + }, + { + "epoch": 1.56, + "learning_rate": 6.652910282476754e-05, + "loss": 0.0078, + "step": 308510 + }, + { + "epoch": 1.56, + "learning_rate": 6.652153513175353e-05, + "loss": 0.0066, + "step": 308520 + }, + { + "epoch": 1.56, + "learning_rate": 6.651396743873952e-05, + "loss": 0.0079, + "step": 308530 + }, + { + "epoch": 1.56, + "learning_rate": 6.650639974572551e-05, + "loss": 0.0084, + "step": 308540 + }, + { + "epoch": 1.56, + "learning_rate": 6.649883205271149e-05, + "loss": 0.006, + "step": 308550 + }, + { + "epoch": 1.56, + "learning_rate": 6.649126435969749e-05, + "loss": 0.0072, + "step": 308560 + }, + { + "epoch": 1.56, + "learning_rate": 6.648369666668348e-05, + "loss": 0.0064, + "step": 308570 + }, + { + "epoch": 1.56, + "learning_rate": 6.647612897366946e-05, + "loss": 0.008, + "step": 308580 + }, + { + "epoch": 1.56, + "learning_rate": 6.646856128065546e-05, + "loss": 0.0065, + "step": 308590 + }, + { + "epoch": 1.56, + "learning_rate": 6.646099358764145e-05, + "loss": 0.0066, + "step": 308600 + }, + { + "epoch": 1.56, + "learning_rate": 6.645342589462744e-05, + "loss": 0.0071, + "step": 308610 + }, + { + "epoch": 1.56, + "learning_rate": 6.644585820161343e-05, + "loss": 0.011, + "step": 308620 + }, + { + "epoch": 1.56, + "learning_rate": 6.643829050859941e-05, + "loss": 0.0062, + "step": 308630 + }, + { + "epoch": 1.56, + "learning_rate": 6.64307228155854e-05, + "loss": 0.0068, + "step": 308640 + }, + { + "epoch": 1.56, + "learning_rate": 6.64231551225714e-05, + "loss": 0.0056, + "step": 308650 + }, + { + "epoch": 1.56, + "learning_rate": 6.641558742955738e-05, + "loss": 0.0078, + "step": 308660 + }, + { + "epoch": 1.56, + "learning_rate": 6.640801973654338e-05, + "loss": 0.006, + "step": 308670 + }, + { + "epoch": 1.56, + "learning_rate": 6.640045204352937e-05, + "loss": 0.0074, + "step": 308680 + }, + { + "epoch": 1.56, + "learning_rate": 6.639288435051535e-05, + "loss": 0.0064, + "step": 308690 + }, + { + "epoch": 1.56, + "learning_rate": 6.638531665750135e-05, + "loss": 0.0081, + "step": 308700 + }, + { + "epoch": 1.56, + "learning_rate": 6.637774896448733e-05, + "loss": 0.0063, + "step": 308710 + }, + { + "epoch": 1.56, + "learning_rate": 6.637018127147333e-05, + "loss": 0.007, + "step": 308720 + }, + { + "epoch": 1.56, + "learning_rate": 6.636261357845931e-05, + "loss": 0.0086, + "step": 308730 + }, + { + "epoch": 1.56, + "learning_rate": 6.63550458854453e-05, + "loss": 0.008, + "step": 308740 + }, + { + "epoch": 1.56, + "learning_rate": 6.634747819243128e-05, + "loss": 0.0072, + "step": 308750 + }, + { + "epoch": 1.56, + "learning_rate": 6.633991049941728e-05, + "loss": 0.0061, + "step": 308760 + }, + { + "epoch": 1.56, + "learning_rate": 6.633234280640327e-05, + "loss": 0.0095, + "step": 308770 + }, + { + "epoch": 1.56, + "learning_rate": 6.632477511338926e-05, + "loss": 0.006, + "step": 308780 + }, + { + "epoch": 1.56, + "learning_rate": 6.631720742037525e-05, + "loss": 0.0078, + "step": 308790 + }, + { + "epoch": 1.56, + "learning_rate": 6.630963972736123e-05, + "loss": 0.0055, + "step": 308800 + }, + { + "epoch": 1.56, + "learning_rate": 6.630207203434723e-05, + "loss": 0.008, + "step": 308810 + }, + { + "epoch": 1.56, + "learning_rate": 6.629450434133322e-05, + "loss": 0.0083, + "step": 308820 + }, + { + "epoch": 1.56, + "learning_rate": 6.62869366483192e-05, + "loss": 0.007, + "step": 308830 + }, + { + "epoch": 1.56, + "learning_rate": 6.62793689553052e-05, + "loss": 0.0086, + "step": 308840 + }, + { + "epoch": 1.56, + "learning_rate": 6.627180126229119e-05, + "loss": 0.0069, + "step": 308850 + }, + { + "epoch": 1.56, + "learning_rate": 6.626423356927717e-05, + "loss": 0.0089, + "step": 308860 + }, + { + "epoch": 1.56, + "learning_rate": 6.625666587626317e-05, + "loss": 0.0047, + "step": 308870 + }, + { + "epoch": 1.56, + "learning_rate": 6.624909818324916e-05, + "loss": 0.0088, + "step": 308880 + }, + { + "epoch": 1.56, + "learning_rate": 6.624153049023515e-05, + "loss": 0.008, + "step": 308890 + }, + { + "epoch": 1.56, + "learning_rate": 6.623396279722114e-05, + "loss": 0.0058, + "step": 308900 + }, + { + "epoch": 1.56, + "learning_rate": 6.622639510420712e-05, + "loss": 0.0088, + "step": 308910 + }, + { + "epoch": 1.56, + "learning_rate": 6.621882741119312e-05, + "loss": 0.0094, + "step": 308920 + }, + { + "epoch": 1.56, + "learning_rate": 6.621125971817911e-05, + "loss": 0.0074, + "step": 308930 + }, + { + "epoch": 1.56, + "learning_rate": 6.62036920251651e-05, + "loss": 0.0065, + "step": 308940 + }, + { + "epoch": 1.56, + "learning_rate": 6.619612433215109e-05, + "loss": 0.0074, + "step": 308950 + }, + { + "epoch": 1.56, + "learning_rate": 6.618855663913708e-05, + "loss": 0.007, + "step": 308960 + }, + { + "epoch": 1.56, + "learning_rate": 6.618098894612307e-05, + "loss": 0.0071, + "step": 308970 + }, + { + "epoch": 1.56, + "learning_rate": 6.617342125310906e-05, + "loss": 0.0077, + "step": 308980 + }, + { + "epoch": 1.56, + "learning_rate": 6.616585356009504e-05, + "loss": 0.0065, + "step": 308990 + }, + { + "epoch": 1.56, + "learning_rate": 6.615828586708104e-05, + "loss": 0.0052, + "step": 309000 + }, + { + "epoch": 1.56, + "eval_cer": 0.9144654039225352, + "eval_loss": 0.005355709232389927, + "eval_runtime": 116.4345, + "eval_samples_per_second": 17.177, + "eval_steps_per_second": 4.294, + "step": 309000 + }, + { + "epoch": 1.56, + "learning_rate": 6.615071817406703e-05, + "loss": 0.0082, + "step": 309010 + }, + { + "epoch": 1.56, + "learning_rate": 6.614315048105301e-05, + "loss": 0.0056, + "step": 309020 + }, + { + "epoch": 1.56, + "learning_rate": 6.613558278803901e-05, + "loss": 0.0066, + "step": 309030 + }, + { + "epoch": 1.56, + "learning_rate": 6.612801509502499e-05, + "loss": 0.0057, + "step": 309040 + }, + { + "epoch": 1.56, + "learning_rate": 6.612044740201098e-05, + "loss": 0.0063, + "step": 309050 + }, + { + "epoch": 1.56, + "learning_rate": 6.611287970899697e-05, + "loss": 0.0065, + "step": 309060 + }, + { + "epoch": 1.56, + "learning_rate": 6.610531201598296e-05, + "loss": 0.0085, + "step": 309070 + }, + { + "epoch": 1.56, + "learning_rate": 6.609774432296894e-05, + "loss": 0.0082, + "step": 309080 + }, + { + "epoch": 1.56, + "learning_rate": 6.609017662995494e-05, + "loss": 0.0081, + "step": 309090 + }, + { + "epoch": 1.56, + "learning_rate": 6.608260893694093e-05, + "loss": 0.0068, + "step": 309100 + }, + { + "epoch": 1.56, + "learning_rate": 6.607504124392691e-05, + "loss": 0.0075, + "step": 309110 + }, + { + "epoch": 1.56, + "learning_rate": 6.606747355091291e-05, + "loss": 0.006, + "step": 309120 + }, + { + "epoch": 1.56, + "learning_rate": 6.60599058578989e-05, + "loss": 0.0046, + "step": 309130 + }, + { + "epoch": 1.56, + "learning_rate": 6.605233816488489e-05, + "loss": 0.0077, + "step": 309140 + }, + { + "epoch": 1.56, + "learning_rate": 6.604477047187088e-05, + "loss": 0.0083, + "step": 309150 + }, + { + "epoch": 1.56, + "learning_rate": 6.603720277885686e-05, + "loss": 0.0071, + "step": 309160 + }, + { + "epoch": 1.56, + "learning_rate": 6.602963508584286e-05, + "loss": 0.0089, + "step": 309170 + }, + { + "epoch": 1.56, + "learning_rate": 6.602206739282885e-05, + "loss": 0.0094, + "step": 309180 + }, + { + "epoch": 1.56, + "learning_rate": 6.601449969981483e-05, + "loss": 0.0074, + "step": 309190 + }, + { + "epoch": 1.56, + "learning_rate": 6.600693200680083e-05, + "loss": 0.0073, + "step": 309200 + }, + { + "epoch": 1.56, + "learning_rate": 6.599936431378682e-05, + "loss": 0.0079, + "step": 309210 + }, + { + "epoch": 1.56, + "learning_rate": 6.59917966207728e-05, + "loss": 0.0078, + "step": 309220 + }, + { + "epoch": 1.56, + "learning_rate": 6.59842289277588e-05, + "loss": 0.0074, + "step": 309230 + }, + { + "epoch": 1.56, + "learning_rate": 6.597666123474478e-05, + "loss": 0.006, + "step": 309240 + }, + { + "epoch": 1.56, + "learning_rate": 6.596909354173078e-05, + "loss": 0.0065, + "step": 309250 + }, + { + "epoch": 1.56, + "learning_rate": 6.596152584871677e-05, + "loss": 0.0091, + "step": 309260 + }, + { + "epoch": 1.56, + "learning_rate": 6.595395815570275e-05, + "loss": 0.0084, + "step": 309270 + }, + { + "epoch": 1.56, + "learning_rate": 6.594639046268875e-05, + "loss": 0.0071, + "step": 309280 + }, + { + "epoch": 1.56, + "learning_rate": 6.593882276967474e-05, + "loss": 0.007, + "step": 309290 + }, + { + "epoch": 1.56, + "learning_rate": 6.593125507666072e-05, + "loss": 0.0074, + "step": 309300 + }, + { + "epoch": 1.56, + "learning_rate": 6.592368738364672e-05, + "loss": 0.0062, + "step": 309310 + }, + { + "epoch": 1.56, + "learning_rate": 6.59161196906327e-05, + "loss": 0.0062, + "step": 309320 + }, + { + "epoch": 1.56, + "learning_rate": 6.59085519976187e-05, + "loss": 0.0055, + "step": 309330 + }, + { + "epoch": 1.56, + "learning_rate": 6.590098430460469e-05, + "loss": 0.0056, + "step": 309340 + }, + { + "epoch": 1.56, + "learning_rate": 6.589341661159067e-05, + "loss": 0.0068, + "step": 309350 + }, + { + "epoch": 1.56, + "learning_rate": 6.588584891857665e-05, + "loss": 0.0082, + "step": 309360 + }, + { + "epoch": 1.56, + "learning_rate": 6.587828122556265e-05, + "loss": 0.0057, + "step": 309370 + }, + { + "epoch": 1.56, + "learning_rate": 6.587071353254864e-05, + "loss": 0.0072, + "step": 309380 + }, + { + "epoch": 1.56, + "learning_rate": 6.586314583953462e-05, + "loss": 0.0054, + "step": 309390 + }, + { + "epoch": 1.56, + "learning_rate": 6.585557814652062e-05, + "loss": 0.0064, + "step": 309400 + }, + { + "epoch": 1.56, + "learning_rate": 6.584801045350661e-05, + "loss": 0.0051, + "step": 309410 + }, + { + "epoch": 1.56, + "learning_rate": 6.58404427604926e-05, + "loss": 0.0063, + "step": 309420 + }, + { + "epoch": 1.56, + "learning_rate": 6.583287506747859e-05, + "loss": 0.0069, + "step": 309430 + }, + { + "epoch": 1.56, + "learning_rate": 6.582530737446457e-05, + "loss": 0.0074, + "step": 309440 + }, + { + "epoch": 1.56, + "learning_rate": 6.581773968145057e-05, + "loss": 0.0085, + "step": 309450 + }, + { + "epoch": 1.56, + "learning_rate": 6.581017198843656e-05, + "loss": 0.0067, + "step": 309460 + }, + { + "epoch": 1.56, + "learning_rate": 6.580260429542254e-05, + "loss": 0.0057, + "step": 309470 + }, + { + "epoch": 1.56, + "learning_rate": 6.579503660240854e-05, + "loss": 0.0059, + "step": 309480 + }, + { + "epoch": 1.56, + "learning_rate": 6.578746890939453e-05, + "loss": 0.0066, + "step": 309490 + }, + { + "epoch": 1.56, + "learning_rate": 6.577990121638052e-05, + "loss": 0.0068, + "step": 309500 + }, + { + "epoch": 1.56, + "learning_rate": 6.577233352336651e-05, + "loss": 0.0071, + "step": 309510 + }, + { + "epoch": 1.56, + "learning_rate": 6.576476583035249e-05, + "loss": 0.0051, + "step": 309520 + }, + { + "epoch": 1.56, + "learning_rate": 6.575719813733849e-05, + "loss": 0.0078, + "step": 309530 + }, + { + "epoch": 1.56, + "learning_rate": 6.574963044432448e-05, + "loss": 0.0099, + "step": 309540 + }, + { + "epoch": 1.56, + "learning_rate": 6.574206275131046e-05, + "loss": 0.0066, + "step": 309550 + }, + { + "epoch": 1.56, + "learning_rate": 6.573449505829646e-05, + "loss": 0.0068, + "step": 309560 + }, + { + "epoch": 1.56, + "learning_rate": 6.572692736528245e-05, + "loss": 0.0096, + "step": 309570 + }, + { + "epoch": 1.56, + "learning_rate": 6.571935967226843e-05, + "loss": 0.0057, + "step": 309580 + }, + { + "epoch": 1.56, + "learning_rate": 6.571179197925443e-05, + "loss": 0.0083, + "step": 309590 + }, + { + "epoch": 1.56, + "learning_rate": 6.570422428624041e-05, + "loss": 0.0078, + "step": 309600 + }, + { + "epoch": 1.56, + "learning_rate": 6.56966565932264e-05, + "loss": 0.0067, + "step": 309610 + }, + { + "epoch": 1.56, + "learning_rate": 6.56890889002124e-05, + "loss": 0.0077, + "step": 309620 + }, + { + "epoch": 1.56, + "learning_rate": 6.568152120719838e-05, + "loss": 0.0077, + "step": 309630 + }, + { + "epoch": 1.56, + "learning_rate": 6.567395351418438e-05, + "loss": 0.0062, + "step": 309640 + }, + { + "epoch": 1.56, + "learning_rate": 6.566638582117037e-05, + "loss": 0.0069, + "step": 309650 + }, + { + "epoch": 1.56, + "learning_rate": 6.565881812815635e-05, + "loss": 0.0068, + "step": 309660 + }, + { + "epoch": 1.56, + "learning_rate": 6.565125043514234e-05, + "loss": 0.0048, + "step": 309670 + }, + { + "epoch": 1.56, + "learning_rate": 6.564368274212833e-05, + "loss": 0.0072, + "step": 309680 + }, + { + "epoch": 1.56, + "learning_rate": 6.563611504911431e-05, + "loss": 0.0064, + "step": 309690 + }, + { + "epoch": 1.56, + "learning_rate": 6.562854735610031e-05, + "loss": 0.0038, + "step": 309700 + }, + { + "epoch": 1.56, + "learning_rate": 6.56209796630863e-05, + "loss": 0.0061, + "step": 309710 + }, + { + "epoch": 1.56, + "learning_rate": 6.561341197007228e-05, + "loss": 0.0047, + "step": 309720 + }, + { + "epoch": 1.56, + "learning_rate": 6.560584427705828e-05, + "loss": 0.0103, + "step": 309730 + }, + { + "epoch": 1.56, + "learning_rate": 6.559827658404427e-05, + "loss": 0.0058, + "step": 309740 + }, + { + "epoch": 1.56, + "learning_rate": 6.559070889103025e-05, + "loss": 0.0065, + "step": 309750 + }, + { + "epoch": 1.56, + "learning_rate": 6.558314119801625e-05, + "loss": 0.0057, + "step": 309760 + }, + { + "epoch": 1.56, + "learning_rate": 6.557557350500223e-05, + "loss": 0.0065, + "step": 309770 + }, + { + "epoch": 1.56, + "learning_rate": 6.556800581198823e-05, + "loss": 0.0057, + "step": 309780 + }, + { + "epoch": 1.56, + "learning_rate": 6.556043811897422e-05, + "loss": 0.0079, + "step": 309790 + }, + { + "epoch": 1.56, + "learning_rate": 6.55528704259602e-05, + "loss": 0.0057, + "step": 309800 + }, + { + "epoch": 1.56, + "learning_rate": 6.55453027329462e-05, + "loss": 0.0073, + "step": 309810 + }, + { + "epoch": 1.56, + "learning_rate": 6.553773503993219e-05, + "loss": 0.0065, + "step": 309820 + }, + { + "epoch": 1.56, + "learning_rate": 6.553016734691817e-05, + "loss": 0.0079, + "step": 309830 + }, + { + "epoch": 1.56, + "learning_rate": 6.552259965390417e-05, + "loss": 0.008, + "step": 309840 + }, + { + "epoch": 1.56, + "learning_rate": 6.551503196089016e-05, + "loss": 0.0057, + "step": 309850 + }, + { + "epoch": 1.56, + "learning_rate": 6.550746426787615e-05, + "loss": 0.008, + "step": 309860 + }, + { + "epoch": 1.56, + "learning_rate": 6.549989657486214e-05, + "loss": 0.0053, + "step": 309870 + }, + { + "epoch": 1.56, + "learning_rate": 6.549232888184812e-05, + "loss": 0.0069, + "step": 309880 + }, + { + "epoch": 1.56, + "learning_rate": 6.548476118883412e-05, + "loss": 0.0066, + "step": 309890 + }, + { + "epoch": 1.56, + "learning_rate": 6.547719349582011e-05, + "loss": 0.0072, + "step": 309900 + }, + { + "epoch": 1.56, + "learning_rate": 6.54696258028061e-05, + "loss": 0.0085, + "step": 309910 + }, + { + "epoch": 1.56, + "learning_rate": 6.546205810979209e-05, + "loss": 0.0072, + "step": 309920 + }, + { + "epoch": 1.56, + "learning_rate": 6.545449041677808e-05, + "loss": 0.0072, + "step": 309930 + }, + { + "epoch": 1.56, + "learning_rate": 6.544692272376406e-05, + "loss": 0.0106, + "step": 309940 + }, + { + "epoch": 1.56, + "learning_rate": 6.543935503075006e-05, + "loss": 0.0073, + "step": 309950 + }, + { + "epoch": 1.56, + "learning_rate": 6.543178733773604e-05, + "loss": 0.008, + "step": 309960 + }, + { + "epoch": 1.56, + "learning_rate": 6.542421964472204e-05, + "loss": 0.0071, + "step": 309970 + }, + { + "epoch": 1.56, + "learning_rate": 6.541665195170802e-05, + "loss": 0.0087, + "step": 309980 + }, + { + "epoch": 1.56, + "learning_rate": 6.540908425869401e-05, + "loss": 0.009, + "step": 309990 + }, + { + "epoch": 1.56, + "learning_rate": 6.540151656568e-05, + "loss": 0.0062, + "step": 310000 + }, + { + "epoch": 1.56, + "eval_cer": 0.9144556999612812, + "eval_loss": 0.005289402790367603, + "eval_runtime": 116.4374, + "eval_samples_per_second": 17.177, + "eval_steps_per_second": 4.294, + "step": 310000 + }, + { + "epoch": 1.56, + "learning_rate": 6.539394887266599e-05, + "loss": 0.0071, + "step": 310010 + }, + { + "epoch": 1.56, + "learning_rate": 6.538638117965198e-05, + "loss": 0.0064, + "step": 310020 + }, + { + "epoch": 1.56, + "learning_rate": 6.537881348663797e-05, + "loss": 0.008, + "step": 310030 + }, + { + "epoch": 1.56, + "learning_rate": 6.537124579362396e-05, + "loss": 0.0061, + "step": 310040 + }, + { + "epoch": 1.56, + "learning_rate": 6.536367810060994e-05, + "loss": 0.0065, + "step": 310050 + }, + { + "epoch": 1.56, + "learning_rate": 6.535611040759594e-05, + "loss": 0.0053, + "step": 310060 + }, + { + "epoch": 1.56, + "learning_rate": 6.534854271458193e-05, + "loss": 0.0089, + "step": 310070 + }, + { + "epoch": 1.56, + "learning_rate": 6.534097502156791e-05, + "loss": 0.0059, + "step": 310080 + }, + { + "epoch": 1.56, + "learning_rate": 6.533340732855391e-05, + "loss": 0.008, + "step": 310090 + }, + { + "epoch": 1.56, + "learning_rate": 6.53258396355399e-05, + "loss": 0.0063, + "step": 310100 + }, + { + "epoch": 1.56, + "learning_rate": 6.531827194252588e-05, + "loss": 0.0075, + "step": 310110 + }, + { + "epoch": 1.56, + "learning_rate": 6.531070424951188e-05, + "loss": 0.0075, + "step": 310120 + }, + { + "epoch": 1.56, + "learning_rate": 6.530313655649786e-05, + "loss": 0.0068, + "step": 310130 + }, + { + "epoch": 1.56, + "learning_rate": 6.529556886348386e-05, + "loss": 0.0083, + "step": 310140 + }, + { + "epoch": 1.56, + "learning_rate": 6.528800117046985e-05, + "loss": 0.006, + "step": 310150 + }, + { + "epoch": 1.56, + "learning_rate": 6.528043347745583e-05, + "loss": 0.0073, + "step": 310160 + }, + { + "epoch": 1.56, + "learning_rate": 6.527286578444183e-05, + "loss": 0.0054, + "step": 310170 + }, + { + "epoch": 1.56, + "learning_rate": 6.526529809142782e-05, + "loss": 0.006, + "step": 310180 + }, + { + "epoch": 1.56, + "learning_rate": 6.52577303984138e-05, + "loss": 0.0056, + "step": 310190 + }, + { + "epoch": 1.56, + "learning_rate": 6.52501627053998e-05, + "loss": 0.0058, + "step": 310200 + }, + { + "epoch": 1.57, + "learning_rate": 6.524259501238578e-05, + "loss": 0.0086, + "step": 310210 + }, + { + "epoch": 1.57, + "learning_rate": 6.523502731937178e-05, + "loss": 0.0056, + "step": 310220 + }, + { + "epoch": 1.57, + "learning_rate": 6.522745962635777e-05, + "loss": 0.0059, + "step": 310230 + }, + { + "epoch": 1.57, + "learning_rate": 6.521989193334375e-05, + "loss": 0.0073, + "step": 310240 + }, + { + "epoch": 1.57, + "learning_rate": 6.521232424032975e-05, + "loss": 0.0052, + "step": 310250 + }, + { + "epoch": 1.57, + "learning_rate": 6.520475654731574e-05, + "loss": 0.0063, + "step": 310260 + }, + { + "epoch": 1.57, + "learning_rate": 6.519718885430172e-05, + "loss": 0.0072, + "step": 310270 + }, + { + "epoch": 1.57, + "learning_rate": 6.518962116128772e-05, + "loss": 0.0068, + "step": 310280 + }, + { + "epoch": 1.57, + "learning_rate": 6.51820534682737e-05, + "loss": 0.0062, + "step": 310290 + }, + { + "epoch": 1.57, + "learning_rate": 6.51744857752597e-05, + "loss": 0.0074, + "step": 310300 + }, + { + "epoch": 1.57, + "learning_rate": 6.516691808224568e-05, + "loss": 0.0062, + "step": 310310 + }, + { + "epoch": 1.57, + "learning_rate": 6.515935038923167e-05, + "loss": 0.0067, + "step": 310320 + }, + { + "epoch": 1.57, + "learning_rate": 6.515178269621765e-05, + "loss": 0.0091, + "step": 310330 + }, + { + "epoch": 1.57, + "learning_rate": 6.514421500320365e-05, + "loss": 0.0099, + "step": 310340 + }, + { + "epoch": 1.57, + "learning_rate": 6.513664731018964e-05, + "loss": 0.0092, + "step": 310350 + }, + { + "epoch": 1.57, + "learning_rate": 6.512907961717562e-05, + "loss": 0.0072, + "step": 310360 + }, + { + "epoch": 1.57, + "learning_rate": 6.512151192416162e-05, + "loss": 0.0095, + "step": 310370 + }, + { + "epoch": 1.57, + "learning_rate": 6.511394423114761e-05, + "loss": 0.0074, + "step": 310380 + }, + { + "epoch": 1.57, + "learning_rate": 6.51063765381336e-05, + "loss": 0.0071, + "step": 310390 + }, + { + "epoch": 1.57, + "learning_rate": 6.509880884511959e-05, + "loss": 0.0075, + "step": 310400 + }, + { + "epoch": 1.57, + "learning_rate": 6.509124115210557e-05, + "loss": 0.0095, + "step": 310410 + }, + { + "epoch": 1.57, + "learning_rate": 6.508367345909157e-05, + "loss": 0.0077, + "step": 310420 + }, + { + "epoch": 1.57, + "learning_rate": 6.507610576607756e-05, + "loss": 0.0069, + "step": 310430 + }, + { + "epoch": 1.57, + "learning_rate": 6.506853807306354e-05, + "loss": 0.0061, + "step": 310440 + }, + { + "epoch": 1.57, + "learning_rate": 6.506097038004954e-05, + "loss": 0.0069, + "step": 310450 + }, + { + "epoch": 1.57, + "learning_rate": 6.505340268703553e-05, + "loss": 0.0079, + "step": 310460 + }, + { + "epoch": 1.57, + "learning_rate": 6.504583499402152e-05, + "loss": 0.005, + "step": 310470 + }, + { + "epoch": 1.57, + "learning_rate": 6.503826730100751e-05, + "loss": 0.0068, + "step": 310480 + }, + { + "epoch": 1.57, + "learning_rate": 6.503069960799349e-05, + "loss": 0.0088, + "step": 310490 + }, + { + "epoch": 1.57, + "learning_rate": 6.502313191497949e-05, + "loss": 0.0069, + "step": 310500 + }, + { + "epoch": 1.57, + "learning_rate": 6.501556422196548e-05, + "loss": 0.0059, + "step": 310510 + }, + { + "epoch": 1.57, + "learning_rate": 6.500799652895146e-05, + "loss": 0.0073, + "step": 310520 + }, + { + "epoch": 1.57, + "learning_rate": 6.500042883593746e-05, + "loss": 0.0067, + "step": 310530 + }, + { + "epoch": 1.57, + "learning_rate": 6.499286114292345e-05, + "loss": 0.0078, + "step": 310540 + }, + { + "epoch": 1.57, + "learning_rate": 6.498529344990943e-05, + "loss": 0.0056, + "step": 310550 + }, + { + "epoch": 1.57, + "learning_rate": 6.497772575689543e-05, + "loss": 0.0057, + "step": 310560 + }, + { + "epoch": 1.57, + "learning_rate": 6.497015806388141e-05, + "loss": 0.0079, + "step": 310570 + }, + { + "epoch": 1.57, + "learning_rate": 6.49625903708674e-05, + "loss": 0.0071, + "step": 310580 + }, + { + "epoch": 1.57, + "learning_rate": 6.49550226778534e-05, + "loss": 0.0073, + "step": 310590 + }, + { + "epoch": 1.57, + "learning_rate": 6.494745498483938e-05, + "loss": 0.0084, + "step": 310600 + }, + { + "epoch": 1.57, + "learning_rate": 6.493988729182536e-05, + "loss": 0.006, + "step": 310610 + }, + { + "epoch": 1.57, + "learning_rate": 6.493231959881136e-05, + "loss": 0.0061, + "step": 310620 + }, + { + "epoch": 1.57, + "learning_rate": 6.492475190579735e-05, + "loss": 0.0083, + "step": 310630 + }, + { + "epoch": 1.57, + "learning_rate": 6.491718421278334e-05, + "loss": 0.0067, + "step": 310640 + }, + { + "epoch": 1.57, + "learning_rate": 6.490961651976933e-05, + "loss": 0.0049, + "step": 310650 + }, + { + "epoch": 1.57, + "learning_rate": 6.490204882675531e-05, + "loss": 0.0057, + "step": 310660 + }, + { + "epoch": 1.57, + "learning_rate": 6.48944811337413e-05, + "loss": 0.0096, + "step": 310670 + }, + { + "epoch": 1.57, + "learning_rate": 6.48869134407273e-05, + "loss": 0.0073, + "step": 310680 + }, + { + "epoch": 1.57, + "learning_rate": 6.487934574771328e-05, + "loss": 0.008, + "step": 310690 + }, + { + "epoch": 1.57, + "learning_rate": 6.487177805469928e-05, + "loss": 0.0058, + "step": 310700 + }, + { + "epoch": 1.57, + "learning_rate": 6.486421036168527e-05, + "loss": 0.0095, + "step": 310710 + }, + { + "epoch": 1.57, + "learning_rate": 6.485664266867125e-05, + "loss": 0.0091, + "step": 310720 + }, + { + "epoch": 1.57, + "learning_rate": 6.484907497565725e-05, + "loss": 0.0083, + "step": 310730 + }, + { + "epoch": 1.57, + "learning_rate": 6.484150728264323e-05, + "loss": 0.0067, + "step": 310740 + }, + { + "epoch": 1.57, + "learning_rate": 6.483393958962923e-05, + "loss": 0.0064, + "step": 310750 + }, + { + "epoch": 1.57, + "learning_rate": 6.482637189661522e-05, + "loss": 0.0069, + "step": 310760 + }, + { + "epoch": 1.57, + "learning_rate": 6.48188042036012e-05, + "loss": 0.007, + "step": 310770 + }, + { + "epoch": 1.57, + "learning_rate": 6.48112365105872e-05, + "loss": 0.0091, + "step": 310780 + }, + { + "epoch": 1.57, + "learning_rate": 6.480366881757319e-05, + "loss": 0.0056, + "step": 310790 + }, + { + "epoch": 1.57, + "learning_rate": 6.479610112455917e-05, + "loss": 0.0063, + "step": 310800 + }, + { + "epoch": 1.57, + "learning_rate": 6.478853343154517e-05, + "loss": 0.0067, + "step": 310810 + }, + { + "epoch": 1.57, + "learning_rate": 6.478096573853116e-05, + "loss": 0.0068, + "step": 310820 + }, + { + "epoch": 1.57, + "learning_rate": 6.477339804551715e-05, + "loss": 0.008, + "step": 310830 + }, + { + "epoch": 1.57, + "learning_rate": 6.476583035250314e-05, + "loss": 0.0079, + "step": 310840 + }, + { + "epoch": 1.57, + "learning_rate": 6.475826265948912e-05, + "loss": 0.0058, + "step": 310850 + }, + { + "epoch": 1.57, + "learning_rate": 6.475069496647512e-05, + "loss": 0.0067, + "step": 310860 + }, + { + "epoch": 1.57, + "learning_rate": 6.474312727346111e-05, + "loss": 0.0081, + "step": 310870 + }, + { + "epoch": 1.57, + "learning_rate": 6.473555958044709e-05, + "loss": 0.0055, + "step": 310880 + }, + { + "epoch": 1.57, + "learning_rate": 6.472799188743309e-05, + "loss": 0.0061, + "step": 310890 + }, + { + "epoch": 1.57, + "learning_rate": 6.472042419441908e-05, + "loss": 0.0062, + "step": 310900 + }, + { + "epoch": 1.57, + "learning_rate": 6.471285650140506e-05, + "loss": 0.0057, + "step": 310910 + }, + { + "epoch": 1.57, + "learning_rate": 6.470528880839106e-05, + "loss": 0.0058, + "step": 310920 + }, + { + "epoch": 1.57, + "learning_rate": 6.469772111537704e-05, + "loss": 0.007, + "step": 310930 + }, + { + "epoch": 1.57, + "learning_rate": 6.469015342236302e-05, + "loss": 0.0061, + "step": 310940 + }, + { + "epoch": 1.57, + "learning_rate": 6.468258572934902e-05, + "loss": 0.0087, + "step": 310950 + }, + { + "epoch": 1.57, + "learning_rate": 6.467501803633501e-05, + "loss": 0.0065, + "step": 310960 + }, + { + "epoch": 1.57, + "learning_rate": 6.4667450343321e-05, + "loss": 0.0058, + "step": 310970 + }, + { + "epoch": 1.57, + "learning_rate": 6.465988265030699e-05, + "loss": 0.0079, + "step": 310980 + }, + { + "epoch": 1.57, + "learning_rate": 6.465231495729298e-05, + "loss": 0.0088, + "step": 310990 + }, + { + "epoch": 1.57, + "learning_rate": 6.464474726427897e-05, + "loss": 0.0083, + "step": 311000 + }, + { + "epoch": 1.57, + "eval_cer": 0.9144498775845288, + "eval_loss": 0.005227969028055668, + "eval_runtime": 116.309, + "eval_samples_per_second": 17.196, + "eval_steps_per_second": 4.299, + "step": 311000 + }, + { + "epoch": 1.57, + "learning_rate": 6.463717957126496e-05, + "loss": 0.0074, + "step": 311010 + }, + { + "epoch": 1.57, + "learning_rate": 6.462961187825094e-05, + "loss": 0.0069, + "step": 311020 + }, + { + "epoch": 1.57, + "learning_rate": 6.462204418523694e-05, + "loss": 0.0093, + "step": 311030 + }, + { + "epoch": 1.57, + "learning_rate": 6.461447649222293e-05, + "loss": 0.007, + "step": 311040 + }, + { + "epoch": 1.57, + "learning_rate": 6.460690879920891e-05, + "loss": 0.0064, + "step": 311050 + }, + { + "epoch": 1.57, + "learning_rate": 6.459934110619491e-05, + "loss": 0.0075, + "step": 311060 + }, + { + "epoch": 1.57, + "learning_rate": 6.45917734131809e-05, + "loss": 0.0049, + "step": 311070 + }, + { + "epoch": 1.57, + "learning_rate": 6.458420572016688e-05, + "loss": 0.0071, + "step": 311080 + }, + { + "epoch": 1.57, + "learning_rate": 6.457663802715288e-05, + "loss": 0.0084, + "step": 311090 + }, + { + "epoch": 1.57, + "learning_rate": 6.456907033413886e-05, + "loss": 0.0062, + "step": 311100 + }, + { + "epoch": 1.57, + "learning_rate": 6.456150264112486e-05, + "loss": 0.0065, + "step": 311110 + }, + { + "epoch": 1.57, + "learning_rate": 6.455393494811085e-05, + "loss": 0.0064, + "step": 311120 + }, + { + "epoch": 1.57, + "learning_rate": 6.454636725509683e-05, + "loss": 0.0056, + "step": 311130 + }, + { + "epoch": 1.57, + "learning_rate": 6.453879956208283e-05, + "loss": 0.0076, + "step": 311140 + }, + { + "epoch": 1.57, + "learning_rate": 6.453123186906882e-05, + "loss": 0.0056, + "step": 311150 + }, + { + "epoch": 1.57, + "learning_rate": 6.45236641760548e-05, + "loss": 0.0082, + "step": 311160 + }, + { + "epoch": 1.57, + "learning_rate": 6.45160964830408e-05, + "loss": 0.0076, + "step": 311170 + }, + { + "epoch": 1.57, + "learning_rate": 6.450852879002678e-05, + "loss": 0.009, + "step": 311180 + }, + { + "epoch": 1.57, + "learning_rate": 6.450096109701278e-05, + "loss": 0.0083, + "step": 311190 + }, + { + "epoch": 1.57, + "learning_rate": 6.449339340399877e-05, + "loss": 0.0094, + "step": 311200 + }, + { + "epoch": 1.57, + "learning_rate": 6.448582571098475e-05, + "loss": 0.0058, + "step": 311210 + }, + { + "epoch": 1.57, + "learning_rate": 6.447825801797075e-05, + "loss": 0.0053, + "step": 311220 + }, + { + "epoch": 1.57, + "learning_rate": 6.447069032495674e-05, + "loss": 0.0088, + "step": 311230 + }, + { + "epoch": 1.57, + "learning_rate": 6.446312263194272e-05, + "loss": 0.0074, + "step": 311240 + }, + { + "epoch": 1.57, + "learning_rate": 6.44555549389287e-05, + "loss": 0.0051, + "step": 311250 + }, + { + "epoch": 1.57, + "learning_rate": 6.44479872459147e-05, + "loss": 0.0056, + "step": 311260 + }, + { + "epoch": 1.57, + "learning_rate": 6.44404195529007e-05, + "loss": 0.0059, + "step": 311270 + }, + { + "epoch": 1.57, + "learning_rate": 6.443285185988668e-05, + "loss": 0.0093, + "step": 311280 + }, + { + "epoch": 1.57, + "learning_rate": 6.442528416687267e-05, + "loss": 0.0091, + "step": 311290 + }, + { + "epoch": 1.57, + "learning_rate": 6.441771647385865e-05, + "loss": 0.0074, + "step": 311300 + }, + { + "epoch": 1.57, + "learning_rate": 6.441014878084465e-05, + "loss": 0.0075, + "step": 311310 + }, + { + "epoch": 1.57, + "learning_rate": 6.440258108783064e-05, + "loss": 0.0086, + "step": 311320 + }, + { + "epoch": 1.57, + "learning_rate": 6.439501339481662e-05, + "loss": 0.0055, + "step": 311330 + }, + { + "epoch": 1.57, + "learning_rate": 6.438744570180262e-05, + "loss": 0.0061, + "step": 311340 + }, + { + "epoch": 1.57, + "learning_rate": 6.437987800878861e-05, + "loss": 0.0097, + "step": 311350 + }, + { + "epoch": 1.57, + "learning_rate": 6.43723103157746e-05, + "loss": 0.0076, + "step": 311360 + }, + { + "epoch": 1.57, + "learning_rate": 6.436474262276059e-05, + "loss": 0.0057, + "step": 311370 + }, + { + "epoch": 1.57, + "learning_rate": 6.435717492974657e-05, + "loss": 0.0064, + "step": 311380 + }, + { + "epoch": 1.57, + "learning_rate": 6.434960723673257e-05, + "loss": 0.0076, + "step": 311390 + }, + { + "epoch": 1.57, + "learning_rate": 6.434203954371856e-05, + "loss": 0.009, + "step": 311400 + }, + { + "epoch": 1.57, + "learning_rate": 6.433447185070454e-05, + "loss": 0.0062, + "step": 311410 + }, + { + "epoch": 1.57, + "learning_rate": 6.432690415769054e-05, + "loss": 0.0073, + "step": 311420 + }, + { + "epoch": 1.57, + "learning_rate": 6.431933646467653e-05, + "loss": 0.0062, + "step": 311430 + }, + { + "epoch": 1.57, + "learning_rate": 6.431176877166251e-05, + "loss": 0.0061, + "step": 311440 + }, + { + "epoch": 1.57, + "learning_rate": 6.430420107864851e-05, + "loss": 0.009, + "step": 311450 + }, + { + "epoch": 1.57, + "learning_rate": 6.429663338563449e-05, + "loss": 0.0048, + "step": 311460 + }, + { + "epoch": 1.57, + "learning_rate": 6.428906569262049e-05, + "loss": 0.006, + "step": 311470 + }, + { + "epoch": 1.57, + "learning_rate": 6.428149799960648e-05, + "loss": 0.0069, + "step": 311480 + }, + { + "epoch": 1.57, + "learning_rate": 6.427393030659246e-05, + "loss": 0.0058, + "step": 311490 + }, + { + "epoch": 1.57, + "learning_rate": 6.426636261357846e-05, + "loss": 0.0084, + "step": 311500 + }, + { + "epoch": 1.57, + "learning_rate": 6.425879492056445e-05, + "loss": 0.0074, + "step": 311510 + }, + { + "epoch": 1.57, + "learning_rate": 6.425122722755043e-05, + "loss": 0.0065, + "step": 311520 + }, + { + "epoch": 1.57, + "learning_rate": 6.424365953453643e-05, + "loss": 0.0047, + "step": 311530 + }, + { + "epoch": 1.57, + "learning_rate": 6.423609184152241e-05, + "loss": 0.0063, + "step": 311540 + }, + { + "epoch": 1.57, + "learning_rate": 6.42285241485084e-05, + "loss": 0.0058, + "step": 311550 + }, + { + "epoch": 1.57, + "learning_rate": 6.422095645549439e-05, + "loss": 0.0083, + "step": 311560 + }, + { + "epoch": 1.57, + "learning_rate": 6.421338876248038e-05, + "loss": 0.0067, + "step": 311570 + }, + { + "epoch": 1.57, + "learning_rate": 6.420582106946636e-05, + "loss": 0.0072, + "step": 311580 + }, + { + "epoch": 1.57, + "learning_rate": 6.419825337645236e-05, + "loss": 0.0071, + "step": 311590 + }, + { + "epoch": 1.57, + "learning_rate": 6.419068568343835e-05, + "loss": 0.0052, + "step": 311600 + }, + { + "epoch": 1.57, + "learning_rate": 6.418311799042433e-05, + "loss": 0.009, + "step": 311610 + }, + { + "epoch": 1.57, + "learning_rate": 6.417555029741033e-05, + "loss": 0.0065, + "step": 311620 + }, + { + "epoch": 1.57, + "learning_rate": 6.416798260439631e-05, + "loss": 0.0084, + "step": 311630 + }, + { + "epoch": 1.57, + "learning_rate": 6.41604149113823e-05, + "loss": 0.006, + "step": 311640 + }, + { + "epoch": 1.57, + "learning_rate": 6.41528472183683e-05, + "loss": 0.0054, + "step": 311650 + }, + { + "epoch": 1.57, + "learning_rate": 6.414527952535428e-05, + "loss": 0.0065, + "step": 311660 + }, + { + "epoch": 1.57, + "learning_rate": 6.413771183234028e-05, + "loss": 0.0051, + "step": 311670 + }, + { + "epoch": 1.57, + "learning_rate": 6.413014413932627e-05, + "loss": 0.0064, + "step": 311680 + }, + { + "epoch": 1.57, + "learning_rate": 6.412257644631225e-05, + "loss": 0.0071, + "step": 311690 + }, + { + "epoch": 1.57, + "learning_rate": 6.411500875329825e-05, + "loss": 0.0074, + "step": 311700 + }, + { + "epoch": 1.57, + "learning_rate": 6.410744106028423e-05, + "loss": 0.0068, + "step": 311710 + }, + { + "epoch": 1.57, + "learning_rate": 6.409987336727023e-05, + "loss": 0.0068, + "step": 311720 + }, + { + "epoch": 1.57, + "learning_rate": 6.409230567425622e-05, + "loss": 0.0096, + "step": 311730 + }, + { + "epoch": 1.57, + "learning_rate": 6.40847379812422e-05, + "loss": 0.0062, + "step": 311740 + }, + { + "epoch": 1.57, + "learning_rate": 6.40771702882282e-05, + "loss": 0.0053, + "step": 311750 + }, + { + "epoch": 1.57, + "learning_rate": 6.406960259521419e-05, + "loss": 0.0085, + "step": 311760 + }, + { + "epoch": 1.57, + "learning_rate": 6.406203490220017e-05, + "loss": 0.0086, + "step": 311770 + }, + { + "epoch": 1.57, + "learning_rate": 6.405446720918617e-05, + "loss": 0.0075, + "step": 311780 + }, + { + "epoch": 1.57, + "learning_rate": 6.404689951617216e-05, + "loss": 0.0074, + "step": 311790 + }, + { + "epoch": 1.57, + "learning_rate": 6.403933182315814e-05, + "loss": 0.0072, + "step": 311800 + }, + { + "epoch": 1.57, + "learning_rate": 6.403176413014414e-05, + "loss": 0.0057, + "step": 311810 + }, + { + "epoch": 1.57, + "learning_rate": 6.402419643713012e-05, + "loss": 0.0071, + "step": 311820 + }, + { + "epoch": 1.57, + "learning_rate": 6.401662874411612e-05, + "loss": 0.0059, + "step": 311830 + }, + { + "epoch": 1.57, + "learning_rate": 6.400906105110211e-05, + "loss": 0.0096, + "step": 311840 + }, + { + "epoch": 1.57, + "learning_rate": 6.400149335808809e-05, + "loss": 0.0076, + "step": 311850 + }, + { + "epoch": 1.57, + "learning_rate": 6.399392566507409e-05, + "loss": 0.0061, + "step": 311860 + }, + { + "epoch": 1.57, + "learning_rate": 6.398635797206007e-05, + "loss": 0.0072, + "step": 311870 + }, + { + "epoch": 1.57, + "learning_rate": 6.397879027904606e-05, + "loss": 0.006, + "step": 311880 + }, + { + "epoch": 1.57, + "learning_rate": 6.397122258603205e-05, + "loss": 0.0079, + "step": 311890 + }, + { + "epoch": 1.57, + "learning_rate": 6.396365489301804e-05, + "loss": 0.0074, + "step": 311900 + }, + { + "epoch": 1.57, + "learning_rate": 6.395608720000402e-05, + "loss": 0.0141, + "step": 311910 + }, + { + "epoch": 1.57, + "learning_rate": 6.394851950699002e-05, + "loss": 0.0067, + "step": 311920 + }, + { + "epoch": 1.57, + "learning_rate": 6.394095181397601e-05, + "loss": 0.0048, + "step": 311930 + }, + { + "epoch": 1.57, + "learning_rate": 6.3933384120962e-05, + "loss": 0.0065, + "step": 311940 + }, + { + "epoch": 1.57, + "learning_rate": 6.392581642794799e-05, + "loss": 0.0063, + "step": 311950 + }, + { + "epoch": 1.57, + "learning_rate": 6.391824873493398e-05, + "loss": 0.009, + "step": 311960 + }, + { + "epoch": 1.57, + "learning_rate": 6.391068104191996e-05, + "loss": 0.0116, + "step": 311970 + }, + { + "epoch": 1.57, + "learning_rate": 6.390311334890596e-05, + "loss": 0.0053, + "step": 311980 + }, + { + "epoch": 1.57, + "learning_rate": 6.389554565589194e-05, + "loss": 0.0093, + "step": 311990 + }, + { + "epoch": 1.57, + "learning_rate": 6.388797796287794e-05, + "loss": 0.0116, + "step": 312000 + }, + { + "epoch": 1.57, + "eval_cer": 0.914462492734159, + "eval_loss": 0.005281941965222359, + "eval_runtime": 116.1751, + "eval_samples_per_second": 17.215, + "eval_steps_per_second": 4.304, + "step": 312000 + }, + { + "epoch": 1.57, + "learning_rate": 6.388041026986393e-05, + "loss": 0.0074, + "step": 312010 + }, + { + "epoch": 1.57, + "learning_rate": 6.387284257684991e-05, + "loss": 0.0085, + "step": 312020 + }, + { + "epoch": 1.57, + "learning_rate": 6.386527488383591e-05, + "loss": 0.0098, + "step": 312030 + }, + { + "epoch": 1.57, + "learning_rate": 6.38577071908219e-05, + "loss": 0.0057, + "step": 312040 + }, + { + "epoch": 1.57, + "learning_rate": 6.385013949780788e-05, + "loss": 0.0077, + "step": 312050 + }, + { + "epoch": 1.57, + "learning_rate": 6.384257180479388e-05, + "loss": 0.0076, + "step": 312060 + }, + { + "epoch": 1.57, + "learning_rate": 6.383500411177986e-05, + "loss": 0.0061, + "step": 312070 + }, + { + "epoch": 1.57, + "learning_rate": 6.382743641876586e-05, + "loss": 0.0083, + "step": 312080 + }, + { + "epoch": 1.57, + "learning_rate": 6.381986872575185e-05, + "loss": 0.0068, + "step": 312090 + }, + { + "epoch": 1.57, + "learning_rate": 6.381230103273783e-05, + "loss": 0.0113, + "step": 312100 + }, + { + "epoch": 1.57, + "learning_rate": 6.380473333972383e-05, + "loss": 0.0067, + "step": 312110 + }, + { + "epoch": 1.57, + "learning_rate": 6.379716564670982e-05, + "loss": 0.0053, + "step": 312120 + }, + { + "epoch": 1.57, + "learning_rate": 6.37895979536958e-05, + "loss": 0.0075, + "step": 312130 + }, + { + "epoch": 1.57, + "learning_rate": 6.37820302606818e-05, + "loss": 0.0063, + "step": 312140 + }, + { + "epoch": 1.57, + "learning_rate": 6.377446256766778e-05, + "loss": 0.0078, + "step": 312150 + }, + { + "epoch": 1.57, + "learning_rate": 6.376689487465377e-05, + "loss": 0.0063, + "step": 312160 + }, + { + "epoch": 1.57, + "learning_rate": 6.375932718163977e-05, + "loss": 0.0066, + "step": 312170 + }, + { + "epoch": 1.57, + "learning_rate": 6.375175948862575e-05, + "loss": 0.0091, + "step": 312180 + }, + { + "epoch": 1.58, + "learning_rate": 6.374419179561173e-05, + "loss": 0.0051, + "step": 312190 + }, + { + "epoch": 1.58, + "learning_rate": 6.373662410259773e-05, + "loss": 0.0053, + "step": 312200 + }, + { + "epoch": 1.58, + "learning_rate": 6.372905640958372e-05, + "loss": 0.0057, + "step": 312210 + }, + { + "epoch": 1.58, + "learning_rate": 6.37214887165697e-05, + "loss": 0.0068, + "step": 312220 + }, + { + "epoch": 1.58, + "learning_rate": 6.37139210235557e-05, + "loss": 0.0069, + "step": 312230 + }, + { + "epoch": 1.58, + "learning_rate": 6.37063533305417e-05, + "loss": 0.0058, + "step": 312240 + }, + { + "epoch": 1.58, + "learning_rate": 6.369878563752768e-05, + "loss": 0.0069, + "step": 312250 + }, + { + "epoch": 1.58, + "learning_rate": 6.369121794451367e-05, + "loss": 0.0083, + "step": 312260 + }, + { + "epoch": 1.58, + "learning_rate": 6.368365025149965e-05, + "loss": 0.0057, + "step": 312270 + }, + { + "epoch": 1.58, + "learning_rate": 6.367608255848565e-05, + "loss": 0.0076, + "step": 312280 + }, + { + "epoch": 1.58, + "learning_rate": 6.366851486547164e-05, + "loss": 0.0061, + "step": 312290 + }, + { + "epoch": 1.58, + "learning_rate": 6.366094717245762e-05, + "loss": 0.0067, + "step": 312300 + }, + { + "epoch": 1.58, + "learning_rate": 6.365337947944362e-05, + "loss": 0.0096, + "step": 312310 + }, + { + "epoch": 1.58, + "learning_rate": 6.364581178642961e-05, + "loss": 0.007, + "step": 312320 + }, + { + "epoch": 1.58, + "learning_rate": 6.36382440934156e-05, + "loss": 0.0074, + "step": 312330 + }, + { + "epoch": 1.58, + "learning_rate": 6.363067640040159e-05, + "loss": 0.0059, + "step": 312340 + }, + { + "epoch": 1.58, + "learning_rate": 6.362310870738757e-05, + "loss": 0.0072, + "step": 312350 + }, + { + "epoch": 1.58, + "learning_rate": 6.361554101437357e-05, + "loss": 0.0058, + "step": 312360 + }, + { + "epoch": 1.58, + "learning_rate": 6.360797332135956e-05, + "loss": 0.0071, + "step": 312370 + }, + { + "epoch": 1.58, + "learning_rate": 6.360040562834554e-05, + "loss": 0.0079, + "step": 312380 + }, + { + "epoch": 1.58, + "learning_rate": 6.359283793533154e-05, + "loss": 0.0066, + "step": 312390 + }, + { + "epoch": 1.58, + "learning_rate": 6.358527024231753e-05, + "loss": 0.0072, + "step": 312400 + }, + { + "epoch": 1.58, + "learning_rate": 6.357770254930351e-05, + "loss": 0.0055, + "step": 312410 + }, + { + "epoch": 1.58, + "learning_rate": 6.357013485628951e-05, + "loss": 0.0116, + "step": 312420 + }, + { + "epoch": 1.58, + "learning_rate": 6.356256716327549e-05, + "loss": 0.0061, + "step": 312430 + }, + { + "epoch": 1.58, + "learning_rate": 6.355499947026149e-05, + "loss": 0.0059, + "step": 312440 + }, + { + "epoch": 1.58, + "learning_rate": 6.354743177724748e-05, + "loss": 0.0065, + "step": 312450 + }, + { + "epoch": 1.58, + "learning_rate": 6.353986408423346e-05, + "loss": 0.0078, + "step": 312460 + }, + { + "epoch": 1.58, + "learning_rate": 6.353229639121946e-05, + "loss": 0.0099, + "step": 312470 + }, + { + "epoch": 1.58, + "learning_rate": 6.352472869820545e-05, + "loss": 0.0075, + "step": 312480 + }, + { + "epoch": 1.58, + "learning_rate": 6.351716100519143e-05, + "loss": 0.0071, + "step": 312490 + }, + { + "epoch": 1.58, + "learning_rate": 6.350959331217741e-05, + "loss": 0.0069, + "step": 312500 + }, + { + "epoch": 1.58, + "learning_rate": 6.350202561916341e-05, + "loss": 0.0078, + "step": 312510 + }, + { + "epoch": 1.58, + "learning_rate": 6.349445792614939e-05, + "loss": 0.0062, + "step": 312520 + }, + { + "epoch": 1.58, + "learning_rate": 6.348689023313539e-05, + "loss": 0.007, + "step": 312530 + }, + { + "epoch": 1.58, + "learning_rate": 6.347932254012138e-05, + "loss": 0.0062, + "step": 312540 + }, + { + "epoch": 1.58, + "learning_rate": 6.347175484710736e-05, + "loss": 0.0061, + "step": 312550 + }, + { + "epoch": 1.58, + "learning_rate": 6.346418715409336e-05, + "loss": 0.0057, + "step": 312560 + }, + { + "epoch": 1.58, + "learning_rate": 6.345661946107935e-05, + "loss": 0.0063, + "step": 312570 + }, + { + "epoch": 1.58, + "learning_rate": 6.344905176806533e-05, + "loss": 0.0075, + "step": 312580 + }, + { + "epoch": 1.58, + "learning_rate": 6.344148407505133e-05, + "loss": 0.0084, + "step": 312590 + }, + { + "epoch": 1.58, + "learning_rate": 6.343391638203731e-05, + "loss": 0.007, + "step": 312600 + }, + { + "epoch": 1.58, + "learning_rate": 6.34263486890233e-05, + "loss": 0.0091, + "step": 312610 + }, + { + "epoch": 1.58, + "learning_rate": 6.34187809960093e-05, + "loss": 0.0091, + "step": 312620 + }, + { + "epoch": 1.58, + "learning_rate": 6.341121330299528e-05, + "loss": 0.0078, + "step": 312630 + }, + { + "epoch": 1.58, + "learning_rate": 6.340364560998128e-05, + "loss": 0.0065, + "step": 312640 + }, + { + "epoch": 1.58, + "learning_rate": 6.339607791696727e-05, + "loss": 0.0074, + "step": 312650 + }, + { + "epoch": 1.58, + "learning_rate": 6.338851022395325e-05, + "loss": 0.0062, + "step": 312660 + }, + { + "epoch": 1.58, + "learning_rate": 6.338094253093925e-05, + "loss": 0.0091, + "step": 312670 + }, + { + "epoch": 1.58, + "learning_rate": 6.337337483792523e-05, + "loss": 0.0055, + "step": 312680 + }, + { + "epoch": 1.58, + "learning_rate": 6.336580714491122e-05, + "loss": 0.0082, + "step": 312690 + }, + { + "epoch": 1.58, + "learning_rate": 6.335823945189722e-05, + "loss": 0.0072, + "step": 312700 + }, + { + "epoch": 1.58, + "learning_rate": 6.33506717588832e-05, + "loss": 0.0069, + "step": 312710 + }, + { + "epoch": 1.58, + "learning_rate": 6.33431040658692e-05, + "loss": 0.0067, + "step": 312720 + }, + { + "epoch": 1.58, + "learning_rate": 6.333553637285519e-05, + "loss": 0.0057, + "step": 312730 + }, + { + "epoch": 1.58, + "learning_rate": 6.332796867984117e-05, + "loss": 0.0067, + "step": 312740 + }, + { + "epoch": 1.58, + "learning_rate": 6.332040098682717e-05, + "loss": 0.0058, + "step": 312750 + }, + { + "epoch": 1.58, + "learning_rate": 6.331283329381316e-05, + "loss": 0.0074, + "step": 312760 + }, + { + "epoch": 1.58, + "learning_rate": 6.330526560079914e-05, + "loss": 0.0092, + "step": 312770 + }, + { + "epoch": 1.58, + "learning_rate": 6.329769790778514e-05, + "loss": 0.0074, + "step": 312780 + }, + { + "epoch": 1.58, + "learning_rate": 6.329013021477112e-05, + "loss": 0.0072, + "step": 312790 + }, + { + "epoch": 1.58, + "learning_rate": 6.328256252175712e-05, + "loss": 0.0074, + "step": 312800 + }, + { + "epoch": 1.58, + "learning_rate": 6.32749948287431e-05, + "loss": 0.0109, + "step": 312810 + }, + { + "epoch": 1.58, + "learning_rate": 6.326742713572909e-05, + "loss": 0.0049, + "step": 312820 + }, + { + "epoch": 1.58, + "learning_rate": 6.325985944271507e-05, + "loss": 0.0059, + "step": 312830 + }, + { + "epoch": 1.58, + "learning_rate": 6.325229174970107e-05, + "loss": 0.0071, + "step": 312840 + }, + { + "epoch": 1.58, + "learning_rate": 6.324472405668706e-05, + "loss": 0.0057, + "step": 312850 + }, + { + "epoch": 1.58, + "learning_rate": 6.323715636367304e-05, + "loss": 0.0076, + "step": 312860 + }, + { + "epoch": 1.58, + "learning_rate": 6.322958867065904e-05, + "loss": 0.0063, + "step": 312870 + }, + { + "epoch": 1.58, + "learning_rate": 6.322202097764502e-05, + "loss": 0.0085, + "step": 312880 + }, + { + "epoch": 1.58, + "learning_rate": 6.321445328463102e-05, + "loss": 0.0087, + "step": 312890 + }, + { + "epoch": 1.58, + "learning_rate": 6.320688559161701e-05, + "loss": 0.0072, + "step": 312900 + }, + { + "epoch": 1.58, + "learning_rate": 6.319931789860299e-05, + "loss": 0.0064, + "step": 312910 + }, + { + "epoch": 1.58, + "learning_rate": 6.319175020558899e-05, + "loss": 0.007, + "step": 312920 + }, + { + "epoch": 1.58, + "learning_rate": 6.318418251257498e-05, + "loss": 0.0057, + "step": 312930 + }, + { + "epoch": 1.58, + "learning_rate": 6.317661481956096e-05, + "loss": 0.0083, + "step": 312940 + }, + { + "epoch": 1.58, + "learning_rate": 6.316904712654696e-05, + "loss": 0.0072, + "step": 312950 + }, + { + "epoch": 1.58, + "learning_rate": 6.316147943353294e-05, + "loss": 0.0083, + "step": 312960 + }, + { + "epoch": 1.58, + "learning_rate": 6.315391174051894e-05, + "loss": 0.0072, + "step": 312970 + }, + { + "epoch": 1.58, + "learning_rate": 6.314634404750493e-05, + "loss": 0.007, + "step": 312980 + }, + { + "epoch": 1.58, + "learning_rate": 6.313877635449091e-05, + "loss": 0.0075, + "step": 312990 + }, + { + "epoch": 1.58, + "learning_rate": 6.313120866147691e-05, + "loss": 0.0064, + "step": 313000 + }, + { + "epoch": 1.58, + "eval_cer": 0.914438232831024, + "eval_loss": 0.005189271178096533, + "eval_runtime": 116.2305, + "eval_samples_per_second": 17.207, + "eval_steps_per_second": 4.302, + "step": 313000 + }, + { + "epoch": 1.58, + "learning_rate": 6.31236409684629e-05, + "loss": 0.0081, + "step": 313010 + }, + { + "epoch": 1.58, + "learning_rate": 6.311607327544888e-05, + "loss": 0.008, + "step": 313020 + }, + { + "epoch": 1.58, + "learning_rate": 6.310850558243488e-05, + "loss": 0.0079, + "step": 313030 + }, + { + "epoch": 1.58, + "learning_rate": 6.310093788942086e-05, + "loss": 0.0079, + "step": 313040 + }, + { + "epoch": 1.58, + "learning_rate": 6.309337019640685e-05, + "loss": 0.006, + "step": 313050 + }, + { + "epoch": 1.58, + "learning_rate": 6.308580250339285e-05, + "loss": 0.0071, + "step": 313060 + }, + { + "epoch": 1.58, + "learning_rate": 6.307823481037883e-05, + "loss": 0.0065, + "step": 313070 + }, + { + "epoch": 1.58, + "learning_rate": 6.307066711736483e-05, + "loss": 0.0082, + "step": 313080 + }, + { + "epoch": 1.58, + "learning_rate": 6.306309942435082e-05, + "loss": 0.0056, + "step": 313090 + }, + { + "epoch": 1.58, + "learning_rate": 6.30555317313368e-05, + "loss": 0.0062, + "step": 313100 + }, + { + "epoch": 1.58, + "learning_rate": 6.30479640383228e-05, + "loss": 0.0075, + "step": 313110 + }, + { + "epoch": 1.58, + "learning_rate": 6.304039634530878e-05, + "loss": 0.0068, + "step": 313120 + }, + { + "epoch": 1.58, + "learning_rate": 6.303282865229476e-05, + "loss": 0.0097, + "step": 313130 + }, + { + "epoch": 1.58, + "learning_rate": 6.302526095928076e-05, + "loss": 0.0082, + "step": 313140 + }, + { + "epoch": 1.58, + "learning_rate": 6.301769326626675e-05, + "loss": 0.0066, + "step": 313150 + }, + { + "epoch": 1.58, + "learning_rate": 6.301012557325273e-05, + "loss": 0.0063, + "step": 313160 + }, + { + "epoch": 1.58, + "learning_rate": 6.300255788023873e-05, + "loss": 0.0052, + "step": 313170 + }, + { + "epoch": 1.58, + "learning_rate": 6.299499018722472e-05, + "loss": 0.0084, + "step": 313180 + }, + { + "epoch": 1.58, + "learning_rate": 6.29874224942107e-05, + "loss": 0.0069, + "step": 313190 + }, + { + "epoch": 1.58, + "learning_rate": 6.29798548011967e-05, + "loss": 0.006, + "step": 313200 + }, + { + "epoch": 1.58, + "learning_rate": 6.29722871081827e-05, + "loss": 0.0059, + "step": 313210 + }, + { + "epoch": 1.58, + "learning_rate": 6.296471941516867e-05, + "loss": 0.0078, + "step": 313220 + }, + { + "epoch": 1.58, + "learning_rate": 6.295715172215467e-05, + "loss": 0.0079, + "step": 313230 + }, + { + "epoch": 1.58, + "learning_rate": 6.294958402914065e-05, + "loss": 0.0084, + "step": 313240 + }, + { + "epoch": 1.58, + "learning_rate": 6.294201633612665e-05, + "loss": 0.005, + "step": 313250 + }, + { + "epoch": 1.58, + "learning_rate": 6.293444864311264e-05, + "loss": 0.0064, + "step": 313260 + }, + { + "epoch": 1.58, + "learning_rate": 6.292688095009862e-05, + "loss": 0.0063, + "step": 313270 + }, + { + "epoch": 1.58, + "learning_rate": 6.291931325708462e-05, + "loss": 0.0055, + "step": 313280 + }, + { + "epoch": 1.58, + "learning_rate": 6.291174556407061e-05, + "loss": 0.0051, + "step": 313290 + }, + { + "epoch": 1.58, + "learning_rate": 6.29041778710566e-05, + "loss": 0.0096, + "step": 313300 + }, + { + "epoch": 1.58, + "learning_rate": 6.289661017804259e-05, + "loss": 0.0071, + "step": 313310 + }, + { + "epoch": 1.58, + "learning_rate": 6.288904248502857e-05, + "loss": 0.007, + "step": 313320 + }, + { + "epoch": 1.58, + "learning_rate": 6.288147479201457e-05, + "loss": 0.006, + "step": 313330 + }, + { + "epoch": 1.58, + "learning_rate": 6.287390709900056e-05, + "loss": 0.0093, + "step": 313340 + }, + { + "epoch": 1.58, + "learning_rate": 6.286633940598654e-05, + "loss": 0.0055, + "step": 313350 + }, + { + "epoch": 1.58, + "learning_rate": 6.285877171297254e-05, + "loss": 0.0064, + "step": 313360 + }, + { + "epoch": 1.58, + "learning_rate": 6.285120401995853e-05, + "loss": 0.0061, + "step": 313370 + }, + { + "epoch": 1.58, + "learning_rate": 6.284363632694451e-05, + "loss": 0.0057, + "step": 313380 + }, + { + "epoch": 1.58, + "learning_rate": 6.283606863393051e-05, + "loss": 0.0065, + "step": 313390 + }, + { + "epoch": 1.58, + "learning_rate": 6.282850094091649e-05, + "loss": 0.0065, + "step": 313400 + }, + { + "epoch": 1.58, + "learning_rate": 6.282093324790249e-05, + "loss": 0.006, + "step": 313410 + }, + { + "epoch": 1.58, + "learning_rate": 6.281336555488848e-05, + "loss": 0.0071, + "step": 313420 + }, + { + "epoch": 1.58, + "learning_rate": 6.280579786187446e-05, + "loss": 0.0079, + "step": 313430 + }, + { + "epoch": 1.58, + "learning_rate": 6.279823016886044e-05, + "loss": 0.0054, + "step": 313440 + }, + { + "epoch": 1.58, + "learning_rate": 6.279066247584644e-05, + "loss": 0.0086, + "step": 313450 + }, + { + "epoch": 1.58, + "learning_rate": 6.278309478283243e-05, + "loss": 0.0073, + "step": 313460 + }, + { + "epoch": 1.58, + "learning_rate": 6.277552708981841e-05, + "loss": 0.0057, + "step": 313470 + }, + { + "epoch": 1.58, + "learning_rate": 6.276795939680441e-05, + "loss": 0.0092, + "step": 313480 + }, + { + "epoch": 1.58, + "learning_rate": 6.276039170379039e-05, + "loss": 0.0064, + "step": 313490 + }, + { + "epoch": 1.58, + "learning_rate": 6.275282401077639e-05, + "loss": 0.0063, + "step": 313500 + }, + { + "epoch": 1.58, + "learning_rate": 6.274525631776238e-05, + "loss": 0.0059, + "step": 313510 + }, + { + "epoch": 1.58, + "learning_rate": 6.273768862474836e-05, + "loss": 0.0059, + "step": 313520 + }, + { + "epoch": 1.58, + "learning_rate": 6.273012093173436e-05, + "loss": 0.01, + "step": 313530 + }, + { + "epoch": 1.58, + "learning_rate": 6.272255323872035e-05, + "loss": 0.0077, + "step": 313540 + }, + { + "epoch": 1.58, + "learning_rate": 6.271498554570633e-05, + "loss": 0.0061, + "step": 313550 + }, + { + "epoch": 1.58, + "learning_rate": 6.270741785269233e-05, + "loss": 0.0055, + "step": 313560 + }, + { + "epoch": 1.58, + "learning_rate": 6.269985015967831e-05, + "loss": 0.0097, + "step": 313570 + }, + { + "epoch": 1.58, + "learning_rate": 6.26922824666643e-05, + "loss": 0.0067, + "step": 313580 + }, + { + "epoch": 1.58, + "learning_rate": 6.26847147736503e-05, + "loss": 0.0078, + "step": 313590 + }, + { + "epoch": 1.58, + "learning_rate": 6.267714708063628e-05, + "loss": 0.0096, + "step": 313600 + }, + { + "epoch": 1.58, + "learning_rate": 6.266957938762228e-05, + "loss": 0.0053, + "step": 313610 + }, + { + "epoch": 1.58, + "learning_rate": 6.266201169460827e-05, + "loss": 0.0077, + "step": 313620 + }, + { + "epoch": 1.58, + "learning_rate": 6.265444400159425e-05, + "loss": 0.0075, + "step": 313630 + }, + { + "epoch": 1.58, + "learning_rate": 6.264687630858025e-05, + "loss": 0.0069, + "step": 313640 + }, + { + "epoch": 1.58, + "learning_rate": 6.263930861556623e-05, + "loss": 0.0069, + "step": 313650 + }, + { + "epoch": 1.58, + "learning_rate": 6.263174092255222e-05, + "loss": 0.0054, + "step": 313660 + }, + { + "epoch": 1.58, + "learning_rate": 6.262417322953822e-05, + "loss": 0.0074, + "step": 313670 + }, + { + "epoch": 1.58, + "learning_rate": 6.26166055365242e-05, + "loss": 0.005, + "step": 313680 + }, + { + "epoch": 1.58, + "learning_rate": 6.26090378435102e-05, + "loss": 0.0053, + "step": 313690 + }, + { + "epoch": 1.58, + "learning_rate": 6.260147015049619e-05, + "loss": 0.0051, + "step": 313700 + }, + { + "epoch": 1.58, + "learning_rate": 6.259390245748217e-05, + "loss": 0.0068, + "step": 313710 + }, + { + "epoch": 1.58, + "learning_rate": 6.258633476446817e-05, + "loss": 0.0058, + "step": 313720 + }, + { + "epoch": 1.58, + "learning_rate": 6.257876707145416e-05, + "loss": 0.0069, + "step": 313730 + }, + { + "epoch": 1.58, + "learning_rate": 6.257119937844014e-05, + "loss": 0.0061, + "step": 313740 + }, + { + "epoch": 1.58, + "learning_rate": 6.256363168542614e-05, + "loss": 0.0087, + "step": 313750 + }, + { + "epoch": 1.58, + "learning_rate": 6.255606399241212e-05, + "loss": 0.0069, + "step": 313760 + }, + { + "epoch": 1.58, + "learning_rate": 6.25484962993981e-05, + "loss": 0.0055, + "step": 313770 + }, + { + "epoch": 1.58, + "learning_rate": 6.25409286063841e-05, + "loss": 0.0074, + "step": 313780 + }, + { + "epoch": 1.58, + "learning_rate": 6.253336091337009e-05, + "loss": 0.008, + "step": 313790 + }, + { + "epoch": 1.58, + "learning_rate": 6.252579322035607e-05, + "loss": 0.0065, + "step": 313800 + }, + { + "epoch": 1.58, + "learning_rate": 6.251822552734207e-05, + "loss": 0.0059, + "step": 313810 + }, + { + "epoch": 1.58, + "learning_rate": 6.251065783432806e-05, + "loss": 0.0073, + "step": 313820 + }, + { + "epoch": 1.58, + "learning_rate": 6.250309014131404e-05, + "loss": 0.0069, + "step": 313830 + }, + { + "epoch": 1.58, + "learning_rate": 6.249552244830004e-05, + "loss": 0.0077, + "step": 313840 + }, + { + "epoch": 1.58, + "learning_rate": 6.248795475528602e-05, + "loss": 0.0075, + "step": 313850 + }, + { + "epoch": 1.58, + "learning_rate": 6.248038706227202e-05, + "loss": 0.0089, + "step": 313860 + }, + { + "epoch": 1.58, + "learning_rate": 6.247281936925801e-05, + "loss": 0.006, + "step": 313870 + }, + { + "epoch": 1.58, + "learning_rate": 6.246525167624399e-05, + "loss": 0.0064, + "step": 313880 + }, + { + "epoch": 1.58, + "learning_rate": 6.245768398322999e-05, + "loss": 0.0064, + "step": 313890 + }, + { + "epoch": 1.58, + "learning_rate": 6.245011629021598e-05, + "loss": 0.0062, + "step": 313900 + }, + { + "epoch": 1.58, + "learning_rate": 6.244254859720196e-05, + "loss": 0.0072, + "step": 313910 + }, + { + "epoch": 1.58, + "learning_rate": 6.243498090418796e-05, + "loss": 0.0105, + "step": 313920 + }, + { + "epoch": 1.58, + "learning_rate": 6.242741321117394e-05, + "loss": 0.0067, + "step": 313930 + }, + { + "epoch": 1.58, + "learning_rate": 6.241984551815994e-05, + "loss": 0.007, + "step": 313940 + }, + { + "epoch": 1.58, + "learning_rate": 6.241227782514593e-05, + "loss": 0.0062, + "step": 313950 + }, + { + "epoch": 1.58, + "learning_rate": 6.240471013213191e-05, + "loss": 0.008, + "step": 313960 + }, + { + "epoch": 1.58, + "learning_rate": 6.23971424391179e-05, + "loss": 0.0068, + "step": 313970 + }, + { + "epoch": 1.58, + "learning_rate": 6.23895747461039e-05, + "loss": 0.0085, + "step": 313980 + }, + { + "epoch": 1.58, + "learning_rate": 6.238200705308988e-05, + "loss": 0.0067, + "step": 313990 + }, + { + "epoch": 1.58, + "learning_rate": 6.237443936007588e-05, + "loss": 0.0059, + "step": 314000 + }, + { + "epoch": 1.58, + "eval_cer": 0.9144314400581461, + "eval_loss": 0.005062195006757975, + "eval_runtime": 116.4946, + "eval_samples_per_second": 17.168, + "eval_steps_per_second": 4.292, + "step": 314000 + }, + { + "epoch": 1.58, + "learning_rate": 6.236687166706186e-05, + "loss": 0.0077, + "step": 314010 + }, + { + "epoch": 1.58, + "learning_rate": 6.235930397404785e-05, + "loss": 0.0077, + "step": 314020 + }, + { + "epoch": 1.58, + "learning_rate": 6.235173628103385e-05, + "loss": 0.0076, + "step": 314030 + }, + { + "epoch": 1.58, + "learning_rate": 6.234416858801983e-05, + "loss": 0.009, + "step": 314040 + }, + { + "epoch": 1.58, + "learning_rate": 6.233660089500583e-05, + "loss": 0.0073, + "step": 314050 + }, + { + "epoch": 1.58, + "learning_rate": 6.232903320199182e-05, + "loss": 0.0057, + "step": 314060 + }, + { + "epoch": 1.58, + "learning_rate": 6.23214655089778e-05, + "loss": 0.008, + "step": 314070 + }, + { + "epoch": 1.58, + "learning_rate": 6.231389781596378e-05, + "loss": 0.0063, + "step": 314080 + }, + { + "epoch": 1.58, + "learning_rate": 6.230633012294978e-05, + "loss": 0.0072, + "step": 314090 + }, + { + "epoch": 1.58, + "learning_rate": 6.229876242993576e-05, + "loss": 0.0063, + "step": 314100 + }, + { + "epoch": 1.58, + "learning_rate": 6.229119473692176e-05, + "loss": 0.0078, + "step": 314110 + }, + { + "epoch": 1.58, + "learning_rate": 6.228362704390775e-05, + "loss": 0.0059, + "step": 314120 + }, + { + "epoch": 1.58, + "learning_rate": 6.227605935089373e-05, + "loss": 0.0054, + "step": 314130 + }, + { + "epoch": 1.58, + "learning_rate": 6.226849165787973e-05, + "loss": 0.0108, + "step": 314140 + }, + { + "epoch": 1.58, + "learning_rate": 6.226092396486572e-05, + "loss": 0.0088, + "step": 314150 + }, + { + "epoch": 1.58, + "learning_rate": 6.22533562718517e-05, + "loss": 0.0065, + "step": 314160 + }, + { + "epoch": 1.59, + "learning_rate": 6.22457885788377e-05, + "loss": 0.0061, + "step": 314170 + }, + { + "epoch": 1.59, + "learning_rate": 6.223822088582369e-05, + "loss": 0.0057, + "step": 314180 + }, + { + "epoch": 1.59, + "learning_rate": 6.223065319280967e-05, + "loss": 0.0055, + "step": 314190 + }, + { + "epoch": 1.59, + "learning_rate": 6.222308549979567e-05, + "loss": 0.0079, + "step": 314200 + }, + { + "epoch": 1.59, + "learning_rate": 6.221551780678165e-05, + "loss": 0.0067, + "step": 314210 + }, + { + "epoch": 1.59, + "learning_rate": 6.220795011376765e-05, + "loss": 0.0054, + "step": 314220 + }, + { + "epoch": 1.59, + "learning_rate": 6.220038242075364e-05, + "loss": 0.008, + "step": 314230 + }, + { + "epoch": 1.59, + "learning_rate": 6.219281472773962e-05, + "loss": 0.0059, + "step": 314240 + }, + { + "epoch": 1.59, + "learning_rate": 6.218524703472562e-05, + "loss": 0.0077, + "step": 314250 + }, + { + "epoch": 1.59, + "learning_rate": 6.217767934171161e-05, + "loss": 0.0044, + "step": 314260 + }, + { + "epoch": 1.59, + "learning_rate": 6.21701116486976e-05, + "loss": 0.006, + "step": 314270 + }, + { + "epoch": 1.59, + "learning_rate": 6.216254395568359e-05, + "loss": 0.0055, + "step": 314280 + }, + { + "epoch": 1.59, + "learning_rate": 6.215497626266957e-05, + "loss": 0.0078, + "step": 314290 + }, + { + "epoch": 1.59, + "learning_rate": 6.214740856965557e-05, + "loss": 0.0053, + "step": 314300 + }, + { + "epoch": 1.59, + "learning_rate": 6.213984087664156e-05, + "loss": 0.0059, + "step": 314310 + }, + { + "epoch": 1.59, + "learning_rate": 6.213227318362754e-05, + "loss": 0.0065, + "step": 314320 + }, + { + "epoch": 1.59, + "learning_rate": 6.212470549061354e-05, + "loss": 0.0067, + "step": 314330 + }, + { + "epoch": 1.59, + "learning_rate": 6.211713779759953e-05, + "loss": 0.0048, + "step": 314340 + }, + { + "epoch": 1.59, + "learning_rate": 6.210957010458551e-05, + "loss": 0.0059, + "step": 314350 + }, + { + "epoch": 1.59, + "learning_rate": 6.210200241157151e-05, + "loss": 0.0077, + "step": 314360 + }, + { + "epoch": 1.59, + "learning_rate": 6.209443471855749e-05, + "loss": 0.0072, + "step": 314370 + }, + { + "epoch": 1.59, + "learning_rate": 6.208686702554347e-05, + "loss": 0.0073, + "step": 314380 + }, + { + "epoch": 1.59, + "learning_rate": 6.207929933252947e-05, + "loss": 0.008, + "step": 314390 + }, + { + "epoch": 1.59, + "learning_rate": 6.207173163951546e-05, + "loss": 0.009, + "step": 314400 + }, + { + "epoch": 1.59, + "learning_rate": 6.206416394650144e-05, + "loss": 0.0056, + "step": 314410 + }, + { + "epoch": 1.59, + "learning_rate": 6.205659625348744e-05, + "loss": 0.0077, + "step": 314420 + }, + { + "epoch": 1.59, + "learning_rate": 6.204902856047343e-05, + "loss": 0.009, + "step": 314430 + }, + { + "epoch": 1.59, + "learning_rate": 6.204146086745941e-05, + "loss": 0.0066, + "step": 314440 + }, + { + "epoch": 1.59, + "learning_rate": 6.203389317444541e-05, + "loss": 0.0058, + "step": 314450 + }, + { + "epoch": 1.59, + "learning_rate": 6.202632548143139e-05, + "loss": 0.0071, + "step": 314460 + }, + { + "epoch": 1.59, + "learning_rate": 6.201875778841739e-05, + "loss": 0.0058, + "step": 314470 + }, + { + "epoch": 1.59, + "learning_rate": 6.201119009540338e-05, + "loss": 0.0066, + "step": 314480 + }, + { + "epoch": 1.59, + "learning_rate": 6.200362240238936e-05, + "loss": 0.0054, + "step": 314490 + }, + { + "epoch": 1.59, + "learning_rate": 6.199605470937536e-05, + "loss": 0.0047, + "step": 314500 + }, + { + "epoch": 1.59, + "learning_rate": 6.198848701636135e-05, + "loss": 0.0054, + "step": 314510 + }, + { + "epoch": 1.59, + "learning_rate": 6.198091932334733e-05, + "loss": 0.0074, + "step": 314520 + }, + { + "epoch": 1.59, + "learning_rate": 6.197335163033333e-05, + "loss": 0.0062, + "step": 314530 + }, + { + "epoch": 1.59, + "learning_rate": 6.196578393731931e-05, + "loss": 0.0069, + "step": 314540 + }, + { + "epoch": 1.59, + "learning_rate": 6.19582162443053e-05, + "loss": 0.0075, + "step": 314550 + }, + { + "epoch": 1.59, + "learning_rate": 6.19506485512913e-05, + "loss": 0.0078, + "step": 314560 + }, + { + "epoch": 1.59, + "learning_rate": 6.194308085827728e-05, + "loss": 0.0059, + "step": 314570 + }, + { + "epoch": 1.59, + "learning_rate": 6.193551316526328e-05, + "loss": 0.009, + "step": 314580 + }, + { + "epoch": 1.59, + "learning_rate": 6.192794547224927e-05, + "loss": 0.005, + "step": 314590 + }, + { + "epoch": 1.59, + "learning_rate": 6.192037777923525e-05, + "loss": 0.0057, + "step": 314600 + }, + { + "epoch": 1.59, + "learning_rate": 6.191281008622125e-05, + "loss": 0.0071, + "step": 314610 + }, + { + "epoch": 1.59, + "learning_rate": 6.190524239320723e-05, + "loss": 0.0094, + "step": 314620 + }, + { + "epoch": 1.59, + "learning_rate": 6.189767470019322e-05, + "loss": 0.0065, + "step": 314630 + }, + { + "epoch": 1.59, + "learning_rate": 6.189010700717922e-05, + "loss": 0.0076, + "step": 314640 + }, + { + "epoch": 1.59, + "learning_rate": 6.18825393141652e-05, + "loss": 0.0073, + "step": 314650 + }, + { + "epoch": 1.59, + "learning_rate": 6.18749716211512e-05, + "loss": 0.008, + "step": 314660 + }, + { + "epoch": 1.59, + "learning_rate": 6.186740392813719e-05, + "loss": 0.0083, + "step": 314670 + }, + { + "epoch": 1.59, + "learning_rate": 6.185983623512317e-05, + "loss": 0.0071, + "step": 314680 + }, + { + "epoch": 1.59, + "learning_rate": 6.185226854210917e-05, + "loss": 0.0076, + "step": 314690 + }, + { + "epoch": 1.59, + "learning_rate": 6.184470084909515e-05, + "loss": 0.0044, + "step": 314700 + }, + { + "epoch": 1.59, + "learning_rate": 6.183713315608114e-05, + "loss": 0.0069, + "step": 314710 + }, + { + "epoch": 1.59, + "learning_rate": 6.182956546306712e-05, + "loss": 0.0063, + "step": 314720 + }, + { + "epoch": 1.59, + "learning_rate": 6.182199777005312e-05, + "loss": 0.0069, + "step": 314730 + }, + { + "epoch": 1.59, + "learning_rate": 6.18144300770391e-05, + "loss": 0.0115, + "step": 314740 + }, + { + "epoch": 1.59, + "learning_rate": 6.18068623840251e-05, + "loss": 0.006, + "step": 314750 + }, + { + "epoch": 1.59, + "learning_rate": 6.179929469101109e-05, + "loss": 0.0079, + "step": 314760 + }, + { + "epoch": 1.59, + "learning_rate": 6.179172699799707e-05, + "loss": 0.0067, + "step": 314770 + }, + { + "epoch": 1.59, + "learning_rate": 6.178415930498307e-05, + "loss": 0.007, + "step": 314780 + }, + { + "epoch": 1.59, + "learning_rate": 6.177659161196906e-05, + "loss": 0.0061, + "step": 314790 + }, + { + "epoch": 1.59, + "learning_rate": 6.176902391895504e-05, + "loss": 0.0072, + "step": 314800 + }, + { + "epoch": 1.59, + "learning_rate": 6.176145622594104e-05, + "loss": 0.0067, + "step": 314810 + }, + { + "epoch": 1.59, + "learning_rate": 6.175388853292702e-05, + "loss": 0.0058, + "step": 314820 + }, + { + "epoch": 1.59, + "learning_rate": 6.174632083991302e-05, + "loss": 0.007, + "step": 314830 + }, + { + "epoch": 1.59, + "learning_rate": 6.173875314689901e-05, + "loss": 0.007, + "step": 314840 + }, + { + "epoch": 1.59, + "learning_rate": 6.173118545388499e-05, + "loss": 0.0058, + "step": 314850 + }, + { + "epoch": 1.59, + "learning_rate": 6.172361776087099e-05, + "loss": 0.0064, + "step": 314860 + }, + { + "epoch": 1.59, + "learning_rate": 6.171605006785698e-05, + "loss": 0.0074, + "step": 314870 + }, + { + "epoch": 1.59, + "learning_rate": 6.170848237484296e-05, + "loss": 0.0107, + "step": 314880 + }, + { + "epoch": 1.59, + "learning_rate": 6.170091468182896e-05, + "loss": 0.0055, + "step": 314890 + }, + { + "epoch": 1.59, + "learning_rate": 6.169334698881494e-05, + "loss": 0.0083, + "step": 314900 + }, + { + "epoch": 1.59, + "learning_rate": 6.168577929580093e-05, + "loss": 0.0074, + "step": 314910 + }, + { + "epoch": 1.59, + "learning_rate": 6.167821160278693e-05, + "loss": 0.0082, + "step": 314920 + }, + { + "epoch": 1.59, + "learning_rate": 6.167064390977291e-05, + "loss": 0.0071, + "step": 314930 + }, + { + "epoch": 1.59, + "learning_rate": 6.16630762167589e-05, + "loss": 0.0073, + "step": 314940 + }, + { + "epoch": 1.59, + "learning_rate": 6.16555085237449e-05, + "loss": 0.007, + "step": 314950 + }, + { + "epoch": 1.59, + "learning_rate": 6.164794083073088e-05, + "loss": 0.0045, + "step": 314960 + }, + { + "epoch": 1.59, + "learning_rate": 6.164037313771688e-05, + "loss": 0.0061, + "step": 314970 + }, + { + "epoch": 1.59, + "learning_rate": 6.163280544470286e-05, + "loss": 0.0056, + "step": 314980 + }, + { + "epoch": 1.59, + "learning_rate": 6.162523775168885e-05, + "loss": 0.0069, + "step": 314990 + }, + { + "epoch": 1.59, + "learning_rate": 6.161767005867485e-05, + "loss": 0.0065, + "step": 315000 + }, + { + "epoch": 1.59, + "eval_cer": 0.9144207657007667, + "eval_loss": 0.005126504693180323, + "eval_runtime": 116.2813, + "eval_samples_per_second": 17.2, + "eval_steps_per_second": 4.3, + "step": 315000 + }, + { + "epoch": 1.59, + "learning_rate": 6.161010236566083e-05, + "loss": 0.0066, + "step": 315010 + }, + { + "epoch": 1.59, + "learning_rate": 6.160253467264681e-05, + "loss": 0.0056, + "step": 315020 + }, + { + "epoch": 1.59, + "learning_rate": 6.159496697963281e-05, + "loss": 0.005, + "step": 315030 + }, + { + "epoch": 1.59, + "learning_rate": 6.15873992866188e-05, + "loss": 0.0087, + "step": 315040 + }, + { + "epoch": 1.59, + "learning_rate": 6.157983159360478e-05, + "loss": 0.0079, + "step": 315050 + }, + { + "epoch": 1.59, + "learning_rate": 6.157226390059078e-05, + "loss": 0.0066, + "step": 315060 + }, + { + "epoch": 1.59, + "learning_rate": 6.156469620757676e-05, + "loss": 0.0067, + "step": 315070 + }, + { + "epoch": 1.59, + "learning_rate": 6.155712851456275e-05, + "loss": 0.0095, + "step": 315080 + }, + { + "epoch": 1.59, + "learning_rate": 6.154956082154875e-05, + "loss": 0.0076, + "step": 315090 + }, + { + "epoch": 1.59, + "learning_rate": 6.154199312853473e-05, + "loss": 0.0104, + "step": 315100 + }, + { + "epoch": 1.59, + "learning_rate": 6.153442543552073e-05, + "loss": 0.0092, + "step": 315110 + }, + { + "epoch": 1.59, + "learning_rate": 6.152685774250672e-05, + "loss": 0.0069, + "step": 315120 + }, + { + "epoch": 1.59, + "learning_rate": 6.15192900494927e-05, + "loss": 0.0068, + "step": 315130 + }, + { + "epoch": 1.59, + "learning_rate": 6.15117223564787e-05, + "loss": 0.0065, + "step": 315140 + }, + { + "epoch": 1.59, + "learning_rate": 6.150415466346469e-05, + "loss": 0.007, + "step": 315150 + }, + { + "epoch": 1.59, + "learning_rate": 6.149658697045067e-05, + "loss": 0.0081, + "step": 315160 + }, + { + "epoch": 1.59, + "learning_rate": 6.148901927743667e-05, + "loss": 0.0069, + "step": 315170 + }, + { + "epoch": 1.59, + "learning_rate": 6.148145158442265e-05, + "loss": 0.0062, + "step": 315180 + }, + { + "epoch": 1.59, + "learning_rate": 6.147388389140865e-05, + "loss": 0.0071, + "step": 315190 + }, + { + "epoch": 1.59, + "learning_rate": 6.146631619839464e-05, + "loss": 0.0067, + "step": 315200 + }, + { + "epoch": 1.59, + "learning_rate": 6.145874850538062e-05, + "loss": 0.0073, + "step": 315210 + }, + { + "epoch": 1.59, + "learning_rate": 6.145118081236662e-05, + "loss": 0.0079, + "step": 315220 + }, + { + "epoch": 1.59, + "learning_rate": 6.144361311935261e-05, + "loss": 0.0061, + "step": 315230 + }, + { + "epoch": 1.59, + "learning_rate": 6.14360454263386e-05, + "loss": 0.0062, + "step": 315240 + }, + { + "epoch": 1.59, + "learning_rate": 6.142847773332459e-05, + "loss": 0.0074, + "step": 315250 + }, + { + "epoch": 1.59, + "learning_rate": 6.142091004031057e-05, + "loss": 0.0063, + "step": 315260 + }, + { + "epoch": 1.59, + "learning_rate": 6.141334234729656e-05, + "loss": 0.0068, + "step": 315270 + }, + { + "epoch": 1.59, + "learning_rate": 6.140577465428256e-05, + "loss": 0.0056, + "step": 315280 + }, + { + "epoch": 1.59, + "learning_rate": 6.139820696126854e-05, + "loss": 0.006, + "step": 315290 + }, + { + "epoch": 1.59, + "learning_rate": 6.139063926825454e-05, + "loss": 0.0071, + "step": 315300 + }, + { + "epoch": 1.59, + "learning_rate": 6.138307157524053e-05, + "loss": 0.0074, + "step": 315310 + }, + { + "epoch": 1.59, + "learning_rate": 6.137550388222651e-05, + "loss": 0.0052, + "step": 315320 + }, + { + "epoch": 1.59, + "learning_rate": 6.13679361892125e-05, + "loss": 0.0058, + "step": 315330 + }, + { + "epoch": 1.59, + "learning_rate": 6.136036849619849e-05, + "loss": 0.0059, + "step": 315340 + }, + { + "epoch": 1.59, + "learning_rate": 6.135280080318447e-05, + "loss": 0.0061, + "step": 315350 + }, + { + "epoch": 1.59, + "learning_rate": 6.134523311017047e-05, + "loss": 0.0066, + "step": 315360 + }, + { + "epoch": 1.59, + "learning_rate": 6.133766541715646e-05, + "loss": 0.006, + "step": 315370 + }, + { + "epoch": 1.59, + "learning_rate": 6.133009772414244e-05, + "loss": 0.0069, + "step": 315380 + }, + { + "epoch": 1.59, + "learning_rate": 6.132253003112844e-05, + "loss": 0.0068, + "step": 315390 + }, + { + "epoch": 1.59, + "learning_rate": 6.131496233811443e-05, + "loss": 0.0075, + "step": 315400 + }, + { + "epoch": 1.59, + "learning_rate": 6.130739464510041e-05, + "loss": 0.0056, + "step": 315410 + }, + { + "epoch": 1.59, + "learning_rate": 6.129982695208641e-05, + "loss": 0.0073, + "step": 315420 + }, + { + "epoch": 1.59, + "learning_rate": 6.129225925907239e-05, + "loss": 0.0071, + "step": 315430 + }, + { + "epoch": 1.59, + "learning_rate": 6.128469156605838e-05, + "loss": 0.0067, + "step": 315440 + }, + { + "epoch": 1.59, + "learning_rate": 6.127712387304438e-05, + "loss": 0.0065, + "step": 315450 + }, + { + "epoch": 1.59, + "learning_rate": 6.126955618003036e-05, + "loss": 0.0083, + "step": 315460 + }, + { + "epoch": 1.59, + "learning_rate": 6.126198848701636e-05, + "loss": 0.0102, + "step": 315470 + }, + { + "epoch": 1.59, + "learning_rate": 6.125442079400235e-05, + "loss": 0.0066, + "step": 315480 + }, + { + "epoch": 1.59, + "learning_rate": 6.124685310098833e-05, + "loss": 0.0063, + "step": 315490 + }, + { + "epoch": 1.59, + "learning_rate": 6.123928540797433e-05, + "loss": 0.0067, + "step": 315500 + }, + { + "epoch": 1.59, + "learning_rate": 6.123171771496031e-05, + "loss": 0.0053, + "step": 315510 + }, + { + "epoch": 1.59, + "learning_rate": 6.12241500219463e-05, + "loss": 0.0068, + "step": 315520 + }, + { + "epoch": 1.59, + "learning_rate": 6.12165823289323e-05, + "loss": 0.0058, + "step": 315530 + }, + { + "epoch": 1.59, + "learning_rate": 6.120901463591828e-05, + "loss": 0.0059, + "step": 315540 + }, + { + "epoch": 1.59, + "learning_rate": 6.120144694290428e-05, + "loss": 0.0056, + "step": 315550 + }, + { + "epoch": 1.59, + "learning_rate": 6.119387924989027e-05, + "loss": 0.0081, + "step": 315560 + }, + { + "epoch": 1.59, + "learning_rate": 6.118631155687625e-05, + "loss": 0.0082, + "step": 315570 + }, + { + "epoch": 1.59, + "learning_rate": 6.117874386386225e-05, + "loss": 0.0081, + "step": 315580 + }, + { + "epoch": 1.59, + "learning_rate": 6.117117617084823e-05, + "loss": 0.0059, + "step": 315590 + }, + { + "epoch": 1.59, + "learning_rate": 6.116360847783422e-05, + "loss": 0.0094, + "step": 315600 + }, + { + "epoch": 1.59, + "learning_rate": 6.115604078482022e-05, + "loss": 0.0084, + "step": 315610 + }, + { + "epoch": 1.59, + "learning_rate": 6.11484730918062e-05, + "loss": 0.006, + "step": 315620 + }, + { + "epoch": 1.59, + "learning_rate": 6.11409053987922e-05, + "loss": 0.0066, + "step": 315630 + }, + { + "epoch": 1.59, + "learning_rate": 6.113333770577818e-05, + "loss": 0.0074, + "step": 315640 + }, + { + "epoch": 1.59, + "learning_rate": 6.112577001276417e-05, + "loss": 0.0058, + "step": 315650 + }, + { + "epoch": 1.59, + "learning_rate": 6.111820231975015e-05, + "loss": 0.0058, + "step": 315660 + }, + { + "epoch": 1.59, + "learning_rate": 6.111063462673615e-05, + "loss": 0.0076, + "step": 315670 + }, + { + "epoch": 1.59, + "learning_rate": 6.110306693372214e-05, + "loss": 0.0055, + "step": 315680 + }, + { + "epoch": 1.59, + "learning_rate": 6.109549924070812e-05, + "loss": 0.0111, + "step": 315690 + }, + { + "epoch": 1.59, + "learning_rate": 6.108793154769412e-05, + "loss": 0.0078, + "step": 315700 + }, + { + "epoch": 1.59, + "learning_rate": 6.10803638546801e-05, + "loss": 0.0075, + "step": 315710 + }, + { + "epoch": 1.59, + "learning_rate": 6.10727961616661e-05, + "loss": 0.0073, + "step": 315720 + }, + { + "epoch": 1.59, + "learning_rate": 6.106522846865209e-05, + "loss": 0.0062, + "step": 315730 + }, + { + "epoch": 1.59, + "learning_rate": 6.105766077563807e-05, + "loss": 0.009, + "step": 315740 + }, + { + "epoch": 1.59, + "learning_rate": 6.105009308262407e-05, + "loss": 0.0069, + "step": 315750 + }, + { + "epoch": 1.59, + "learning_rate": 6.104252538961006e-05, + "loss": 0.0073, + "step": 315760 + }, + { + "epoch": 1.59, + "learning_rate": 6.1034957696596043e-05, + "loss": 0.0092, + "step": 315770 + }, + { + "epoch": 1.59, + "learning_rate": 6.102739000358204e-05, + "loss": 0.0078, + "step": 315780 + }, + { + "epoch": 1.59, + "learning_rate": 6.101982231056803e-05, + "loss": 0.0065, + "step": 315790 + }, + { + "epoch": 1.59, + "learning_rate": 6.1012254617554015e-05, + "loss": 0.0066, + "step": 315800 + }, + { + "epoch": 1.59, + "learning_rate": 6.100468692454e-05, + "loss": 0.007, + "step": 315810 + }, + { + "epoch": 1.59, + "learning_rate": 6.0997119231526e-05, + "loss": 0.007, + "step": 315820 + }, + { + "epoch": 1.59, + "learning_rate": 6.0989551538511986e-05, + "loss": 0.0057, + "step": 315830 + }, + { + "epoch": 1.59, + "learning_rate": 6.0981983845497975e-05, + "loss": 0.0086, + "step": 315840 + }, + { + "epoch": 1.59, + "learning_rate": 6.097441615248396e-05, + "loss": 0.012, + "step": 315850 + }, + { + "epoch": 1.59, + "learning_rate": 6.096684845946996e-05, + "loss": 0.0072, + "step": 315860 + }, + { + "epoch": 1.59, + "learning_rate": 6.0959280766455946e-05, + "loss": 0.0114, + "step": 315870 + }, + { + "epoch": 1.59, + "learning_rate": 6.0951713073441934e-05, + "loss": 0.0061, + "step": 315880 + }, + { + "epoch": 1.59, + "learning_rate": 6.094414538042792e-05, + "loss": 0.0058, + "step": 315890 + }, + { + "epoch": 1.59, + "learning_rate": 6.093657768741392e-05, + "loss": 0.007, + "step": 315900 + }, + { + "epoch": 1.59, + "learning_rate": 6.0929009994399906e-05, + "loss": 0.005, + "step": 315910 + }, + { + "epoch": 1.59, + "learning_rate": 6.0921442301385894e-05, + "loss": 0.0061, + "step": 315920 + }, + { + "epoch": 1.59, + "learning_rate": 6.091387460837188e-05, + "loss": 0.0048, + "step": 315930 + }, + { + "epoch": 1.59, + "learning_rate": 6.090630691535788e-05, + "loss": 0.0077, + "step": 315940 + }, + { + "epoch": 1.59, + "learning_rate": 6.089873922234386e-05, + "loss": 0.0074, + "step": 315950 + }, + { + "epoch": 1.59, + "learning_rate": 6.089117152932985e-05, + "loss": 0.0066, + "step": 315960 + }, + { + "epoch": 1.59, + "learning_rate": 6.0883603836315835e-05, + "loss": 0.0072, + "step": 315970 + }, + { + "epoch": 1.59, + "learning_rate": 6.087603614330182e-05, + "loss": 0.0065, + "step": 315980 + }, + { + "epoch": 1.59, + "learning_rate": 6.086846845028782e-05, + "loss": 0.0066, + "step": 315990 + }, + { + "epoch": 1.59, + "learning_rate": 6.0860900757273806e-05, + "loss": 0.0074, + "step": 316000 + }, + { + "epoch": 1.59, + "eval_cer": 0.9144411440194001, + "eval_loss": 0.005030008032917976, + "eval_runtime": 116.3264, + "eval_samples_per_second": 17.193, + "eval_steps_per_second": 4.298, + "step": 316000 + }, + { + "epoch": 1.59, + "learning_rate": 6.0853333064259795e-05, + "loss": 0.0076, + "step": 316010 + }, + { + "epoch": 1.59, + "learning_rate": 6.084576537124578e-05, + "loss": 0.0054, + "step": 316020 + }, + { + "epoch": 1.59, + "learning_rate": 6.083819767823178e-05, + "loss": 0.0062, + "step": 316030 + }, + { + "epoch": 1.59, + "learning_rate": 6.0830629985217766e-05, + "loss": 0.0065, + "step": 316040 + }, + { + "epoch": 1.59, + "learning_rate": 6.0823062292203754e-05, + "loss": 0.0074, + "step": 316050 + }, + { + "epoch": 1.59, + "learning_rate": 6.081549459918974e-05, + "loss": 0.0079, + "step": 316060 + }, + { + "epoch": 1.59, + "learning_rate": 6.080792690617574e-05, + "loss": 0.0049, + "step": 316070 + }, + { + "epoch": 1.59, + "learning_rate": 6.0800359213161726e-05, + "loss": 0.0077, + "step": 316080 + }, + { + "epoch": 1.59, + "learning_rate": 6.0792791520147714e-05, + "loss": 0.0063, + "step": 316090 + }, + { + "epoch": 1.59, + "learning_rate": 6.078522382713371e-05, + "loss": 0.0048, + "step": 316100 + }, + { + "epoch": 1.59, + "learning_rate": 6.07776561341197e-05, + "loss": 0.0065, + "step": 316110 + }, + { + "epoch": 1.59, + "learning_rate": 6.0770088441105685e-05, + "loss": 0.0096, + "step": 316120 + }, + { + "epoch": 1.59, + "learning_rate": 6.0762520748091674e-05, + "loss": 0.0071, + "step": 316130 + }, + { + "epoch": 1.59, + "learning_rate": 6.075495305507767e-05, + "loss": 0.0065, + "step": 316140 + }, + { + "epoch": 1.6, + "learning_rate": 6.074738536206366e-05, + "loss": 0.008, + "step": 316150 + }, + { + "epoch": 1.6, + "learning_rate": 6.0739817669049645e-05, + "loss": 0.0064, + "step": 316160 + }, + { + "epoch": 1.6, + "learning_rate": 6.073224997603563e-05, + "loss": 0.0063, + "step": 316170 + }, + { + "epoch": 1.6, + "learning_rate": 6.072468228302163e-05, + "loss": 0.0061, + "step": 316180 + }, + { + "epoch": 1.6, + "learning_rate": 6.0717114590007616e-05, + "loss": 0.0071, + "step": 316190 + }, + { + "epoch": 1.6, + "learning_rate": 6.0709546896993605e-05, + "loss": 0.0059, + "step": 316200 + }, + { + "epoch": 1.6, + "learning_rate": 6.070197920397959e-05, + "loss": 0.0062, + "step": 316210 + }, + { + "epoch": 1.6, + "learning_rate": 6.069441151096559e-05, + "loss": 0.0078, + "step": 316220 + }, + { + "epoch": 1.6, + "learning_rate": 6.0686843817951576e-05, + "loss": 0.0047, + "step": 316230 + }, + { + "epoch": 1.6, + "learning_rate": 6.0679276124937564e-05, + "loss": 0.0082, + "step": 316240 + }, + { + "epoch": 1.6, + "learning_rate": 6.067170843192355e-05, + "loss": 0.0061, + "step": 316250 + }, + { + "epoch": 1.6, + "learning_rate": 6.066414073890955e-05, + "loss": 0.007, + "step": 316260 + }, + { + "epoch": 1.6, + "learning_rate": 6.065657304589553e-05, + "loss": 0.0065, + "step": 316270 + }, + { + "epoch": 1.6, + "learning_rate": 6.064900535288152e-05, + "loss": 0.0071, + "step": 316280 + }, + { + "epoch": 1.6, + "learning_rate": 6.0641437659867505e-05, + "loss": 0.0086, + "step": 316290 + }, + { + "epoch": 1.6, + "learning_rate": 6.0633869966853494e-05, + "loss": 0.0066, + "step": 316300 + }, + { + "epoch": 1.6, + "learning_rate": 6.062630227383949e-05, + "loss": 0.0069, + "step": 316310 + }, + { + "epoch": 1.6, + "learning_rate": 6.061873458082548e-05, + "loss": 0.0085, + "step": 316320 + }, + { + "epoch": 1.6, + "learning_rate": 6.0611166887811465e-05, + "loss": 0.0069, + "step": 316330 + }, + { + "epoch": 1.6, + "learning_rate": 6.060359919479745e-05, + "loss": 0.0051, + "step": 316340 + }, + { + "epoch": 1.6, + "learning_rate": 6.059603150178345e-05, + "loss": 0.0067, + "step": 316350 + }, + { + "epoch": 1.6, + "learning_rate": 6.0588463808769436e-05, + "loss": 0.008, + "step": 316360 + }, + { + "epoch": 1.6, + "learning_rate": 6.0580896115755425e-05, + "loss": 0.0068, + "step": 316370 + }, + { + "epoch": 1.6, + "learning_rate": 6.057332842274141e-05, + "loss": 0.0075, + "step": 316380 + }, + { + "epoch": 1.6, + "learning_rate": 6.056576072972741e-05, + "loss": 0.0064, + "step": 316390 + }, + { + "epoch": 1.6, + "learning_rate": 6.0558193036713396e-05, + "loss": 0.0074, + "step": 316400 + }, + { + "epoch": 1.6, + "learning_rate": 6.0550625343699384e-05, + "loss": 0.0068, + "step": 316410 + }, + { + "epoch": 1.6, + "learning_rate": 6.054305765068537e-05, + "loss": 0.008, + "step": 316420 + }, + { + "epoch": 1.6, + "learning_rate": 6.053548995767137e-05, + "loss": 0.0083, + "step": 316430 + }, + { + "epoch": 1.6, + "learning_rate": 6.0527922264657356e-05, + "loss": 0.0059, + "step": 316440 + }, + { + "epoch": 1.6, + "learning_rate": 6.0520354571643344e-05, + "loss": 0.0067, + "step": 316450 + }, + { + "epoch": 1.6, + "learning_rate": 6.051278687862933e-05, + "loss": 0.006, + "step": 316460 + }, + { + "epoch": 1.6, + "learning_rate": 6.050521918561533e-05, + "loss": 0.0087, + "step": 316470 + }, + { + "epoch": 1.6, + "learning_rate": 6.0497651492601315e-05, + "loss": 0.0085, + "step": 316480 + }, + { + "epoch": 1.6, + "learning_rate": 6.0490083799587304e-05, + "loss": 0.0067, + "step": 316490 + }, + { + "epoch": 1.6, + "learning_rate": 6.048251610657329e-05, + "loss": 0.0072, + "step": 316500 + }, + { + "epoch": 1.6, + "learning_rate": 6.047494841355929e-05, + "loss": 0.0058, + "step": 316510 + }, + { + "epoch": 1.6, + "learning_rate": 6.0467380720545275e-05, + "loss": 0.0068, + "step": 316520 + }, + { + "epoch": 1.6, + "learning_rate": 6.045981302753126e-05, + "loss": 0.0078, + "step": 316530 + }, + { + "epoch": 1.6, + "learning_rate": 6.045224533451725e-05, + "loss": 0.0058, + "step": 316540 + }, + { + "epoch": 1.6, + "learning_rate": 6.0444677641503247e-05, + "loss": 0.0058, + "step": 316550 + }, + { + "epoch": 1.6, + "learning_rate": 6.0437109948489235e-05, + "loss": 0.0059, + "step": 316560 + }, + { + "epoch": 1.6, + "learning_rate": 6.042954225547522e-05, + "loss": 0.0072, + "step": 316570 + }, + { + "epoch": 1.6, + "learning_rate": 6.0421974562461204e-05, + "loss": 0.0066, + "step": 316580 + }, + { + "epoch": 1.6, + "learning_rate": 6.04144068694472e-05, + "loss": 0.0072, + "step": 316590 + }, + { + "epoch": 1.6, + "learning_rate": 6.040683917643319e-05, + "loss": 0.0076, + "step": 316600 + }, + { + "epoch": 1.6, + "learning_rate": 6.0399271483419176e-05, + "loss": 0.0056, + "step": 316610 + }, + { + "epoch": 1.6, + "learning_rate": 6.0391703790405164e-05, + "loss": 0.0062, + "step": 316620 + }, + { + "epoch": 1.6, + "learning_rate": 6.038413609739116e-05, + "loss": 0.0059, + "step": 316630 + }, + { + "epoch": 1.6, + "learning_rate": 6.037656840437715e-05, + "loss": 0.0069, + "step": 316640 + }, + { + "epoch": 1.6, + "learning_rate": 6.0369000711363135e-05, + "loss": 0.0065, + "step": 316650 + }, + { + "epoch": 1.6, + "learning_rate": 6.0361433018349124e-05, + "loss": 0.0063, + "step": 316660 + }, + { + "epoch": 1.6, + "learning_rate": 6.035386532533512e-05, + "loss": 0.0062, + "step": 316670 + }, + { + "epoch": 1.6, + "learning_rate": 6.034629763232111e-05, + "loss": 0.0071, + "step": 316680 + }, + { + "epoch": 1.6, + "learning_rate": 6.0338729939307095e-05, + "loss": 0.0061, + "step": 316690 + }, + { + "epoch": 1.6, + "learning_rate": 6.033116224629308e-05, + "loss": 0.0063, + "step": 316700 + }, + { + "epoch": 1.6, + "learning_rate": 6.032359455327908e-05, + "loss": 0.0057, + "step": 316710 + }, + { + "epoch": 1.6, + "learning_rate": 6.0316026860265067e-05, + "loss": 0.0077, + "step": 316720 + }, + { + "epoch": 1.6, + "learning_rate": 6.0308459167251055e-05, + "loss": 0.0075, + "step": 316730 + }, + { + "epoch": 1.6, + "learning_rate": 6.030089147423704e-05, + "loss": 0.0062, + "step": 316740 + }, + { + "epoch": 1.6, + "learning_rate": 6.029332378122304e-05, + "loss": 0.0076, + "step": 316750 + }, + { + "epoch": 1.6, + "learning_rate": 6.0285756088209026e-05, + "loss": 0.0052, + "step": 316760 + }, + { + "epoch": 1.6, + "learning_rate": 6.0278188395195014e-05, + "loss": 0.0074, + "step": 316770 + }, + { + "epoch": 1.6, + "learning_rate": 6.0270620702181e-05, + "loss": 0.0052, + "step": 316780 + }, + { + "epoch": 1.6, + "learning_rate": 6.0263053009167e-05, + "loss": 0.0064, + "step": 316790 + }, + { + "epoch": 1.6, + "learning_rate": 6.0255485316152986e-05, + "loss": 0.0097, + "step": 316800 + }, + { + "epoch": 1.6, + "learning_rate": 6.0247917623138974e-05, + "loss": 0.0076, + "step": 316810 + }, + { + "epoch": 1.6, + "learning_rate": 6.024034993012496e-05, + "loss": 0.0068, + "step": 316820 + }, + { + "epoch": 1.6, + "learning_rate": 6.023278223711096e-05, + "loss": 0.0074, + "step": 316830 + }, + { + "epoch": 1.6, + "learning_rate": 6.0225214544096946e-05, + "loss": 0.0074, + "step": 316840 + }, + { + "epoch": 1.6, + "learning_rate": 6.0217646851082934e-05, + "loss": 0.0053, + "step": 316850 + }, + { + "epoch": 1.6, + "learning_rate": 6.021007915806892e-05, + "loss": 0.0082, + "step": 316860 + }, + { + "epoch": 1.6, + "learning_rate": 6.020251146505492e-05, + "loss": 0.008, + "step": 316870 + }, + { + "epoch": 1.6, + "learning_rate": 6.0194943772040905e-05, + "loss": 0.0058, + "step": 316880 + }, + { + "epoch": 1.6, + "learning_rate": 6.018737607902689e-05, + "loss": 0.0061, + "step": 316890 + }, + { + "epoch": 1.6, + "learning_rate": 6.0179808386012875e-05, + "loss": 0.007, + "step": 316900 + }, + { + "epoch": 1.6, + "learning_rate": 6.017224069299886e-05, + "loss": 0.0055, + "step": 316910 + }, + { + "epoch": 1.6, + "learning_rate": 6.016467299998486e-05, + "loss": 0.0083, + "step": 316920 + }, + { + "epoch": 1.6, + "learning_rate": 6.0157105306970846e-05, + "loss": 0.0068, + "step": 316930 + }, + { + "epoch": 1.6, + "learning_rate": 6.0149537613956834e-05, + "loss": 0.0087, + "step": 316940 + }, + { + "epoch": 1.6, + "learning_rate": 6.014196992094282e-05, + "loss": 0.007, + "step": 316950 + }, + { + "epoch": 1.6, + "learning_rate": 6.013440222792882e-05, + "loss": 0.0087, + "step": 316960 + }, + { + "epoch": 1.6, + "learning_rate": 6.0126834534914806e-05, + "loss": 0.006, + "step": 316970 + }, + { + "epoch": 1.6, + "learning_rate": 6.0119266841900794e-05, + "loss": 0.0063, + "step": 316980 + }, + { + "epoch": 1.6, + "learning_rate": 6.011169914888678e-05, + "loss": 0.0073, + "step": 316990 + }, + { + "epoch": 1.6, + "learning_rate": 6.010413145587278e-05, + "loss": 0.0076, + "step": 317000 + }, + { + "epoch": 1.6, + "eval_cer": 0.9144518183767796, + "eval_loss": 0.005164159927517176, + "eval_runtime": 116.3465, + "eval_samples_per_second": 17.19, + "eval_steps_per_second": 4.298, + "step": 317000 + }, + { + "epoch": 1.6, + "learning_rate": 6.0096563762858766e-05, + "loss": 0.0069, + "step": 317010 + }, + { + "epoch": 1.6, + "learning_rate": 6.0088996069844754e-05, + "loss": 0.0065, + "step": 317020 + }, + { + "epoch": 1.6, + "learning_rate": 6.008142837683074e-05, + "loss": 0.0062, + "step": 317030 + }, + { + "epoch": 1.6, + "learning_rate": 6.007386068381674e-05, + "loss": 0.0066, + "step": 317040 + }, + { + "epoch": 1.6, + "learning_rate": 6.0066292990802725e-05, + "loss": 0.0097, + "step": 317050 + }, + { + "epoch": 1.6, + "learning_rate": 6.0058725297788713e-05, + "loss": 0.0098, + "step": 317060 + }, + { + "epoch": 1.6, + "learning_rate": 6.005115760477471e-05, + "loss": 0.0077, + "step": 317070 + }, + { + "epoch": 1.6, + "learning_rate": 6.00435899117607e-05, + "loss": 0.0087, + "step": 317080 + }, + { + "epoch": 1.6, + "learning_rate": 6.0036022218746685e-05, + "loss": 0.0061, + "step": 317090 + }, + { + "epoch": 1.6, + "learning_rate": 6.002845452573267e-05, + "loss": 0.0078, + "step": 317100 + }, + { + "epoch": 1.6, + "learning_rate": 6.002088683271867e-05, + "loss": 0.0063, + "step": 317110 + }, + { + "epoch": 1.6, + "learning_rate": 6.0013319139704656e-05, + "loss": 0.0056, + "step": 317120 + }, + { + "epoch": 1.6, + "learning_rate": 6.0005751446690645e-05, + "loss": 0.0068, + "step": 317130 + }, + { + "epoch": 1.6, + "learning_rate": 5.999818375367663e-05, + "loss": 0.0067, + "step": 317140 + }, + { + "epoch": 1.6, + "learning_rate": 5.999061606066263e-05, + "loss": 0.0079, + "step": 317150 + }, + { + "epoch": 1.6, + "learning_rate": 5.9983048367648616e-05, + "loss": 0.0064, + "step": 317160 + }, + { + "epoch": 1.6, + "learning_rate": 5.9975480674634604e-05, + "loss": 0.0052, + "step": 317170 + }, + { + "epoch": 1.6, + "learning_rate": 5.996791298162059e-05, + "loss": 0.007, + "step": 317180 + }, + { + "epoch": 1.6, + "learning_rate": 5.996034528860659e-05, + "loss": 0.0075, + "step": 317190 + }, + { + "epoch": 1.6, + "learning_rate": 5.9952777595592576e-05, + "loss": 0.008, + "step": 317200 + }, + { + "epoch": 1.6, + "learning_rate": 5.994520990257856e-05, + "loss": 0.006, + "step": 317210 + }, + { + "epoch": 1.6, + "learning_rate": 5.9937642209564545e-05, + "loss": 0.0053, + "step": 317220 + }, + { + "epoch": 1.6, + "learning_rate": 5.9930074516550533e-05, + "loss": 0.0084, + "step": 317230 + }, + { + "epoch": 1.6, + "learning_rate": 5.992250682353653e-05, + "loss": 0.0062, + "step": 317240 + }, + { + "epoch": 1.6, + "learning_rate": 5.991493913052252e-05, + "loss": 0.0077, + "step": 317250 + }, + { + "epoch": 1.6, + "learning_rate": 5.9907371437508505e-05, + "loss": 0.005, + "step": 317260 + }, + { + "epoch": 1.6, + "learning_rate": 5.989980374449449e-05, + "loss": 0.0086, + "step": 317270 + }, + { + "epoch": 1.6, + "learning_rate": 5.989223605148049e-05, + "loss": 0.0063, + "step": 317280 + }, + { + "epoch": 1.6, + "learning_rate": 5.9884668358466476e-05, + "loss": 0.0075, + "step": 317290 + }, + { + "epoch": 1.6, + "learning_rate": 5.9877100665452465e-05, + "loss": 0.0057, + "step": 317300 + }, + { + "epoch": 1.6, + "learning_rate": 5.986953297243845e-05, + "loss": 0.0062, + "step": 317310 + }, + { + "epoch": 1.6, + "learning_rate": 5.986196527942445e-05, + "loss": 0.0073, + "step": 317320 + }, + { + "epoch": 1.6, + "learning_rate": 5.9854397586410436e-05, + "loss": 0.0052, + "step": 317330 + }, + { + "epoch": 1.6, + "learning_rate": 5.9846829893396424e-05, + "loss": 0.0067, + "step": 317340 + }, + { + "epoch": 1.6, + "learning_rate": 5.983926220038241e-05, + "loss": 0.0061, + "step": 317350 + }, + { + "epoch": 1.6, + "learning_rate": 5.983169450736841e-05, + "loss": 0.0076, + "step": 317360 + }, + { + "epoch": 1.6, + "learning_rate": 5.9824126814354396e-05, + "loss": 0.0066, + "step": 317370 + }, + { + "epoch": 1.6, + "learning_rate": 5.9816559121340384e-05, + "loss": 0.0073, + "step": 317380 + }, + { + "epoch": 1.6, + "learning_rate": 5.980899142832637e-05, + "loss": 0.0079, + "step": 317390 + }, + { + "epoch": 1.6, + "learning_rate": 5.980142373531237e-05, + "loss": 0.0068, + "step": 317400 + }, + { + "epoch": 1.6, + "learning_rate": 5.9793856042298355e-05, + "loss": 0.0058, + "step": 317410 + }, + { + "epoch": 1.6, + "learning_rate": 5.9786288349284344e-05, + "loss": 0.0076, + "step": 317420 + }, + { + "epoch": 1.6, + "learning_rate": 5.977872065627033e-05, + "loss": 0.0062, + "step": 317430 + }, + { + "epoch": 1.6, + "learning_rate": 5.977115296325633e-05, + "loss": 0.0058, + "step": 317440 + }, + { + "epoch": 1.6, + "learning_rate": 5.9763585270242315e-05, + "loss": 0.0078, + "step": 317450 + }, + { + "epoch": 1.6, + "learning_rate": 5.97560175772283e-05, + "loss": 0.0063, + "step": 317460 + }, + { + "epoch": 1.6, + "learning_rate": 5.974844988421429e-05, + "loss": 0.0071, + "step": 317470 + }, + { + "epoch": 1.6, + "learning_rate": 5.9740882191200286e-05, + "loss": 0.0093, + "step": 317480 + }, + { + "epoch": 1.6, + "learning_rate": 5.9733314498186275e-05, + "loss": 0.008, + "step": 317490 + }, + { + "epoch": 1.6, + "learning_rate": 5.972574680517226e-05, + "loss": 0.0071, + "step": 317500 + }, + { + "epoch": 1.6, + "learning_rate": 5.971817911215825e-05, + "loss": 0.0058, + "step": 317510 + }, + { + "epoch": 1.6, + "learning_rate": 5.9710611419144246e-05, + "loss": 0.0073, + "step": 317520 + }, + { + "epoch": 1.6, + "learning_rate": 5.970304372613023e-05, + "loss": 0.006, + "step": 317530 + }, + { + "epoch": 1.6, + "learning_rate": 5.9695476033116216e-05, + "loss": 0.0058, + "step": 317540 + }, + { + "epoch": 1.6, + "learning_rate": 5.9687908340102204e-05, + "loss": 0.0071, + "step": 317550 + }, + { + "epoch": 1.6, + "learning_rate": 5.96803406470882e-05, + "loss": 0.0058, + "step": 317560 + }, + { + "epoch": 1.6, + "learning_rate": 5.967277295407419e-05, + "loss": 0.0102, + "step": 317570 + }, + { + "epoch": 1.6, + "learning_rate": 5.9665205261060175e-05, + "loss": 0.0068, + "step": 317580 + }, + { + "epoch": 1.6, + "learning_rate": 5.9657637568046164e-05, + "loss": 0.007, + "step": 317590 + }, + { + "epoch": 1.6, + "learning_rate": 5.965006987503216e-05, + "loss": 0.0071, + "step": 317600 + }, + { + "epoch": 1.6, + "learning_rate": 5.964250218201815e-05, + "loss": 0.0059, + "step": 317610 + }, + { + "epoch": 1.6, + "learning_rate": 5.9634934489004135e-05, + "loss": 0.0073, + "step": 317620 + }, + { + "epoch": 1.6, + "learning_rate": 5.962736679599012e-05, + "loss": 0.0061, + "step": 317630 + }, + { + "epoch": 1.6, + "learning_rate": 5.961979910297612e-05, + "loss": 0.0059, + "step": 317640 + }, + { + "epoch": 1.6, + "learning_rate": 5.9612231409962106e-05, + "loss": 0.0068, + "step": 317650 + }, + { + "epoch": 1.6, + "learning_rate": 5.9604663716948095e-05, + "loss": 0.0069, + "step": 317660 + }, + { + "epoch": 1.6, + "learning_rate": 5.959709602393408e-05, + "loss": 0.0069, + "step": 317670 + }, + { + "epoch": 1.6, + "learning_rate": 5.958952833092008e-05, + "loss": 0.0069, + "step": 317680 + }, + { + "epoch": 1.6, + "learning_rate": 5.9581960637906066e-05, + "loss": 0.0072, + "step": 317690 + }, + { + "epoch": 1.6, + "learning_rate": 5.9574392944892054e-05, + "loss": 0.0059, + "step": 317700 + }, + { + "epoch": 1.6, + "learning_rate": 5.956682525187804e-05, + "loss": 0.0089, + "step": 317710 + }, + { + "epoch": 1.6, + "learning_rate": 5.955925755886404e-05, + "loss": 0.0069, + "step": 317720 + }, + { + "epoch": 1.6, + "learning_rate": 5.9551689865850026e-05, + "loss": 0.008, + "step": 317730 + }, + { + "epoch": 1.6, + "learning_rate": 5.9544122172836014e-05, + "loss": 0.0074, + "step": 317740 + }, + { + "epoch": 1.6, + "learning_rate": 5.9536554479822e-05, + "loss": 0.006, + "step": 317750 + }, + { + "epoch": 1.6, + "learning_rate": 5.9528986786808e-05, + "loss": 0.0089, + "step": 317760 + }, + { + "epoch": 1.6, + "learning_rate": 5.9521419093793985e-05, + "loss": 0.0076, + "step": 317770 + }, + { + "epoch": 1.6, + "learning_rate": 5.9513851400779974e-05, + "loss": 0.009, + "step": 317780 + }, + { + "epoch": 1.6, + "learning_rate": 5.950628370776596e-05, + "loss": 0.0052, + "step": 317790 + }, + { + "epoch": 1.6, + "learning_rate": 5.949871601475196e-05, + "loss": 0.0056, + "step": 317800 + }, + { + "epoch": 1.6, + "learning_rate": 5.9491148321737945e-05, + "loss": 0.007, + "step": 317810 + }, + { + "epoch": 1.6, + "learning_rate": 5.948358062872393e-05, + "loss": 0.0084, + "step": 317820 + }, + { + "epoch": 1.6, + "learning_rate": 5.947601293570992e-05, + "loss": 0.0083, + "step": 317830 + }, + { + "epoch": 1.6, + "learning_rate": 5.94684452426959e-05, + "loss": 0.0069, + "step": 317840 + }, + { + "epoch": 1.6, + "learning_rate": 5.94608775496819e-05, + "loss": 0.0071, + "step": 317850 + }, + { + "epoch": 1.6, + "learning_rate": 5.9453309856667886e-05, + "loss": 0.0088, + "step": 317860 + }, + { + "epoch": 1.6, + "learning_rate": 5.9445742163653874e-05, + "loss": 0.0059, + "step": 317870 + }, + { + "epoch": 1.6, + "learning_rate": 5.943817447063986e-05, + "loss": 0.005, + "step": 317880 + }, + { + "epoch": 1.6, + "learning_rate": 5.943060677762586e-05, + "loss": 0.0065, + "step": 317890 + }, + { + "epoch": 1.6, + "learning_rate": 5.9423039084611846e-05, + "loss": 0.0062, + "step": 317900 + }, + { + "epoch": 1.6, + "learning_rate": 5.9415471391597834e-05, + "loss": 0.0061, + "step": 317910 + }, + { + "epoch": 1.6, + "learning_rate": 5.940790369858382e-05, + "loss": 0.0065, + "step": 317920 + }, + { + "epoch": 1.6, + "learning_rate": 5.940033600556982e-05, + "loss": 0.0065, + "step": 317930 + }, + { + "epoch": 1.6, + "learning_rate": 5.9392768312555805e-05, + "loss": 0.0059, + "step": 317940 + }, + { + "epoch": 1.6, + "learning_rate": 5.9385200619541794e-05, + "loss": 0.0065, + "step": 317950 + }, + { + "epoch": 1.6, + "learning_rate": 5.937763292652778e-05, + "loss": 0.0058, + "step": 317960 + }, + { + "epoch": 1.6, + "learning_rate": 5.937006523351378e-05, + "loss": 0.0075, + "step": 317970 + }, + { + "epoch": 1.6, + "learning_rate": 5.9362497540499765e-05, + "loss": 0.0061, + "step": 317980 + }, + { + "epoch": 1.6, + "learning_rate": 5.935492984748575e-05, + "loss": 0.0076, + "step": 317990 + }, + { + "epoch": 1.6, + "learning_rate": 5.934736215447174e-05, + "loss": 0.0051, + "step": 318000 + }, + { + "epoch": 1.6, + "eval_cer": 0.9144285288697699, + "eval_loss": 0.005206539761275053, + "eval_runtime": 116.4709, + "eval_samples_per_second": 17.172, + "eval_steps_per_second": 4.293, + "step": 318000 + }, + { + "epoch": 1.6, + "learning_rate": 5.9339794461457737e-05, + "loss": 0.0057, + "step": 318010 + }, + { + "epoch": 1.6, + "learning_rate": 5.9332226768443725e-05, + "loss": 0.0096, + "step": 318020 + }, + { + "epoch": 1.6, + "learning_rate": 5.932465907542971e-05, + "loss": 0.0058, + "step": 318030 + }, + { + "epoch": 1.6, + "learning_rate": 5.931709138241571e-05, + "loss": 0.0061, + "step": 318040 + }, + { + "epoch": 1.6, + "learning_rate": 5.9309523689401696e-05, + "loss": 0.0083, + "step": 318050 + }, + { + "epoch": 1.6, + "learning_rate": 5.9301955996387684e-05, + "loss": 0.006, + "step": 318060 + }, + { + "epoch": 1.6, + "learning_rate": 5.929438830337367e-05, + "loss": 0.0071, + "step": 318070 + }, + { + "epoch": 1.6, + "learning_rate": 5.928682061035967e-05, + "loss": 0.0052, + "step": 318080 + }, + { + "epoch": 1.6, + "learning_rate": 5.9279252917345656e-05, + "loss": 0.0086, + "step": 318090 + }, + { + "epoch": 1.6, + "learning_rate": 5.9271685224331644e-05, + "loss": 0.0057, + "step": 318100 + }, + { + "epoch": 1.6, + "learning_rate": 5.926411753131763e-05, + "loss": 0.0086, + "step": 318110 + }, + { + "epoch": 1.6, + "learning_rate": 5.925654983830363e-05, + "loss": 0.0067, + "step": 318120 + }, + { + "epoch": 1.6, + "learning_rate": 5.9248982145289615e-05, + "loss": 0.0071, + "step": 318130 + }, + { + "epoch": 1.61, + "learning_rate": 5.9241414452275604e-05, + "loss": 0.0093, + "step": 318140 + }, + { + "epoch": 1.61, + "learning_rate": 5.9233846759261585e-05, + "loss": 0.0101, + "step": 318150 + }, + { + "epoch": 1.61, + "learning_rate": 5.922627906624757e-05, + "loss": 0.0071, + "step": 318160 + }, + { + "epoch": 1.61, + "learning_rate": 5.921871137323357e-05, + "loss": 0.0059, + "step": 318170 + }, + { + "epoch": 1.61, + "learning_rate": 5.9211143680219557e-05, + "loss": 0.0075, + "step": 318180 + }, + { + "epoch": 1.61, + "learning_rate": 5.9203575987205545e-05, + "loss": 0.0091, + "step": 318190 + }, + { + "epoch": 1.61, + "learning_rate": 5.919600829419153e-05, + "loss": 0.0086, + "step": 318200 + }, + { + "epoch": 1.61, + "learning_rate": 5.918844060117753e-05, + "loss": 0.0073, + "step": 318210 + }, + { + "epoch": 1.61, + "learning_rate": 5.9180872908163516e-05, + "loss": 0.0065, + "step": 318220 + }, + { + "epoch": 1.61, + "learning_rate": 5.9173305215149504e-05, + "loss": 0.0087, + "step": 318230 + }, + { + "epoch": 1.61, + "learning_rate": 5.916573752213549e-05, + "loss": 0.0068, + "step": 318240 + }, + { + "epoch": 1.61, + "learning_rate": 5.915816982912149e-05, + "loss": 0.0059, + "step": 318250 + }, + { + "epoch": 1.61, + "learning_rate": 5.9150602136107476e-05, + "loss": 0.0065, + "step": 318260 + }, + { + "epoch": 1.61, + "learning_rate": 5.9143034443093464e-05, + "loss": 0.0059, + "step": 318270 + }, + { + "epoch": 1.61, + "learning_rate": 5.913546675007945e-05, + "loss": 0.005, + "step": 318280 + }, + { + "epoch": 1.61, + "learning_rate": 5.912789905706545e-05, + "loss": 0.0077, + "step": 318290 + }, + { + "epoch": 1.61, + "learning_rate": 5.9120331364051436e-05, + "loss": 0.0081, + "step": 318300 + }, + { + "epoch": 1.61, + "learning_rate": 5.9112763671037424e-05, + "loss": 0.0063, + "step": 318310 + }, + { + "epoch": 1.61, + "learning_rate": 5.910519597802341e-05, + "loss": 0.006, + "step": 318320 + }, + { + "epoch": 1.61, + "learning_rate": 5.909762828500941e-05, + "loss": 0.0059, + "step": 318330 + }, + { + "epoch": 1.61, + "learning_rate": 5.9090060591995395e-05, + "loss": 0.0064, + "step": 318340 + }, + { + "epoch": 1.61, + "learning_rate": 5.908249289898138e-05, + "loss": 0.0062, + "step": 318350 + }, + { + "epoch": 1.61, + "learning_rate": 5.907492520596737e-05, + "loss": 0.0063, + "step": 318360 + }, + { + "epoch": 1.61, + "learning_rate": 5.9067357512953367e-05, + "loss": 0.0069, + "step": 318370 + }, + { + "epoch": 1.61, + "learning_rate": 5.9059789819939355e-05, + "loss": 0.0082, + "step": 318380 + }, + { + "epoch": 1.61, + "learning_rate": 5.905222212692534e-05, + "loss": 0.0062, + "step": 318390 + }, + { + "epoch": 1.61, + "learning_rate": 5.904465443391133e-05, + "loss": 0.0085, + "step": 318400 + }, + { + "epoch": 1.61, + "learning_rate": 5.9037086740897326e-05, + "loss": 0.0064, + "step": 318410 + }, + { + "epoch": 1.61, + "learning_rate": 5.9029519047883314e-05, + "loss": 0.0086, + "step": 318420 + }, + { + "epoch": 1.61, + "learning_rate": 5.90219513548693e-05, + "loss": 0.0088, + "step": 318430 + }, + { + "epoch": 1.61, + "learning_rate": 5.901438366185529e-05, + "loss": 0.008, + "step": 318440 + }, + { + "epoch": 1.61, + "learning_rate": 5.9006815968841286e-05, + "loss": 0.0071, + "step": 318450 + }, + { + "epoch": 1.61, + "learning_rate": 5.8999248275827274e-05, + "loss": 0.0057, + "step": 318460 + }, + { + "epoch": 1.61, + "learning_rate": 5.8991680582813256e-05, + "loss": 0.0068, + "step": 318470 + }, + { + "epoch": 1.61, + "learning_rate": 5.8984112889799244e-05, + "loss": 0.0056, + "step": 318480 + }, + { + "epoch": 1.61, + "learning_rate": 5.897654519678523e-05, + "loss": 0.0068, + "step": 318490 + }, + { + "epoch": 1.61, + "learning_rate": 5.896897750377123e-05, + "loss": 0.0065, + "step": 318500 + }, + { + "epoch": 1.61, + "learning_rate": 5.8961409810757215e-05, + "loss": 0.0062, + "step": 318510 + }, + { + "epoch": 1.61, + "learning_rate": 5.8953842117743203e-05, + "loss": 0.0077, + "step": 318520 + }, + { + "epoch": 1.61, + "learning_rate": 5.89462744247292e-05, + "loss": 0.0063, + "step": 318530 + }, + { + "epoch": 1.61, + "learning_rate": 5.893870673171519e-05, + "loss": 0.006, + "step": 318540 + }, + { + "epoch": 1.61, + "learning_rate": 5.8931139038701175e-05, + "loss": 0.0079, + "step": 318550 + }, + { + "epoch": 1.61, + "learning_rate": 5.892357134568716e-05, + "loss": 0.0075, + "step": 318560 + }, + { + "epoch": 1.61, + "learning_rate": 5.891600365267316e-05, + "loss": 0.008, + "step": 318570 + }, + { + "epoch": 1.61, + "learning_rate": 5.8908435959659146e-05, + "loss": 0.0098, + "step": 318580 + }, + { + "epoch": 1.61, + "learning_rate": 5.8900868266645135e-05, + "loss": 0.0068, + "step": 318590 + }, + { + "epoch": 1.61, + "learning_rate": 5.889330057363112e-05, + "loss": 0.0039, + "step": 318600 + }, + { + "epoch": 1.61, + "learning_rate": 5.888573288061712e-05, + "loss": 0.0062, + "step": 318610 + }, + { + "epoch": 1.61, + "learning_rate": 5.8878165187603106e-05, + "loss": 0.0086, + "step": 318620 + }, + { + "epoch": 1.61, + "learning_rate": 5.8870597494589094e-05, + "loss": 0.0049, + "step": 318630 + }, + { + "epoch": 1.61, + "learning_rate": 5.886302980157508e-05, + "loss": 0.0069, + "step": 318640 + }, + { + "epoch": 1.61, + "learning_rate": 5.885546210856108e-05, + "loss": 0.0065, + "step": 318650 + }, + { + "epoch": 1.61, + "learning_rate": 5.8847894415547066e-05, + "loss": 0.0085, + "step": 318660 + }, + { + "epoch": 1.61, + "learning_rate": 5.8840326722533054e-05, + "loss": 0.0062, + "step": 318670 + }, + { + "epoch": 1.61, + "learning_rate": 5.883275902951904e-05, + "loss": 0.0072, + "step": 318680 + }, + { + "epoch": 1.61, + "learning_rate": 5.882519133650504e-05, + "loss": 0.0058, + "step": 318690 + }, + { + "epoch": 1.61, + "learning_rate": 5.8817623643491025e-05, + "loss": 0.0081, + "step": 318700 + }, + { + "epoch": 1.61, + "learning_rate": 5.8810055950477013e-05, + "loss": 0.0069, + "step": 318710 + }, + { + "epoch": 1.61, + "learning_rate": 5.8802488257463e-05, + "loss": 0.0081, + "step": 318720 + }, + { + "epoch": 1.61, + "learning_rate": 5.8794920564449e-05, + "loss": 0.0075, + "step": 318730 + }, + { + "epoch": 1.61, + "learning_rate": 5.8787352871434985e-05, + "loss": 0.0055, + "step": 318740 + }, + { + "epoch": 1.61, + "learning_rate": 5.877978517842097e-05, + "loss": 0.0058, + "step": 318750 + }, + { + "epoch": 1.61, + "learning_rate": 5.877221748540696e-05, + "loss": 0.0067, + "step": 318760 + }, + { + "epoch": 1.61, + "learning_rate": 5.8764649792392956e-05, + "loss": 0.0051, + "step": 318770 + }, + { + "epoch": 1.61, + "learning_rate": 5.875708209937894e-05, + "loss": 0.0097, + "step": 318780 + }, + { + "epoch": 1.61, + "learning_rate": 5.8749514406364926e-05, + "loss": 0.0085, + "step": 318790 + }, + { + "epoch": 1.61, + "learning_rate": 5.8741946713350914e-05, + "loss": 0.0066, + "step": 318800 + }, + { + "epoch": 1.61, + "learning_rate": 5.87343790203369e-05, + "loss": 0.009, + "step": 318810 + }, + { + "epoch": 1.61, + "learning_rate": 5.87268113273229e-05, + "loss": 0.0054, + "step": 318820 + }, + { + "epoch": 1.61, + "learning_rate": 5.8719243634308886e-05, + "loss": 0.009, + "step": 318830 + }, + { + "epoch": 1.61, + "learning_rate": 5.8711675941294874e-05, + "loss": 0.0059, + "step": 318840 + }, + { + "epoch": 1.61, + "learning_rate": 5.870410824828086e-05, + "loss": 0.0086, + "step": 318850 + }, + { + "epoch": 1.61, + "learning_rate": 5.869654055526686e-05, + "loss": 0.0051, + "step": 318860 + }, + { + "epoch": 1.61, + "learning_rate": 5.8688972862252845e-05, + "loss": 0.0066, + "step": 318870 + }, + { + "epoch": 1.61, + "learning_rate": 5.8681405169238834e-05, + "loss": 0.0086, + "step": 318880 + }, + { + "epoch": 1.61, + "learning_rate": 5.867383747622482e-05, + "loss": 0.0096, + "step": 318890 + }, + { + "epoch": 1.61, + "learning_rate": 5.866626978321082e-05, + "loss": 0.0101, + "step": 318900 + }, + { + "epoch": 1.61, + "learning_rate": 5.8658702090196805e-05, + "loss": 0.0054, + "step": 318910 + }, + { + "epoch": 1.61, + "learning_rate": 5.865113439718279e-05, + "loss": 0.004, + "step": 318920 + }, + { + "epoch": 1.61, + "learning_rate": 5.864356670416878e-05, + "loss": 0.0062, + "step": 318930 + }, + { + "epoch": 1.61, + "learning_rate": 5.8635999011154776e-05, + "loss": 0.0064, + "step": 318940 + }, + { + "epoch": 1.61, + "learning_rate": 5.8628431318140765e-05, + "loss": 0.0063, + "step": 318950 + }, + { + "epoch": 1.61, + "learning_rate": 5.862086362512675e-05, + "loss": 0.0061, + "step": 318960 + }, + { + "epoch": 1.61, + "learning_rate": 5.861329593211274e-05, + "loss": 0.0076, + "step": 318970 + }, + { + "epoch": 1.61, + "learning_rate": 5.8605728239098736e-05, + "loss": 0.0083, + "step": 318980 + }, + { + "epoch": 1.61, + "learning_rate": 5.8598160546084724e-05, + "loss": 0.0108, + "step": 318990 + }, + { + "epoch": 1.61, + "learning_rate": 5.859059285307071e-05, + "loss": 0.0057, + "step": 319000 + }, + { + "epoch": 1.61, + "eval_cer": 0.9144294992658953, + "eval_loss": 0.00516105629503727, + "eval_runtime": 116.3084, + "eval_samples_per_second": 17.196, + "eval_steps_per_second": 4.299, + "step": 319000 + }, + { + "epoch": 1.61, + "learning_rate": 5.858302516005671e-05, + "loss": 0.0061, + "step": 319010 + }, + { + "epoch": 1.61, + "learning_rate": 5.8575457467042696e-05, + "loss": 0.0062, + "step": 319020 + }, + { + "epoch": 1.61, + "learning_rate": 5.8567889774028684e-05, + "loss": 0.0084, + "step": 319030 + }, + { + "epoch": 1.61, + "learning_rate": 5.856032208101467e-05, + "loss": 0.0066, + "step": 319040 + }, + { + "epoch": 1.61, + "learning_rate": 5.855275438800067e-05, + "loss": 0.0077, + "step": 319050 + }, + { + "epoch": 1.61, + "learning_rate": 5.8545186694986655e-05, + "loss": 0.0092, + "step": 319060 + }, + { + "epoch": 1.61, + "learning_rate": 5.8537619001972644e-05, + "loss": 0.0067, + "step": 319070 + }, + { + "epoch": 1.61, + "learning_rate": 5.853005130895863e-05, + "loss": 0.0057, + "step": 319080 + }, + { + "epoch": 1.61, + "learning_rate": 5.852248361594463e-05, + "loss": 0.0092, + "step": 319090 + }, + { + "epoch": 1.61, + "learning_rate": 5.851491592293061e-05, + "loss": 0.0064, + "step": 319100 + }, + { + "epoch": 1.61, + "learning_rate": 5.8507348229916596e-05, + "loss": 0.0076, + "step": 319110 + }, + { + "epoch": 1.61, + "learning_rate": 5.8499780536902585e-05, + "loss": 0.0085, + "step": 319120 + }, + { + "epoch": 1.61, + "learning_rate": 5.849221284388857e-05, + "loss": 0.0044, + "step": 319130 + }, + { + "epoch": 1.61, + "learning_rate": 5.848464515087457e-05, + "loss": 0.008, + "step": 319140 + }, + { + "epoch": 1.61, + "learning_rate": 5.8477077457860556e-05, + "loss": 0.0072, + "step": 319150 + }, + { + "epoch": 1.61, + "learning_rate": 5.8469509764846544e-05, + "loss": 0.0083, + "step": 319160 + }, + { + "epoch": 1.61, + "learning_rate": 5.846194207183253e-05, + "loss": 0.0095, + "step": 319170 + }, + { + "epoch": 1.61, + "learning_rate": 5.845437437881853e-05, + "loss": 0.0075, + "step": 319180 + }, + { + "epoch": 1.61, + "learning_rate": 5.8446806685804516e-05, + "loss": 0.007, + "step": 319190 + }, + { + "epoch": 1.61, + "learning_rate": 5.8439238992790504e-05, + "loss": 0.0062, + "step": 319200 + }, + { + "epoch": 1.61, + "learning_rate": 5.843167129977649e-05, + "loss": 0.0054, + "step": 319210 + }, + { + "epoch": 1.61, + "learning_rate": 5.842410360676249e-05, + "loss": 0.0069, + "step": 319220 + }, + { + "epoch": 1.61, + "learning_rate": 5.8416535913748475e-05, + "loss": 0.0071, + "step": 319230 + }, + { + "epoch": 1.61, + "learning_rate": 5.8408968220734464e-05, + "loss": 0.0068, + "step": 319240 + }, + { + "epoch": 1.61, + "learning_rate": 5.840140052772045e-05, + "loss": 0.0089, + "step": 319250 + }, + { + "epoch": 1.61, + "learning_rate": 5.839383283470645e-05, + "loss": 0.0065, + "step": 319260 + }, + { + "epoch": 1.61, + "learning_rate": 5.8386265141692435e-05, + "loss": 0.0081, + "step": 319270 + }, + { + "epoch": 1.61, + "learning_rate": 5.837869744867842e-05, + "loss": 0.0071, + "step": 319280 + }, + { + "epoch": 1.61, + "learning_rate": 5.837112975566441e-05, + "loss": 0.011, + "step": 319290 + }, + { + "epoch": 1.61, + "learning_rate": 5.8363562062650406e-05, + "loss": 0.0049, + "step": 319300 + }, + { + "epoch": 1.61, + "learning_rate": 5.8355994369636395e-05, + "loss": 0.0064, + "step": 319310 + }, + { + "epoch": 1.61, + "learning_rate": 5.834842667662238e-05, + "loss": 0.0052, + "step": 319320 + }, + { + "epoch": 1.61, + "learning_rate": 5.834085898360837e-05, + "loss": 0.0066, + "step": 319330 + }, + { + "epoch": 1.61, + "learning_rate": 5.8333291290594366e-05, + "loss": 0.0067, + "step": 319340 + }, + { + "epoch": 1.61, + "learning_rate": 5.8325723597580354e-05, + "loss": 0.009, + "step": 319350 + }, + { + "epoch": 1.61, + "learning_rate": 5.831815590456634e-05, + "loss": 0.0066, + "step": 319360 + }, + { + "epoch": 1.61, + "learning_rate": 5.831058821155233e-05, + "loss": 0.0077, + "step": 319370 + }, + { + "epoch": 1.61, + "learning_rate": 5.8303020518538326e-05, + "loss": 0.0061, + "step": 319380 + }, + { + "epoch": 1.61, + "learning_rate": 5.8295452825524314e-05, + "loss": 0.0071, + "step": 319390 + }, + { + "epoch": 1.61, + "learning_rate": 5.82878851325103e-05, + "loss": 0.0054, + "step": 319400 + }, + { + "epoch": 1.61, + "learning_rate": 5.8280317439496284e-05, + "loss": 0.0068, + "step": 319410 + }, + { + "epoch": 1.61, + "learning_rate": 5.827274974648227e-05, + "loss": 0.0091, + "step": 319420 + }, + { + "epoch": 1.61, + "learning_rate": 5.826518205346827e-05, + "loss": 0.0054, + "step": 319430 + }, + { + "epoch": 1.61, + "learning_rate": 5.8257614360454255e-05, + "loss": 0.0053, + "step": 319440 + }, + { + "epoch": 1.61, + "learning_rate": 5.825004666744024e-05, + "loss": 0.0069, + "step": 319450 + }, + { + "epoch": 1.61, + "learning_rate": 5.824247897442623e-05, + "loss": 0.0067, + "step": 319460 + }, + { + "epoch": 1.61, + "learning_rate": 5.8234911281412227e-05, + "loss": 0.0081, + "step": 319470 + }, + { + "epoch": 1.61, + "learning_rate": 5.8227343588398215e-05, + "loss": 0.0082, + "step": 319480 + }, + { + "epoch": 1.61, + "learning_rate": 5.82197758953842e-05, + "loss": 0.0065, + "step": 319490 + }, + { + "epoch": 1.61, + "learning_rate": 5.82122082023702e-05, + "loss": 0.0079, + "step": 319500 + }, + { + "epoch": 1.61, + "learning_rate": 5.8204640509356186e-05, + "loss": 0.0068, + "step": 319510 + }, + { + "epoch": 1.61, + "learning_rate": 5.8197072816342174e-05, + "loss": 0.0086, + "step": 319520 + }, + { + "epoch": 1.61, + "learning_rate": 5.818950512332816e-05, + "loss": 0.0051, + "step": 319530 + }, + { + "epoch": 1.61, + "learning_rate": 5.818193743031416e-05, + "loss": 0.0059, + "step": 319540 + }, + { + "epoch": 1.61, + "learning_rate": 5.8174369737300146e-05, + "loss": 0.0054, + "step": 319550 + }, + { + "epoch": 1.61, + "learning_rate": 5.8166802044286134e-05, + "loss": 0.0054, + "step": 319560 + }, + { + "epoch": 1.61, + "learning_rate": 5.815923435127212e-05, + "loss": 0.0069, + "step": 319570 + }, + { + "epoch": 1.61, + "learning_rate": 5.815166665825812e-05, + "loss": 0.0065, + "step": 319580 + }, + { + "epoch": 1.61, + "learning_rate": 5.8144098965244105e-05, + "loss": 0.0051, + "step": 319590 + }, + { + "epoch": 1.61, + "learning_rate": 5.8136531272230094e-05, + "loss": 0.0063, + "step": 319600 + }, + { + "epoch": 1.61, + "learning_rate": 5.812896357921608e-05, + "loss": 0.006, + "step": 319610 + }, + { + "epoch": 1.61, + "learning_rate": 5.812139588620208e-05, + "loss": 0.0071, + "step": 319620 + }, + { + "epoch": 1.61, + "learning_rate": 5.8113828193188065e-05, + "loss": 0.0074, + "step": 319630 + }, + { + "epoch": 1.61, + "learning_rate": 5.810626050017405e-05, + "loss": 0.006, + "step": 319640 + }, + { + "epoch": 1.61, + "learning_rate": 5.809869280716004e-05, + "loss": 0.0062, + "step": 319650 + }, + { + "epoch": 1.61, + "learning_rate": 5.8091125114146037e-05, + "loss": 0.0068, + "step": 319660 + }, + { + "epoch": 1.61, + "learning_rate": 5.8083557421132025e-05, + "loss": 0.0065, + "step": 319670 + }, + { + "epoch": 1.61, + "learning_rate": 5.807598972811801e-05, + "loss": 0.0054, + "step": 319680 + }, + { + "epoch": 1.61, + "learning_rate": 5.8068422035104e-05, + "loss": 0.0051, + "step": 319690 + }, + { + "epoch": 1.61, + "learning_rate": 5.8060854342089996e-05, + "loss": 0.0055, + "step": 319700 + }, + { + "epoch": 1.61, + "learning_rate": 5.8053286649075984e-05, + "loss": 0.0077, + "step": 319710 + }, + { + "epoch": 1.61, + "learning_rate": 5.804571895606197e-05, + "loss": 0.0066, + "step": 319720 + }, + { + "epoch": 1.61, + "learning_rate": 5.8038151263047954e-05, + "loss": 0.0051, + "step": 319730 + }, + { + "epoch": 1.61, + "learning_rate": 5.803058357003394e-05, + "loss": 0.0069, + "step": 319740 + }, + { + "epoch": 1.61, + "learning_rate": 5.802301587701994e-05, + "loss": 0.0064, + "step": 319750 + }, + { + "epoch": 1.61, + "learning_rate": 5.8015448184005926e-05, + "loss": 0.0076, + "step": 319760 + }, + { + "epoch": 1.61, + "learning_rate": 5.8007880490991914e-05, + "loss": 0.0087, + "step": 319770 + }, + { + "epoch": 1.61, + "learning_rate": 5.80003127979779e-05, + "loss": 0.0068, + "step": 319780 + }, + { + "epoch": 1.61, + "learning_rate": 5.79927451049639e-05, + "loss": 0.0076, + "step": 319790 + }, + { + "epoch": 1.61, + "learning_rate": 5.7985177411949885e-05, + "loss": 0.0065, + "step": 319800 + }, + { + "epoch": 1.61, + "learning_rate": 5.7977609718935873e-05, + "loss": 0.0077, + "step": 319810 + }, + { + "epoch": 1.61, + "learning_rate": 5.797004202592186e-05, + "loss": 0.0048, + "step": 319820 + }, + { + "epoch": 1.61, + "learning_rate": 5.7962474332907857e-05, + "loss": 0.0057, + "step": 319830 + }, + { + "epoch": 1.61, + "learning_rate": 5.7954906639893845e-05, + "loss": 0.0054, + "step": 319840 + }, + { + "epoch": 1.61, + "learning_rate": 5.794733894687983e-05, + "loss": 0.0062, + "step": 319850 + }, + { + "epoch": 1.61, + "learning_rate": 5.793977125386582e-05, + "loss": 0.0056, + "step": 319860 + }, + { + "epoch": 1.61, + "learning_rate": 5.7932203560851816e-05, + "loss": 0.0083, + "step": 319870 + }, + { + "epoch": 1.61, + "learning_rate": 5.7924635867837804e-05, + "loss": 0.0064, + "step": 319880 + }, + { + "epoch": 1.61, + "learning_rate": 5.791706817482379e-05, + "loss": 0.0063, + "step": 319890 + }, + { + "epoch": 1.61, + "learning_rate": 5.790950048180978e-05, + "loss": 0.0069, + "step": 319900 + }, + { + "epoch": 1.61, + "learning_rate": 5.7901932788795776e-05, + "loss": 0.008, + "step": 319910 + }, + { + "epoch": 1.61, + "learning_rate": 5.7894365095781764e-05, + "loss": 0.0068, + "step": 319920 + }, + { + "epoch": 1.61, + "learning_rate": 5.788679740276775e-05, + "loss": 0.0064, + "step": 319930 + }, + { + "epoch": 1.61, + "learning_rate": 5.787922970975374e-05, + "loss": 0.0066, + "step": 319940 + }, + { + "epoch": 1.61, + "learning_rate": 5.7871662016739736e-05, + "loss": 0.007, + "step": 319950 + }, + { + "epoch": 1.61, + "learning_rate": 5.7864094323725724e-05, + "loss": 0.0054, + "step": 319960 + }, + { + "epoch": 1.61, + "learning_rate": 5.785652663071171e-05, + "loss": 0.0068, + "step": 319970 + }, + { + "epoch": 1.61, + "learning_rate": 5.784895893769771e-05, + "loss": 0.0068, + "step": 319980 + }, + { + "epoch": 1.61, + "learning_rate": 5.7841391244683695e-05, + "loss": 0.0073, + "step": 319990 + }, + { + "epoch": 1.61, + "learning_rate": 5.7833823551669683e-05, + "loss": 0.0058, + "step": 320000 + }, + { + "epoch": 1.61, + "eval_cer": 0.9144392032271493, + "eval_loss": 0.005123169161379337, + "eval_runtime": 116.2037, + "eval_samples_per_second": 17.211, + "eval_steps_per_second": 4.303, + "step": 320000 + }, + { + "epoch": 1.61, + "learning_rate": 5.782625585865567e-05, + "loss": 0.0062, + "step": 320010 + }, + { + "epoch": 1.61, + "learning_rate": 5.781868816564167e-05, + "loss": 0.0058, + "step": 320020 + }, + { + "epoch": 1.61, + "learning_rate": 5.7811120472627655e-05, + "loss": 0.0101, + "step": 320030 + }, + { + "epoch": 1.61, + "learning_rate": 5.7803552779613636e-05, + "loss": 0.0063, + "step": 320040 + }, + { + "epoch": 1.61, + "learning_rate": 5.7795985086599625e-05, + "loss": 0.007, + "step": 320050 + }, + { + "epoch": 1.61, + "learning_rate": 5.778841739358561e-05, + "loss": 0.0061, + "step": 320060 + }, + { + "epoch": 1.61, + "learning_rate": 5.778084970057161e-05, + "loss": 0.0097, + "step": 320070 + }, + { + "epoch": 1.61, + "learning_rate": 5.7773282007557596e-05, + "loss": 0.0067, + "step": 320080 + }, + { + "epoch": 1.61, + "learning_rate": 5.7765714314543584e-05, + "loss": 0.0064, + "step": 320090 + }, + { + "epoch": 1.61, + "learning_rate": 5.775814662152957e-05, + "loss": 0.0095, + "step": 320100 + }, + { + "epoch": 1.61, + "learning_rate": 5.775057892851557e-05, + "loss": 0.0074, + "step": 320110 + }, + { + "epoch": 1.62, + "learning_rate": 5.7743011235501556e-05, + "loss": 0.0069, + "step": 320120 + }, + { + "epoch": 1.62, + "learning_rate": 5.7735443542487544e-05, + "loss": 0.0064, + "step": 320130 + }, + { + "epoch": 1.62, + "learning_rate": 5.772787584947353e-05, + "loss": 0.0096, + "step": 320140 + }, + { + "epoch": 1.62, + "learning_rate": 5.772030815645953e-05, + "loss": 0.0079, + "step": 320150 + }, + { + "epoch": 1.62, + "learning_rate": 5.7712740463445515e-05, + "loss": 0.0063, + "step": 320160 + }, + { + "epoch": 1.62, + "learning_rate": 5.7705172770431503e-05, + "loss": 0.0073, + "step": 320170 + }, + { + "epoch": 1.62, + "learning_rate": 5.769760507741749e-05, + "loss": 0.0079, + "step": 320180 + }, + { + "epoch": 1.62, + "learning_rate": 5.769003738440349e-05, + "loss": 0.0073, + "step": 320190 + }, + { + "epoch": 1.62, + "learning_rate": 5.7682469691389475e-05, + "loss": 0.0075, + "step": 320200 + }, + { + "epoch": 1.62, + "learning_rate": 5.767490199837546e-05, + "loss": 0.0073, + "step": 320210 + }, + { + "epoch": 1.62, + "learning_rate": 5.766733430536145e-05, + "loss": 0.008, + "step": 320220 + }, + { + "epoch": 1.62, + "learning_rate": 5.7659766612347446e-05, + "loss": 0.0054, + "step": 320230 + }, + { + "epoch": 1.62, + "learning_rate": 5.7652198919333435e-05, + "loss": 0.0061, + "step": 320240 + }, + { + "epoch": 1.62, + "learning_rate": 5.764463122631942e-05, + "loss": 0.0054, + "step": 320250 + }, + { + "epoch": 1.62, + "learning_rate": 5.763706353330541e-05, + "loss": 0.0067, + "step": 320260 + }, + { + "epoch": 1.62, + "learning_rate": 5.7629495840291406e-05, + "loss": 0.0111, + "step": 320270 + }, + { + "epoch": 1.62, + "learning_rate": 5.7621928147277394e-05, + "loss": 0.0069, + "step": 320280 + }, + { + "epoch": 1.62, + "learning_rate": 5.761436045426338e-05, + "loss": 0.0095, + "step": 320290 + }, + { + "epoch": 1.62, + "learning_rate": 5.760679276124937e-05, + "loss": 0.0072, + "step": 320300 + }, + { + "epoch": 1.62, + "learning_rate": 5.7599225068235366e-05, + "loss": 0.0067, + "step": 320310 + }, + { + "epoch": 1.62, + "learning_rate": 5.7591657375221354e-05, + "loss": 0.0068, + "step": 320320 + }, + { + "epoch": 1.62, + "learning_rate": 5.758408968220734e-05, + "loss": 0.0074, + "step": 320330 + }, + { + "epoch": 1.62, + "learning_rate": 5.757652198919333e-05, + "loss": 0.0091, + "step": 320340 + }, + { + "epoch": 1.62, + "learning_rate": 5.756895429617931e-05, + "loss": 0.0069, + "step": 320350 + }, + { + "epoch": 1.62, + "learning_rate": 5.756138660316531e-05, + "loss": 0.0071, + "step": 320360 + }, + { + "epoch": 1.62, + "learning_rate": 5.7553818910151295e-05, + "loss": 0.0051, + "step": 320370 + }, + { + "epoch": 1.62, + "learning_rate": 5.754625121713728e-05, + "loss": 0.0111, + "step": 320380 + }, + { + "epoch": 1.62, + "learning_rate": 5.753868352412327e-05, + "loss": 0.0073, + "step": 320390 + }, + { + "epoch": 1.62, + "learning_rate": 5.7531115831109266e-05, + "loss": 0.0086, + "step": 320400 + }, + { + "epoch": 1.62, + "learning_rate": 5.7523548138095255e-05, + "loss": 0.0071, + "step": 320410 + }, + { + "epoch": 1.62, + "learning_rate": 5.751598044508124e-05, + "loss": 0.0068, + "step": 320420 + }, + { + "epoch": 1.62, + "learning_rate": 5.750841275206723e-05, + "loss": 0.0078, + "step": 320430 + }, + { + "epoch": 1.62, + "learning_rate": 5.7500845059053226e-05, + "loss": 0.0063, + "step": 320440 + }, + { + "epoch": 1.62, + "learning_rate": 5.7493277366039214e-05, + "loss": 0.0086, + "step": 320450 + }, + { + "epoch": 1.62, + "learning_rate": 5.74857096730252e-05, + "loss": 0.0121, + "step": 320460 + }, + { + "epoch": 1.62, + "learning_rate": 5.74781419800112e-05, + "loss": 0.006, + "step": 320470 + }, + { + "epoch": 1.62, + "learning_rate": 5.7470574286997186e-05, + "loss": 0.0058, + "step": 320480 + }, + { + "epoch": 1.62, + "learning_rate": 5.7463006593983174e-05, + "loss": 0.0068, + "step": 320490 + }, + { + "epoch": 1.62, + "learning_rate": 5.745543890096916e-05, + "loss": 0.0085, + "step": 320500 + }, + { + "epoch": 1.62, + "learning_rate": 5.744787120795516e-05, + "loss": 0.0091, + "step": 320510 + }, + { + "epoch": 1.62, + "learning_rate": 5.7440303514941145e-05, + "loss": 0.0061, + "step": 320520 + }, + { + "epoch": 1.62, + "learning_rate": 5.7432735821927134e-05, + "loss": 0.0053, + "step": 320530 + }, + { + "epoch": 1.62, + "learning_rate": 5.742516812891312e-05, + "loss": 0.0058, + "step": 320540 + }, + { + "epoch": 1.62, + "learning_rate": 5.741760043589912e-05, + "loss": 0.0077, + "step": 320550 + }, + { + "epoch": 1.62, + "learning_rate": 5.7410032742885105e-05, + "loss": 0.0059, + "step": 320560 + }, + { + "epoch": 1.62, + "learning_rate": 5.740246504987109e-05, + "loss": 0.0064, + "step": 320570 + }, + { + "epoch": 1.62, + "learning_rate": 5.739489735685708e-05, + "loss": 0.0097, + "step": 320580 + }, + { + "epoch": 1.62, + "learning_rate": 5.7387329663843076e-05, + "loss": 0.0064, + "step": 320590 + }, + { + "epoch": 1.62, + "learning_rate": 5.7379761970829065e-05, + "loss": 0.0062, + "step": 320600 + }, + { + "epoch": 1.62, + "learning_rate": 5.737219427781505e-05, + "loss": 0.0073, + "step": 320610 + }, + { + "epoch": 1.62, + "learning_rate": 5.736462658480104e-05, + "loss": 0.0063, + "step": 320620 + }, + { + "epoch": 1.62, + "learning_rate": 5.7357058891787036e-05, + "loss": 0.0048, + "step": 320630 + }, + { + "epoch": 1.62, + "learning_rate": 5.7349491198773024e-05, + "loss": 0.0083, + "step": 320640 + }, + { + "epoch": 1.62, + "learning_rate": 5.734192350575901e-05, + "loss": 0.0062, + "step": 320650 + }, + { + "epoch": 1.62, + "learning_rate": 5.7334355812745e-05, + "loss": 0.0056, + "step": 320660 + }, + { + "epoch": 1.62, + "learning_rate": 5.732678811973098e-05, + "loss": 0.0065, + "step": 320670 + }, + { + "epoch": 1.62, + "learning_rate": 5.731922042671698e-05, + "loss": 0.0081, + "step": 320680 + }, + { + "epoch": 1.62, + "learning_rate": 5.7311652733702965e-05, + "loss": 0.0077, + "step": 320690 + }, + { + "epoch": 1.62, + "learning_rate": 5.7304085040688954e-05, + "loss": 0.0084, + "step": 320700 + }, + { + "epoch": 1.62, + "learning_rate": 5.729651734767494e-05, + "loss": 0.0056, + "step": 320710 + }, + { + "epoch": 1.62, + "learning_rate": 5.728894965466094e-05, + "loss": 0.0057, + "step": 320720 + }, + { + "epoch": 1.62, + "learning_rate": 5.7281381961646925e-05, + "loss": 0.0055, + "step": 320730 + }, + { + "epoch": 1.62, + "learning_rate": 5.727381426863291e-05, + "loss": 0.0072, + "step": 320740 + }, + { + "epoch": 1.62, + "learning_rate": 5.72662465756189e-05, + "loss": 0.0093, + "step": 320750 + }, + { + "epoch": 1.62, + "learning_rate": 5.7258678882604896e-05, + "loss": 0.0072, + "step": 320760 + }, + { + "epoch": 1.62, + "learning_rate": 5.7251111189590885e-05, + "loss": 0.0069, + "step": 320770 + }, + { + "epoch": 1.62, + "learning_rate": 5.724354349657687e-05, + "loss": 0.0053, + "step": 320780 + }, + { + "epoch": 1.62, + "learning_rate": 5.723597580356286e-05, + "loss": 0.005, + "step": 320790 + }, + { + "epoch": 1.62, + "learning_rate": 5.7228408110548856e-05, + "loss": 0.0065, + "step": 320800 + }, + { + "epoch": 1.62, + "learning_rate": 5.7220840417534844e-05, + "loss": 0.0106, + "step": 320810 + }, + { + "epoch": 1.62, + "learning_rate": 5.721327272452083e-05, + "loss": 0.0052, + "step": 320820 + }, + { + "epoch": 1.62, + "learning_rate": 5.720570503150682e-05, + "loss": 0.0081, + "step": 320830 + }, + { + "epoch": 1.62, + "learning_rate": 5.7198137338492816e-05, + "loss": 0.0075, + "step": 320840 + }, + { + "epoch": 1.62, + "learning_rate": 5.7190569645478804e-05, + "loss": 0.0066, + "step": 320850 + }, + { + "epoch": 1.62, + "learning_rate": 5.718300195246479e-05, + "loss": 0.0069, + "step": 320860 + }, + { + "epoch": 1.62, + "learning_rate": 5.717543425945078e-05, + "loss": 0.0069, + "step": 320870 + }, + { + "epoch": 1.62, + "learning_rate": 5.7167866566436775e-05, + "loss": 0.0077, + "step": 320880 + }, + { + "epoch": 1.62, + "learning_rate": 5.7160298873422764e-05, + "loss": 0.0083, + "step": 320890 + }, + { + "epoch": 1.62, + "learning_rate": 5.715273118040875e-05, + "loss": 0.0066, + "step": 320900 + }, + { + "epoch": 1.62, + "learning_rate": 5.714516348739474e-05, + "loss": 0.0062, + "step": 320910 + }, + { + "epoch": 1.62, + "learning_rate": 5.7137595794380735e-05, + "loss": 0.0055, + "step": 320920 + }, + { + "epoch": 1.62, + "learning_rate": 5.713002810136672e-05, + "loss": 0.0054, + "step": 320930 + }, + { + "epoch": 1.62, + "learning_rate": 5.712246040835271e-05, + "loss": 0.0047, + "step": 320940 + }, + { + "epoch": 1.62, + "learning_rate": 5.7114892715338707e-05, + "loss": 0.0066, + "step": 320950 + }, + { + "epoch": 1.62, + "learning_rate": 5.7107325022324695e-05, + "loss": 0.0055, + "step": 320960 + }, + { + "epoch": 1.62, + "learning_rate": 5.709975732931068e-05, + "loss": 0.0076, + "step": 320970 + }, + { + "epoch": 1.62, + "learning_rate": 5.7092189636296664e-05, + "loss": 0.006, + "step": 320980 + }, + { + "epoch": 1.62, + "learning_rate": 5.708462194328265e-05, + "loss": 0.0064, + "step": 320990 + }, + { + "epoch": 1.62, + "learning_rate": 5.707705425026865e-05, + "loss": 0.0058, + "step": 321000 + }, + { + "epoch": 1.62, + "eval_cer": 0.9144275584736445, + "eval_loss": 0.005066942423582077, + "eval_runtime": 116.3307, + "eval_samples_per_second": 17.192, + "eval_steps_per_second": 4.298, + "step": 321000 + }, + { + "epoch": 1.62, + "learning_rate": 5.7069486557254636e-05, + "loss": 0.0067, + "step": 321010 + }, + { + "epoch": 1.62, + "learning_rate": 5.7061918864240624e-05, + "loss": 0.0066, + "step": 321020 + }, + { + "epoch": 1.62, + "learning_rate": 5.705435117122661e-05, + "loss": 0.0074, + "step": 321030 + }, + { + "epoch": 1.62, + "learning_rate": 5.704678347821261e-05, + "loss": 0.0073, + "step": 321040 + }, + { + "epoch": 1.62, + "learning_rate": 5.7039215785198595e-05, + "loss": 0.006, + "step": 321050 + }, + { + "epoch": 1.62, + "learning_rate": 5.7031648092184584e-05, + "loss": 0.0063, + "step": 321060 + }, + { + "epoch": 1.62, + "learning_rate": 5.702408039917057e-05, + "loss": 0.0073, + "step": 321070 + }, + { + "epoch": 1.62, + "learning_rate": 5.701651270615657e-05, + "loss": 0.0084, + "step": 321080 + }, + { + "epoch": 1.62, + "learning_rate": 5.7008945013142555e-05, + "loss": 0.0063, + "step": 321090 + }, + { + "epoch": 1.62, + "learning_rate": 5.700137732012854e-05, + "loss": 0.0073, + "step": 321100 + }, + { + "epoch": 1.62, + "learning_rate": 5.699380962711453e-05, + "loss": 0.0075, + "step": 321110 + }, + { + "epoch": 1.62, + "learning_rate": 5.6986241934100527e-05, + "loss": 0.0048, + "step": 321120 + }, + { + "epoch": 1.62, + "learning_rate": 5.6978674241086515e-05, + "loss": 0.0081, + "step": 321130 + }, + { + "epoch": 1.62, + "learning_rate": 5.69711065480725e-05, + "loss": 0.0051, + "step": 321140 + }, + { + "epoch": 1.62, + "learning_rate": 5.696353885505849e-05, + "loss": 0.0049, + "step": 321150 + }, + { + "epoch": 1.62, + "learning_rate": 5.6955971162044486e-05, + "loss": 0.0075, + "step": 321160 + }, + { + "epoch": 1.62, + "learning_rate": 5.6948403469030474e-05, + "loss": 0.0055, + "step": 321170 + }, + { + "epoch": 1.62, + "learning_rate": 5.694083577601646e-05, + "loss": 0.006, + "step": 321180 + }, + { + "epoch": 1.62, + "learning_rate": 5.693326808300245e-05, + "loss": 0.0059, + "step": 321190 + }, + { + "epoch": 1.62, + "learning_rate": 5.6925700389988446e-05, + "loss": 0.0061, + "step": 321200 + }, + { + "epoch": 1.62, + "learning_rate": 5.6918132696974434e-05, + "loss": 0.0073, + "step": 321210 + }, + { + "epoch": 1.62, + "learning_rate": 5.691056500396042e-05, + "loss": 0.0091, + "step": 321220 + }, + { + "epoch": 1.62, + "learning_rate": 5.690299731094641e-05, + "loss": 0.0055, + "step": 321230 + }, + { + "epoch": 1.62, + "learning_rate": 5.6895429617932406e-05, + "loss": 0.0092, + "step": 321240 + }, + { + "epoch": 1.62, + "learning_rate": 5.6887861924918394e-05, + "loss": 0.0049, + "step": 321250 + }, + { + "epoch": 1.62, + "learning_rate": 5.688029423190438e-05, + "loss": 0.0062, + "step": 321260 + }, + { + "epoch": 1.62, + "learning_rate": 5.687272653889037e-05, + "loss": 0.008, + "step": 321270 + }, + { + "epoch": 1.62, + "learning_rate": 5.6865158845876365e-05, + "loss": 0.0071, + "step": 321280 + }, + { + "epoch": 1.62, + "learning_rate": 5.685759115286235e-05, + "loss": 0.0074, + "step": 321290 + }, + { + "epoch": 1.62, + "learning_rate": 5.6850023459848335e-05, + "loss": 0.0072, + "step": 321300 + }, + { + "epoch": 1.62, + "learning_rate": 5.684245576683432e-05, + "loss": 0.0055, + "step": 321310 + }, + { + "epoch": 1.62, + "learning_rate": 5.683488807382031e-05, + "loss": 0.0065, + "step": 321320 + }, + { + "epoch": 1.62, + "learning_rate": 5.6827320380806306e-05, + "loss": 0.0072, + "step": 321330 + }, + { + "epoch": 1.62, + "learning_rate": 5.6819752687792294e-05, + "loss": 0.0072, + "step": 321340 + }, + { + "epoch": 1.62, + "learning_rate": 5.681218499477828e-05, + "loss": 0.007, + "step": 321350 + }, + { + "epoch": 1.62, + "learning_rate": 5.680461730176427e-05, + "loss": 0.005, + "step": 321360 + }, + { + "epoch": 1.62, + "learning_rate": 5.6797049608750266e-05, + "loss": 0.0076, + "step": 321370 + }, + { + "epoch": 1.62, + "learning_rate": 5.6789481915736254e-05, + "loss": 0.0077, + "step": 321380 + }, + { + "epoch": 1.62, + "learning_rate": 5.678191422272224e-05, + "loss": 0.0076, + "step": 321390 + }, + { + "epoch": 1.62, + "learning_rate": 5.677434652970823e-05, + "loss": 0.0068, + "step": 321400 + }, + { + "epoch": 1.62, + "learning_rate": 5.6766778836694226e-05, + "loss": 0.0083, + "step": 321410 + }, + { + "epoch": 1.62, + "learning_rate": 5.6759211143680214e-05, + "loss": 0.0073, + "step": 321420 + }, + { + "epoch": 1.62, + "learning_rate": 5.67516434506662e-05, + "loss": 0.007, + "step": 321430 + }, + { + "epoch": 1.62, + "learning_rate": 5.67440757576522e-05, + "loss": 0.0064, + "step": 321440 + }, + { + "epoch": 1.62, + "learning_rate": 5.6736508064638185e-05, + "loss": 0.0048, + "step": 321450 + }, + { + "epoch": 1.62, + "learning_rate": 5.6728940371624173e-05, + "loss": 0.0069, + "step": 321460 + }, + { + "epoch": 1.62, + "learning_rate": 5.672137267861016e-05, + "loss": 0.0057, + "step": 321470 + }, + { + "epoch": 1.62, + "learning_rate": 5.671380498559616e-05, + "loss": 0.0065, + "step": 321480 + }, + { + "epoch": 1.62, + "learning_rate": 5.6706237292582145e-05, + "loss": 0.0063, + "step": 321490 + }, + { + "epoch": 1.62, + "learning_rate": 5.669866959956813e-05, + "loss": 0.007, + "step": 321500 + }, + { + "epoch": 1.62, + "learning_rate": 5.669110190655412e-05, + "loss": 0.0067, + "step": 321510 + }, + { + "epoch": 1.62, + "learning_rate": 5.6683534213540116e-05, + "loss": 0.0053, + "step": 321520 + }, + { + "epoch": 1.62, + "learning_rate": 5.6675966520526105e-05, + "loss": 0.0071, + "step": 321530 + }, + { + "epoch": 1.62, + "learning_rate": 5.666839882751209e-05, + "loss": 0.0053, + "step": 321540 + }, + { + "epoch": 1.62, + "learning_rate": 5.666083113449808e-05, + "loss": 0.0065, + "step": 321550 + }, + { + "epoch": 1.62, + "learning_rate": 5.6653263441484076e-05, + "loss": 0.0089, + "step": 321560 + }, + { + "epoch": 1.62, + "learning_rate": 5.6645695748470064e-05, + "loss": 0.0059, + "step": 321570 + }, + { + "epoch": 1.62, + "learning_rate": 5.663812805545605e-05, + "loss": 0.0062, + "step": 321580 + }, + { + "epoch": 1.62, + "learning_rate": 5.663056036244204e-05, + "loss": 0.008, + "step": 321590 + }, + { + "epoch": 1.62, + "learning_rate": 5.6622992669428036e-05, + "loss": 0.0064, + "step": 321600 + }, + { + "epoch": 1.62, + "learning_rate": 5.661542497641402e-05, + "loss": 0.0064, + "step": 321610 + }, + { + "epoch": 1.62, + "learning_rate": 5.6607857283400005e-05, + "loss": 0.0061, + "step": 321620 + }, + { + "epoch": 1.62, + "learning_rate": 5.6600289590385993e-05, + "loss": 0.0108, + "step": 321630 + }, + { + "epoch": 1.62, + "learning_rate": 5.659272189737198e-05, + "loss": 0.0069, + "step": 321640 + }, + { + "epoch": 1.62, + "learning_rate": 5.658515420435798e-05, + "loss": 0.0081, + "step": 321650 + }, + { + "epoch": 1.62, + "learning_rate": 5.6577586511343965e-05, + "loss": 0.0051, + "step": 321660 + }, + { + "epoch": 1.62, + "learning_rate": 5.657001881832995e-05, + "loss": 0.0055, + "step": 321670 + }, + { + "epoch": 1.62, + "learning_rate": 5.656245112531594e-05, + "loss": 0.0066, + "step": 321680 + }, + { + "epoch": 1.62, + "learning_rate": 5.6554883432301936e-05, + "loss": 0.007, + "step": 321690 + }, + { + "epoch": 1.62, + "learning_rate": 5.6547315739287925e-05, + "loss": 0.0076, + "step": 321700 + }, + { + "epoch": 1.62, + "learning_rate": 5.653974804627391e-05, + "loss": 0.0067, + "step": 321710 + }, + { + "epoch": 1.62, + "learning_rate": 5.65321803532599e-05, + "loss": 0.0083, + "step": 321720 + }, + { + "epoch": 1.62, + "learning_rate": 5.6524612660245896e-05, + "loss": 0.007, + "step": 321730 + }, + { + "epoch": 1.62, + "learning_rate": 5.6517044967231884e-05, + "loss": 0.0067, + "step": 321740 + }, + { + "epoch": 1.62, + "learning_rate": 5.650947727421787e-05, + "loss": 0.0053, + "step": 321750 + }, + { + "epoch": 1.62, + "learning_rate": 5.650190958120386e-05, + "loss": 0.0057, + "step": 321760 + }, + { + "epoch": 1.62, + "learning_rate": 5.6494341888189856e-05, + "loss": 0.0054, + "step": 321770 + }, + { + "epoch": 1.62, + "learning_rate": 5.6486774195175844e-05, + "loss": 0.0094, + "step": 321780 + }, + { + "epoch": 1.62, + "learning_rate": 5.647920650216183e-05, + "loss": 0.0074, + "step": 321790 + }, + { + "epoch": 1.62, + "learning_rate": 5.647163880914782e-05, + "loss": 0.0083, + "step": 321800 + }, + { + "epoch": 1.62, + "learning_rate": 5.6464071116133815e-05, + "loss": 0.0068, + "step": 321810 + }, + { + "epoch": 1.62, + "learning_rate": 5.6456503423119804e-05, + "loss": 0.0084, + "step": 321820 + }, + { + "epoch": 1.62, + "learning_rate": 5.644893573010579e-05, + "loss": 0.0065, + "step": 321830 + }, + { + "epoch": 1.62, + "learning_rate": 5.644136803709178e-05, + "loss": 0.0083, + "step": 321840 + }, + { + "epoch": 1.62, + "learning_rate": 5.6433800344077775e-05, + "loss": 0.0057, + "step": 321850 + }, + { + "epoch": 1.62, + "learning_rate": 5.642623265106376e-05, + "loss": 0.0073, + "step": 321860 + }, + { + "epoch": 1.62, + "learning_rate": 5.641866495804975e-05, + "loss": 0.0073, + "step": 321870 + }, + { + "epoch": 1.62, + "learning_rate": 5.641109726503574e-05, + "loss": 0.0058, + "step": 321880 + }, + { + "epoch": 1.62, + "learning_rate": 5.6403529572021735e-05, + "loss": 0.0077, + "step": 321890 + }, + { + "epoch": 1.62, + "learning_rate": 5.639596187900772e-05, + "loss": 0.0055, + "step": 321900 + }, + { + "epoch": 1.62, + "learning_rate": 5.638839418599371e-05, + "loss": 0.0082, + "step": 321910 + }, + { + "epoch": 1.62, + "learning_rate": 5.6380826492979706e-05, + "loss": 0.0059, + "step": 321920 + }, + { + "epoch": 1.62, + "learning_rate": 5.637325879996569e-05, + "loss": 0.008, + "step": 321930 + }, + { + "epoch": 1.62, + "learning_rate": 5.6365691106951676e-05, + "loss": 0.006, + "step": 321940 + }, + { + "epoch": 1.62, + "learning_rate": 5.6358123413937664e-05, + "loss": 0.006, + "step": 321950 + }, + { + "epoch": 1.62, + "learning_rate": 5.635055572092365e-05, + "loss": 0.0076, + "step": 321960 + }, + { + "epoch": 1.62, + "learning_rate": 5.634298802790965e-05, + "loss": 0.007, + "step": 321970 + }, + { + "epoch": 1.62, + "learning_rate": 5.6335420334895635e-05, + "loss": 0.0064, + "step": 321980 + }, + { + "epoch": 1.62, + "learning_rate": 5.6327852641881624e-05, + "loss": 0.0076, + "step": 321990 + }, + { + "epoch": 1.62, + "learning_rate": 5.632028494886761e-05, + "loss": 0.0095, + "step": 322000 + }, + { + "epoch": 1.62, + "eval_cer": 0.9144197953046413, + "eval_loss": 0.005024084821343422, + "eval_runtime": 116.2702, + "eval_samples_per_second": 17.201, + "eval_steps_per_second": 4.3, + "step": 322000 + }, + { + "epoch": 1.62, + "learning_rate": 5.631271725585361e-05, + "loss": 0.0047, + "step": 322010 + }, + { + "epoch": 1.62, + "learning_rate": 5.6305149562839595e-05, + "loss": 0.0077, + "step": 322020 + }, + { + "epoch": 1.62, + "learning_rate": 5.629758186982558e-05, + "loss": 0.0073, + "step": 322030 + }, + { + "epoch": 1.62, + "learning_rate": 5.629001417681157e-05, + "loss": 0.0077, + "step": 322040 + }, + { + "epoch": 1.62, + "learning_rate": 5.6282446483797566e-05, + "loss": 0.0058, + "step": 322050 + }, + { + "epoch": 1.62, + "learning_rate": 5.6274878790783555e-05, + "loss": 0.0077, + "step": 322060 + }, + { + "epoch": 1.62, + "learning_rate": 5.626731109776954e-05, + "loss": 0.0051, + "step": 322070 + }, + { + "epoch": 1.62, + "learning_rate": 5.625974340475553e-05, + "loss": 0.007, + "step": 322080 + }, + { + "epoch": 1.62, + "learning_rate": 5.6252175711741526e-05, + "loss": 0.0064, + "step": 322090 + }, + { + "epoch": 1.63, + "learning_rate": 5.6244608018727514e-05, + "loss": 0.0057, + "step": 322100 + }, + { + "epoch": 1.63, + "learning_rate": 5.62370403257135e-05, + "loss": 0.0074, + "step": 322110 + }, + { + "epoch": 1.63, + "learning_rate": 5.622947263269949e-05, + "loss": 0.0089, + "step": 322120 + }, + { + "epoch": 1.63, + "learning_rate": 5.6221904939685486e-05, + "loss": 0.0082, + "step": 322130 + }, + { + "epoch": 1.63, + "learning_rate": 5.6214337246671474e-05, + "loss": 0.0073, + "step": 322140 + }, + { + "epoch": 1.63, + "learning_rate": 5.620676955365746e-05, + "loss": 0.008, + "step": 322150 + }, + { + "epoch": 1.63, + "learning_rate": 5.619920186064345e-05, + "loss": 0.0058, + "step": 322160 + }, + { + "epoch": 1.63, + "learning_rate": 5.6191634167629445e-05, + "loss": 0.0068, + "step": 322170 + }, + { + "epoch": 1.63, + "learning_rate": 5.6184066474615434e-05, + "loss": 0.0082, + "step": 322180 + }, + { + "epoch": 1.63, + "learning_rate": 5.617649878160142e-05, + "loss": 0.0055, + "step": 322190 + }, + { + "epoch": 1.63, + "learning_rate": 5.616893108858741e-05, + "loss": 0.0061, + "step": 322200 + }, + { + "epoch": 1.63, + "learning_rate": 5.6161363395573405e-05, + "loss": 0.0058, + "step": 322210 + }, + { + "epoch": 1.63, + "learning_rate": 5.615379570255939e-05, + "loss": 0.0062, + "step": 322220 + }, + { + "epoch": 1.63, + "learning_rate": 5.614622800954538e-05, + "loss": 0.0057, + "step": 322230 + }, + { + "epoch": 1.63, + "learning_rate": 5.613866031653136e-05, + "loss": 0.007, + "step": 322240 + }, + { + "epoch": 1.63, + "learning_rate": 5.613109262351735e-05, + "loss": 0.0066, + "step": 322250 + }, + { + "epoch": 1.63, + "learning_rate": 5.6123524930503346e-05, + "loss": 0.0056, + "step": 322260 + }, + { + "epoch": 1.63, + "learning_rate": 5.6115957237489334e-05, + "loss": 0.0062, + "step": 322270 + }, + { + "epoch": 1.63, + "learning_rate": 5.610838954447532e-05, + "loss": 0.0075, + "step": 322280 + }, + { + "epoch": 1.63, + "learning_rate": 5.610082185146131e-05, + "loss": 0.0052, + "step": 322290 + }, + { + "epoch": 1.63, + "learning_rate": 5.6093254158447306e-05, + "loss": 0.005, + "step": 322300 + }, + { + "epoch": 1.63, + "learning_rate": 5.6085686465433294e-05, + "loss": 0.0066, + "step": 322310 + }, + { + "epoch": 1.63, + "learning_rate": 5.607811877241928e-05, + "loss": 0.0055, + "step": 322320 + }, + { + "epoch": 1.63, + "learning_rate": 5.607055107940527e-05, + "loss": 0.0098, + "step": 322330 + }, + { + "epoch": 1.63, + "learning_rate": 5.6062983386391265e-05, + "loss": 0.0065, + "step": 322340 + }, + { + "epoch": 1.63, + "learning_rate": 5.6055415693377254e-05, + "loss": 0.006, + "step": 322350 + }, + { + "epoch": 1.63, + "learning_rate": 5.604784800036324e-05, + "loss": 0.0069, + "step": 322360 + }, + { + "epoch": 1.63, + "learning_rate": 5.604028030734923e-05, + "loss": 0.0062, + "step": 322370 + }, + { + "epoch": 1.63, + "learning_rate": 5.6032712614335225e-05, + "loss": 0.0052, + "step": 322380 + }, + { + "epoch": 1.63, + "learning_rate": 5.602514492132121e-05, + "loss": 0.0063, + "step": 322390 + }, + { + "epoch": 1.63, + "learning_rate": 5.60175772283072e-05, + "loss": 0.0086, + "step": 322400 + }, + { + "epoch": 1.63, + "learning_rate": 5.6010009535293197e-05, + "loss": 0.0087, + "step": 322410 + }, + { + "epoch": 1.63, + "learning_rate": 5.6002441842279185e-05, + "loss": 0.0064, + "step": 322420 + }, + { + "epoch": 1.63, + "learning_rate": 5.599487414926517e-05, + "loss": 0.0066, + "step": 322430 + }, + { + "epoch": 1.63, + "learning_rate": 5.598730645625116e-05, + "loss": 0.0081, + "step": 322440 + }, + { + "epoch": 1.63, + "learning_rate": 5.5979738763237156e-05, + "loss": 0.0065, + "step": 322450 + }, + { + "epoch": 1.63, + "learning_rate": 5.5972171070223144e-05, + "loss": 0.0062, + "step": 322460 + }, + { + "epoch": 1.63, + "learning_rate": 5.596460337720913e-05, + "loss": 0.0076, + "step": 322470 + }, + { + "epoch": 1.63, + "learning_rate": 5.595703568419512e-05, + "loss": 0.0081, + "step": 322480 + }, + { + "epoch": 1.63, + "learning_rate": 5.5949467991181116e-05, + "loss": 0.0089, + "step": 322490 + }, + { + "epoch": 1.63, + "learning_rate": 5.5941900298167104e-05, + "loss": 0.0059, + "step": 322500 + }, + { + "epoch": 1.63, + "learning_rate": 5.593433260515309e-05, + "loss": 0.0063, + "step": 322510 + }, + { + "epoch": 1.63, + "learning_rate": 5.592676491213908e-05, + "loss": 0.0063, + "step": 322520 + }, + { + "epoch": 1.63, + "learning_rate": 5.5919197219125075e-05, + "loss": 0.0072, + "step": 322530 + }, + { + "epoch": 1.63, + "learning_rate": 5.5911629526111064e-05, + "loss": 0.007, + "step": 322540 + }, + { + "epoch": 1.63, + "learning_rate": 5.5904061833097045e-05, + "loss": 0.0074, + "step": 322550 + }, + { + "epoch": 1.63, + "learning_rate": 5.589649414008303e-05, + "loss": 0.0066, + "step": 322560 + }, + { + "epoch": 1.63, + "learning_rate": 5.588892644706902e-05, + "loss": 0.0079, + "step": 322570 + }, + { + "epoch": 1.63, + "learning_rate": 5.5881358754055017e-05, + "loss": 0.0072, + "step": 322580 + }, + { + "epoch": 1.63, + "learning_rate": 5.5873791061041005e-05, + "loss": 0.0077, + "step": 322590 + }, + { + "epoch": 1.63, + "learning_rate": 5.586622336802699e-05, + "loss": 0.0061, + "step": 322600 + }, + { + "epoch": 1.63, + "learning_rate": 5.585865567501298e-05, + "loss": 0.0073, + "step": 322610 + }, + { + "epoch": 1.63, + "learning_rate": 5.5851087981998976e-05, + "loss": 0.0057, + "step": 322620 + }, + { + "epoch": 1.63, + "learning_rate": 5.5843520288984964e-05, + "loss": 0.0065, + "step": 322630 + }, + { + "epoch": 1.63, + "learning_rate": 5.583595259597095e-05, + "loss": 0.0071, + "step": 322640 + }, + { + "epoch": 1.63, + "learning_rate": 5.582838490295694e-05, + "loss": 0.0054, + "step": 322650 + }, + { + "epoch": 1.63, + "learning_rate": 5.5820817209942936e-05, + "loss": 0.0065, + "step": 322660 + }, + { + "epoch": 1.63, + "learning_rate": 5.5813249516928924e-05, + "loss": 0.0087, + "step": 322670 + }, + { + "epoch": 1.63, + "learning_rate": 5.580568182391491e-05, + "loss": 0.0058, + "step": 322680 + }, + { + "epoch": 1.63, + "learning_rate": 5.57981141309009e-05, + "loss": 0.0066, + "step": 322690 + }, + { + "epoch": 1.63, + "learning_rate": 5.5790546437886896e-05, + "loss": 0.0063, + "step": 322700 + }, + { + "epoch": 1.63, + "learning_rate": 5.5782978744872884e-05, + "loss": 0.0073, + "step": 322710 + }, + { + "epoch": 1.63, + "learning_rate": 5.577541105185887e-05, + "loss": 0.0077, + "step": 322720 + }, + { + "epoch": 1.63, + "learning_rate": 5.576784335884486e-05, + "loss": 0.0062, + "step": 322730 + }, + { + "epoch": 1.63, + "learning_rate": 5.5760275665830855e-05, + "loss": 0.006, + "step": 322740 + }, + { + "epoch": 1.63, + "learning_rate": 5.5752707972816843e-05, + "loss": 0.0042, + "step": 322750 + }, + { + "epoch": 1.63, + "learning_rate": 5.574514027980283e-05, + "loss": 0.0058, + "step": 322760 + }, + { + "epoch": 1.63, + "learning_rate": 5.573757258678882e-05, + "loss": 0.0053, + "step": 322770 + }, + { + "epoch": 1.63, + "learning_rate": 5.5730004893774815e-05, + "loss": 0.0052, + "step": 322780 + }, + { + "epoch": 1.63, + "learning_rate": 5.57224372007608e-05, + "loss": 0.0082, + "step": 322790 + }, + { + "epoch": 1.63, + "learning_rate": 5.571486950774679e-05, + "loss": 0.0067, + "step": 322800 + }, + { + "epoch": 1.63, + "learning_rate": 5.570730181473278e-05, + "loss": 0.0055, + "step": 322810 + }, + { + "epoch": 1.63, + "learning_rate": 5.5699734121718774e-05, + "loss": 0.0075, + "step": 322820 + }, + { + "epoch": 1.63, + "learning_rate": 5.569216642870476e-05, + "loss": 0.0058, + "step": 322830 + }, + { + "epoch": 1.63, + "learning_rate": 5.568459873569075e-05, + "loss": 0.006, + "step": 322840 + }, + { + "epoch": 1.63, + "learning_rate": 5.567703104267674e-05, + "loss": 0.0076, + "step": 322850 + }, + { + "epoch": 1.63, + "learning_rate": 5.5669463349662734e-05, + "loss": 0.0065, + "step": 322860 + }, + { + "epoch": 1.63, + "learning_rate": 5.5661895656648716e-05, + "loss": 0.0074, + "step": 322870 + }, + { + "epoch": 1.63, + "learning_rate": 5.5654327963634704e-05, + "loss": 0.005, + "step": 322880 + }, + { + "epoch": 1.63, + "learning_rate": 5.564676027062069e-05, + "loss": 0.0075, + "step": 322890 + }, + { + "epoch": 1.63, + "learning_rate": 5.563919257760669e-05, + "loss": 0.0076, + "step": 322900 + }, + { + "epoch": 1.63, + "learning_rate": 5.5631624884592675e-05, + "loss": 0.0087, + "step": 322910 + }, + { + "epoch": 1.63, + "learning_rate": 5.5624057191578663e-05, + "loss": 0.0095, + "step": 322920 + }, + { + "epoch": 1.63, + "learning_rate": 5.561648949856465e-05, + "loss": 0.0069, + "step": 322930 + }, + { + "epoch": 1.63, + "learning_rate": 5.560892180555065e-05, + "loss": 0.0066, + "step": 322940 + }, + { + "epoch": 1.63, + "learning_rate": 5.5601354112536635e-05, + "loss": 0.0063, + "step": 322950 + }, + { + "epoch": 1.63, + "learning_rate": 5.559378641952262e-05, + "loss": 0.0069, + "step": 322960 + }, + { + "epoch": 1.63, + "learning_rate": 5.558621872650861e-05, + "loss": 0.0068, + "step": 322970 + }, + { + "epoch": 1.63, + "learning_rate": 5.5578651033494606e-05, + "loss": 0.0054, + "step": 322980 + }, + { + "epoch": 1.63, + "learning_rate": 5.5571083340480595e-05, + "loss": 0.0081, + "step": 322990 + }, + { + "epoch": 1.63, + "learning_rate": 5.556351564746658e-05, + "loss": 0.0101, + "step": 323000 + }, + { + "epoch": 1.63, + "eval_cer": 0.9144265880775191, + "eval_loss": 0.004934444557875395, + "eval_runtime": 116.3298, + "eval_samples_per_second": 17.192, + "eval_steps_per_second": 4.298, + "step": 323000 + }, + { + "epoch": 1.63, + "learning_rate": 5.555594795445257e-05, + "loss": 0.0076, + "step": 323010 + }, + { + "epoch": 1.63, + "learning_rate": 5.5548380261438566e-05, + "loss": 0.0071, + "step": 323020 + }, + { + "epoch": 1.63, + "learning_rate": 5.5540812568424554e-05, + "loss": 0.007, + "step": 323030 + }, + { + "epoch": 1.63, + "learning_rate": 5.553324487541054e-05, + "loss": 0.0069, + "step": 323040 + }, + { + "epoch": 1.63, + "learning_rate": 5.552567718239653e-05, + "loss": 0.0064, + "step": 323050 + }, + { + "epoch": 1.63, + "learning_rate": 5.5518109489382526e-05, + "loss": 0.0081, + "step": 323060 + }, + { + "epoch": 1.63, + "learning_rate": 5.5510541796368514e-05, + "loss": 0.0067, + "step": 323070 + }, + { + "epoch": 1.63, + "learning_rate": 5.55029741033545e-05, + "loss": 0.0052, + "step": 323080 + }, + { + "epoch": 1.63, + "learning_rate": 5.549540641034049e-05, + "loss": 0.0076, + "step": 323090 + }, + { + "epoch": 1.63, + "learning_rate": 5.5487838717326485e-05, + "loss": 0.0065, + "step": 323100 + }, + { + "epoch": 1.63, + "learning_rate": 5.5480271024312473e-05, + "loss": 0.0061, + "step": 323110 + }, + { + "epoch": 1.63, + "learning_rate": 5.547270333129846e-05, + "loss": 0.0058, + "step": 323120 + }, + { + "epoch": 1.63, + "learning_rate": 5.546513563828445e-05, + "loss": 0.0091, + "step": 323130 + }, + { + "epoch": 1.63, + "learning_rate": 5.5457567945270445e-05, + "loss": 0.0063, + "step": 323140 + }, + { + "epoch": 1.63, + "learning_rate": 5.545000025225643e-05, + "loss": 0.0047, + "step": 323150 + }, + { + "epoch": 1.63, + "learning_rate": 5.544243255924242e-05, + "loss": 0.0058, + "step": 323160 + }, + { + "epoch": 1.63, + "learning_rate": 5.543486486622841e-05, + "loss": 0.0081, + "step": 323170 + }, + { + "epoch": 1.63, + "learning_rate": 5.542729717321439e-05, + "loss": 0.0066, + "step": 323180 + }, + { + "epoch": 1.63, + "learning_rate": 5.5419729480200386e-05, + "loss": 0.0108, + "step": 323190 + }, + { + "epoch": 1.63, + "learning_rate": 5.5412161787186374e-05, + "loss": 0.0061, + "step": 323200 + }, + { + "epoch": 1.63, + "learning_rate": 5.540459409417236e-05, + "loss": 0.0065, + "step": 323210 + }, + { + "epoch": 1.63, + "learning_rate": 5.539702640115835e-05, + "loss": 0.0055, + "step": 323220 + }, + { + "epoch": 1.63, + "learning_rate": 5.5389458708144346e-05, + "loss": 0.0066, + "step": 323230 + }, + { + "epoch": 1.63, + "learning_rate": 5.5381891015130334e-05, + "loss": 0.0061, + "step": 323240 + }, + { + "epoch": 1.63, + "learning_rate": 5.537432332211632e-05, + "loss": 0.0073, + "step": 323250 + }, + { + "epoch": 1.63, + "learning_rate": 5.536675562910231e-05, + "loss": 0.0065, + "step": 323260 + }, + { + "epoch": 1.63, + "learning_rate": 5.5359187936088305e-05, + "loss": 0.0066, + "step": 323270 + }, + { + "epoch": 1.63, + "learning_rate": 5.5351620243074294e-05, + "loss": 0.0078, + "step": 323280 + }, + { + "epoch": 1.63, + "learning_rate": 5.534405255006028e-05, + "loss": 0.0071, + "step": 323290 + }, + { + "epoch": 1.63, + "learning_rate": 5.533648485704627e-05, + "loss": 0.0064, + "step": 323300 + }, + { + "epoch": 1.63, + "learning_rate": 5.5328917164032265e-05, + "loss": 0.0044, + "step": 323310 + }, + { + "epoch": 1.63, + "learning_rate": 5.532134947101825e-05, + "loss": 0.0085, + "step": 323320 + }, + { + "epoch": 1.63, + "learning_rate": 5.531378177800424e-05, + "loss": 0.0062, + "step": 323330 + }, + { + "epoch": 1.63, + "learning_rate": 5.530621408499023e-05, + "loss": 0.0063, + "step": 323340 + }, + { + "epoch": 1.63, + "learning_rate": 5.5298646391976225e-05, + "loss": 0.0052, + "step": 323350 + }, + { + "epoch": 1.63, + "learning_rate": 5.529107869896221e-05, + "loss": 0.0064, + "step": 323360 + }, + { + "epoch": 1.63, + "learning_rate": 5.52835110059482e-05, + "loss": 0.0067, + "step": 323370 + }, + { + "epoch": 1.63, + "learning_rate": 5.5275943312934196e-05, + "loss": 0.0062, + "step": 323380 + }, + { + "epoch": 1.63, + "learning_rate": 5.5268375619920184e-05, + "loss": 0.0066, + "step": 323390 + }, + { + "epoch": 1.63, + "learning_rate": 5.526080792690617e-05, + "loss": 0.0066, + "step": 323400 + }, + { + "epoch": 1.63, + "learning_rate": 5.525324023389216e-05, + "loss": 0.0072, + "step": 323410 + }, + { + "epoch": 1.63, + "learning_rate": 5.5245672540878156e-05, + "loss": 0.0057, + "step": 323420 + }, + { + "epoch": 1.63, + "learning_rate": 5.5238104847864144e-05, + "loss": 0.0056, + "step": 323430 + }, + { + "epoch": 1.63, + "learning_rate": 5.523053715485013e-05, + "loss": 0.0076, + "step": 323440 + }, + { + "epoch": 1.63, + "learning_rate": 5.522296946183612e-05, + "loss": 0.0077, + "step": 323450 + }, + { + "epoch": 1.63, + "learning_rate": 5.5215401768822115e-05, + "loss": 0.0054, + "step": 323460 + }, + { + "epoch": 1.63, + "learning_rate": 5.5207834075808104e-05, + "loss": 0.0079, + "step": 323470 + }, + { + "epoch": 1.63, + "learning_rate": 5.520026638279409e-05, + "loss": 0.0045, + "step": 323480 + }, + { + "epoch": 1.63, + "learning_rate": 5.519269868978008e-05, + "loss": 0.0053, + "step": 323490 + }, + { + "epoch": 1.63, + "learning_rate": 5.518513099676606e-05, + "loss": 0.0058, + "step": 323500 + }, + { + "epoch": 1.63, + "learning_rate": 5.5177563303752056e-05, + "loss": 0.0069, + "step": 323510 + }, + { + "epoch": 1.63, + "learning_rate": 5.5169995610738045e-05, + "loss": 0.0095, + "step": 323520 + }, + { + "epoch": 1.63, + "learning_rate": 5.516242791772403e-05, + "loss": 0.0064, + "step": 323530 + }, + { + "epoch": 1.63, + "learning_rate": 5.515486022471002e-05, + "loss": 0.0061, + "step": 323540 + }, + { + "epoch": 1.63, + "learning_rate": 5.5147292531696016e-05, + "loss": 0.0052, + "step": 323550 + }, + { + "epoch": 1.63, + "learning_rate": 5.5139724838682004e-05, + "loss": 0.0095, + "step": 323560 + }, + { + "epoch": 1.63, + "learning_rate": 5.513215714566799e-05, + "loss": 0.0071, + "step": 323570 + }, + { + "epoch": 1.63, + "learning_rate": 5.512458945265398e-05, + "loss": 0.0086, + "step": 323580 + }, + { + "epoch": 1.63, + "learning_rate": 5.5117021759639976e-05, + "loss": 0.007, + "step": 323590 + }, + { + "epoch": 1.63, + "learning_rate": 5.5109454066625964e-05, + "loss": 0.0049, + "step": 323600 + }, + { + "epoch": 1.63, + "learning_rate": 5.510188637361195e-05, + "loss": 0.0072, + "step": 323610 + }, + { + "epoch": 1.63, + "learning_rate": 5.509431868059794e-05, + "loss": 0.0065, + "step": 323620 + }, + { + "epoch": 1.63, + "learning_rate": 5.5086750987583935e-05, + "loss": 0.0077, + "step": 323630 + }, + { + "epoch": 1.63, + "learning_rate": 5.5079183294569924e-05, + "loss": 0.0056, + "step": 323640 + }, + { + "epoch": 1.63, + "learning_rate": 5.507161560155591e-05, + "loss": 0.0075, + "step": 323650 + }, + { + "epoch": 1.63, + "learning_rate": 5.50640479085419e-05, + "loss": 0.0072, + "step": 323660 + }, + { + "epoch": 1.63, + "learning_rate": 5.5056480215527895e-05, + "loss": 0.0085, + "step": 323670 + }, + { + "epoch": 1.63, + "learning_rate": 5.504891252251388e-05, + "loss": 0.0053, + "step": 323680 + }, + { + "epoch": 1.63, + "learning_rate": 5.504134482949987e-05, + "loss": 0.0074, + "step": 323690 + }, + { + "epoch": 1.63, + "learning_rate": 5.503377713648586e-05, + "loss": 0.0072, + "step": 323700 + }, + { + "epoch": 1.63, + "learning_rate": 5.5026209443471855e-05, + "loss": 0.0058, + "step": 323710 + }, + { + "epoch": 1.63, + "learning_rate": 5.501864175045784e-05, + "loss": 0.0072, + "step": 323720 + }, + { + "epoch": 1.63, + "learning_rate": 5.501107405744383e-05, + "loss": 0.0061, + "step": 323730 + }, + { + "epoch": 1.63, + "learning_rate": 5.500350636442982e-05, + "loss": 0.0036, + "step": 323740 + }, + { + "epoch": 1.63, + "learning_rate": 5.4995938671415814e-05, + "loss": 0.0065, + "step": 323750 + }, + { + "epoch": 1.63, + "learning_rate": 5.49883709784018e-05, + "loss": 0.0052, + "step": 323760 + }, + { + "epoch": 1.63, + "learning_rate": 5.498080328538779e-05, + "loss": 0.0075, + "step": 323770 + }, + { + "epoch": 1.63, + "learning_rate": 5.497323559237378e-05, + "loss": 0.0079, + "step": 323780 + }, + { + "epoch": 1.63, + "learning_rate": 5.4965667899359774e-05, + "loss": 0.0075, + "step": 323790 + }, + { + "epoch": 1.63, + "learning_rate": 5.495810020634576e-05, + "loss": 0.0076, + "step": 323800 + }, + { + "epoch": 1.63, + "learning_rate": 5.4950532513331744e-05, + "loss": 0.0067, + "step": 323810 + }, + { + "epoch": 1.63, + "learning_rate": 5.494296482031773e-05, + "loss": 0.0086, + "step": 323820 + }, + { + "epoch": 1.63, + "learning_rate": 5.493539712730373e-05, + "loss": 0.0076, + "step": 323830 + }, + { + "epoch": 1.63, + "learning_rate": 5.4927829434289715e-05, + "loss": 0.0071, + "step": 323840 + }, + { + "epoch": 1.63, + "learning_rate": 5.49202617412757e-05, + "loss": 0.0066, + "step": 323850 + }, + { + "epoch": 1.63, + "learning_rate": 5.491269404826169e-05, + "loss": 0.0059, + "step": 323860 + }, + { + "epoch": 1.63, + "learning_rate": 5.4905126355247687e-05, + "loss": 0.008, + "step": 323870 + }, + { + "epoch": 1.63, + "learning_rate": 5.4897558662233675e-05, + "loss": 0.0056, + "step": 323880 + }, + { + "epoch": 1.63, + "learning_rate": 5.488999096921966e-05, + "loss": 0.0103, + "step": 323890 + }, + { + "epoch": 1.63, + "learning_rate": 5.488242327620565e-05, + "loss": 0.0066, + "step": 323900 + }, + { + "epoch": 1.63, + "learning_rate": 5.4874855583191646e-05, + "loss": 0.0068, + "step": 323910 + }, + { + "epoch": 1.63, + "learning_rate": 5.4867287890177634e-05, + "loss": 0.0071, + "step": 323920 + }, + { + "epoch": 1.63, + "learning_rate": 5.485972019716362e-05, + "loss": 0.0086, + "step": 323930 + }, + { + "epoch": 1.63, + "learning_rate": 5.485215250414961e-05, + "loss": 0.0066, + "step": 323940 + }, + { + "epoch": 1.63, + "learning_rate": 5.4844584811135606e-05, + "loss": 0.0064, + "step": 323950 + }, + { + "epoch": 1.63, + "learning_rate": 5.4837017118121594e-05, + "loss": 0.0071, + "step": 323960 + }, + { + "epoch": 1.63, + "learning_rate": 5.482944942510758e-05, + "loss": 0.0073, + "step": 323970 + }, + { + "epoch": 1.63, + "learning_rate": 5.482188173209357e-05, + "loss": 0.0062, + "step": 323980 + }, + { + "epoch": 1.63, + "learning_rate": 5.4814314039079565e-05, + "loss": 0.0081, + "step": 323990 + }, + { + "epoch": 1.63, + "learning_rate": 5.4806746346065554e-05, + "loss": 0.0068, + "step": 324000 + }, + { + "epoch": 1.63, + "eval_cer": 0.9144275584736445, + "eval_loss": 0.0047448608092963696, + "eval_runtime": 116.3969, + "eval_samples_per_second": 17.183, + "eval_steps_per_second": 4.296, + "step": 324000 + }, + { + "epoch": 1.63, + "learning_rate": 5.479917865305154e-05, + "loss": 0.0069, + "step": 324010 + }, + { + "epoch": 1.63, + "learning_rate": 5.479161096003753e-05, + "loss": 0.0065, + "step": 324020 + }, + { + "epoch": 1.63, + "learning_rate": 5.4784043267023525e-05, + "loss": 0.0084, + "step": 324030 + }, + { + "epoch": 1.63, + "learning_rate": 5.477647557400951e-05, + "loss": 0.0074, + "step": 324040 + }, + { + "epoch": 1.63, + "learning_rate": 5.47689078809955e-05, + "loss": 0.0069, + "step": 324050 + }, + { + "epoch": 1.63, + "learning_rate": 5.476134018798149e-05, + "loss": 0.0065, + "step": 324060 + }, + { + "epoch": 1.63, + "learning_rate": 5.4753772494967485e-05, + "loss": 0.007, + "step": 324070 + }, + { + "epoch": 1.64, + "learning_rate": 5.474620480195347e-05, + "loss": 0.0067, + "step": 324080 + }, + { + "epoch": 1.64, + "learning_rate": 5.473863710893946e-05, + "loss": 0.0093, + "step": 324090 + }, + { + "epoch": 1.64, + "learning_rate": 5.473106941592545e-05, + "loss": 0.006, + "step": 324100 + }, + { + "epoch": 1.64, + "learning_rate": 5.4723501722911444e-05, + "loss": 0.0075, + "step": 324110 + }, + { + "epoch": 1.64, + "learning_rate": 5.4715934029897426e-05, + "loss": 0.0054, + "step": 324120 + }, + { + "epoch": 1.64, + "learning_rate": 5.4708366336883414e-05, + "loss": 0.0069, + "step": 324130 + }, + { + "epoch": 1.64, + "learning_rate": 5.47007986438694e-05, + "loss": 0.0072, + "step": 324140 + }, + { + "epoch": 1.64, + "learning_rate": 5.469323095085539e-05, + "loss": 0.0071, + "step": 324150 + }, + { + "epoch": 1.64, + "learning_rate": 5.4685663257841386e-05, + "loss": 0.0072, + "step": 324160 + }, + { + "epoch": 1.64, + "learning_rate": 5.4678095564827374e-05, + "loss": 0.0058, + "step": 324170 + }, + { + "epoch": 1.64, + "learning_rate": 5.467052787181336e-05, + "loss": 0.0061, + "step": 324180 + }, + { + "epoch": 1.64, + "learning_rate": 5.466296017879935e-05, + "loss": 0.0073, + "step": 324190 + }, + { + "epoch": 1.64, + "learning_rate": 5.4655392485785345e-05, + "loss": 0.0065, + "step": 324200 + }, + { + "epoch": 1.64, + "learning_rate": 5.4647824792771333e-05, + "loss": 0.0056, + "step": 324210 + }, + { + "epoch": 1.64, + "learning_rate": 5.464025709975732e-05, + "loss": 0.0056, + "step": 324220 + }, + { + "epoch": 1.64, + "learning_rate": 5.463268940674331e-05, + "loss": 0.0078, + "step": 324230 + }, + { + "epoch": 1.64, + "learning_rate": 5.4625121713729305e-05, + "loss": 0.0054, + "step": 324240 + }, + { + "epoch": 1.64, + "learning_rate": 5.461755402071529e-05, + "loss": 0.0061, + "step": 324250 + }, + { + "epoch": 1.64, + "learning_rate": 5.460998632770128e-05, + "loss": 0.0065, + "step": 324260 + }, + { + "epoch": 1.64, + "learning_rate": 5.460241863468727e-05, + "loss": 0.0062, + "step": 324270 + }, + { + "epoch": 1.64, + "learning_rate": 5.4594850941673264e-05, + "loss": 0.0072, + "step": 324280 + }, + { + "epoch": 1.64, + "learning_rate": 5.458728324865925e-05, + "loss": 0.0056, + "step": 324290 + }, + { + "epoch": 1.64, + "learning_rate": 5.457971555564524e-05, + "loss": 0.0071, + "step": 324300 + }, + { + "epoch": 1.64, + "learning_rate": 5.457214786263123e-05, + "loss": 0.0067, + "step": 324310 + }, + { + "epoch": 1.64, + "learning_rate": 5.4564580169617224e-05, + "loss": 0.0071, + "step": 324320 + }, + { + "epoch": 1.64, + "learning_rate": 5.455701247660321e-05, + "loss": 0.0051, + "step": 324330 + }, + { + "epoch": 1.64, + "learning_rate": 5.45494447835892e-05, + "loss": 0.0076, + "step": 324340 + }, + { + "epoch": 1.64, + "learning_rate": 5.4541877090575196e-05, + "loss": 0.0072, + "step": 324350 + }, + { + "epoch": 1.64, + "learning_rate": 5.4534309397561184e-05, + "loss": 0.0065, + "step": 324360 + }, + { + "epoch": 1.64, + "learning_rate": 5.452674170454717e-05, + "loss": 0.0089, + "step": 324370 + }, + { + "epoch": 1.64, + "learning_rate": 5.451917401153316e-05, + "loss": 0.0091, + "step": 324380 + }, + { + "epoch": 1.64, + "learning_rate": 5.4511606318519155e-05, + "loss": 0.0074, + "step": 324390 + }, + { + "epoch": 1.64, + "learning_rate": 5.4504038625505143e-05, + "loss": 0.0059, + "step": 324400 + }, + { + "epoch": 1.64, + "learning_rate": 5.449647093249113e-05, + "loss": 0.0057, + "step": 324410 + }, + { + "epoch": 1.64, + "learning_rate": 5.448890323947712e-05, + "loss": 0.0063, + "step": 324420 + }, + { + "epoch": 1.64, + "learning_rate": 5.4481335546463115e-05, + "loss": 0.0082, + "step": 324430 + }, + { + "epoch": 1.64, + "learning_rate": 5.4473767853449096e-05, + "loss": 0.0085, + "step": 324440 + }, + { + "epoch": 1.64, + "learning_rate": 5.4466200160435085e-05, + "loss": 0.0056, + "step": 324450 + }, + { + "epoch": 1.64, + "learning_rate": 5.445863246742107e-05, + "loss": 0.0079, + "step": 324460 + }, + { + "epoch": 1.64, + "learning_rate": 5.445106477440706e-05, + "loss": 0.0075, + "step": 324470 + }, + { + "epoch": 1.64, + "learning_rate": 5.4443497081393056e-05, + "loss": 0.0063, + "step": 324480 + }, + { + "epoch": 1.64, + "learning_rate": 5.4435929388379044e-05, + "loss": 0.0066, + "step": 324490 + }, + { + "epoch": 1.64, + "learning_rate": 5.442836169536503e-05, + "loss": 0.0084, + "step": 324500 + }, + { + "epoch": 1.64, + "learning_rate": 5.442079400235102e-05, + "loss": 0.0064, + "step": 324510 + }, + { + "epoch": 1.64, + "learning_rate": 5.4413226309337016e-05, + "loss": 0.0057, + "step": 324520 + }, + { + "epoch": 1.64, + "learning_rate": 5.4405658616323004e-05, + "loss": 0.0065, + "step": 324530 + }, + { + "epoch": 1.64, + "learning_rate": 5.439809092330899e-05, + "loss": 0.0057, + "step": 324540 + }, + { + "epoch": 1.64, + "learning_rate": 5.439052323029498e-05, + "loss": 0.0064, + "step": 324550 + }, + { + "epoch": 1.64, + "learning_rate": 5.4382955537280975e-05, + "loss": 0.0064, + "step": 324560 + }, + { + "epoch": 1.64, + "learning_rate": 5.4375387844266963e-05, + "loss": 0.0058, + "step": 324570 + }, + { + "epoch": 1.64, + "learning_rate": 5.436782015125295e-05, + "loss": 0.0059, + "step": 324580 + }, + { + "epoch": 1.64, + "learning_rate": 5.436025245823894e-05, + "loss": 0.0095, + "step": 324590 + }, + { + "epoch": 1.64, + "learning_rate": 5.4352684765224935e-05, + "loss": 0.0076, + "step": 324600 + }, + { + "epoch": 1.64, + "learning_rate": 5.434511707221092e-05, + "loss": 0.0049, + "step": 324610 + }, + { + "epoch": 1.64, + "learning_rate": 5.433754937919691e-05, + "loss": 0.01, + "step": 324620 + }, + { + "epoch": 1.64, + "learning_rate": 5.43299816861829e-05, + "loss": 0.0053, + "step": 324630 + }, + { + "epoch": 1.64, + "learning_rate": 5.4322413993168895e-05, + "loss": 0.0069, + "step": 324640 + }, + { + "epoch": 1.64, + "learning_rate": 5.431484630015488e-05, + "loss": 0.0045, + "step": 324650 + }, + { + "epoch": 1.64, + "learning_rate": 5.430727860714087e-05, + "loss": 0.0069, + "step": 324660 + }, + { + "epoch": 1.64, + "learning_rate": 5.429971091412686e-05, + "loss": 0.006, + "step": 324670 + }, + { + "epoch": 1.64, + "learning_rate": 5.4292143221112854e-05, + "loss": 0.0091, + "step": 324680 + }, + { + "epoch": 1.64, + "learning_rate": 5.428457552809884e-05, + "loss": 0.0076, + "step": 324690 + }, + { + "epoch": 1.64, + "learning_rate": 5.427700783508483e-05, + "loss": 0.0126, + "step": 324700 + }, + { + "epoch": 1.64, + "learning_rate": 5.426944014207082e-05, + "loss": 0.0071, + "step": 324710 + }, + { + "epoch": 1.64, + "learning_rate": 5.4261872449056814e-05, + "loss": 0.0073, + "step": 324720 + }, + { + "epoch": 1.64, + "learning_rate": 5.42543047560428e-05, + "loss": 0.0106, + "step": 324730 + }, + { + "epoch": 1.64, + "learning_rate": 5.424673706302879e-05, + "loss": 0.0081, + "step": 324740 + }, + { + "epoch": 1.64, + "learning_rate": 5.423916937001477e-05, + "loss": 0.0068, + "step": 324750 + }, + { + "epoch": 1.64, + "learning_rate": 5.423160167700076e-05, + "loss": 0.0057, + "step": 324760 + }, + { + "epoch": 1.64, + "learning_rate": 5.4224033983986755e-05, + "loss": 0.0072, + "step": 324770 + }, + { + "epoch": 1.64, + "learning_rate": 5.421646629097274e-05, + "loss": 0.007, + "step": 324780 + }, + { + "epoch": 1.64, + "learning_rate": 5.420889859795873e-05, + "loss": 0.0055, + "step": 324790 + }, + { + "epoch": 1.64, + "learning_rate": 5.4201330904944726e-05, + "loss": 0.005, + "step": 324800 + }, + { + "epoch": 1.64, + "learning_rate": 5.4193763211930715e-05, + "loss": 0.0055, + "step": 324810 + }, + { + "epoch": 1.64, + "learning_rate": 5.41861955189167e-05, + "loss": 0.0084, + "step": 324820 + }, + { + "epoch": 1.64, + "learning_rate": 5.417862782590269e-05, + "loss": 0.0056, + "step": 324830 + }, + { + "epoch": 1.64, + "learning_rate": 5.4171060132888686e-05, + "loss": 0.0082, + "step": 324840 + }, + { + "epoch": 1.64, + "learning_rate": 5.4163492439874674e-05, + "loss": 0.0076, + "step": 324850 + }, + { + "epoch": 1.64, + "learning_rate": 5.415592474686066e-05, + "loss": 0.0077, + "step": 324860 + }, + { + "epoch": 1.64, + "learning_rate": 5.414835705384665e-05, + "loss": 0.0074, + "step": 324870 + }, + { + "epoch": 1.64, + "learning_rate": 5.4140789360832646e-05, + "loss": 0.0086, + "step": 324880 + }, + { + "epoch": 1.64, + "learning_rate": 5.4133221667818634e-05, + "loss": 0.0054, + "step": 324890 + }, + { + "epoch": 1.64, + "learning_rate": 5.412565397480462e-05, + "loss": 0.0055, + "step": 324900 + }, + { + "epoch": 1.64, + "learning_rate": 5.411808628179061e-05, + "loss": 0.0066, + "step": 324910 + }, + { + "epoch": 1.64, + "learning_rate": 5.4110518588776605e-05, + "loss": 0.0067, + "step": 324920 + }, + { + "epoch": 1.64, + "learning_rate": 5.4102950895762594e-05, + "loss": 0.0068, + "step": 324930 + }, + { + "epoch": 1.64, + "learning_rate": 5.409538320274858e-05, + "loss": 0.0059, + "step": 324940 + }, + { + "epoch": 1.64, + "learning_rate": 5.408781550973457e-05, + "loss": 0.0069, + "step": 324950 + }, + { + "epoch": 1.64, + "learning_rate": 5.4080247816720565e-05, + "loss": 0.0056, + "step": 324960 + }, + { + "epoch": 1.64, + "learning_rate": 5.407268012370655e-05, + "loss": 0.008, + "step": 324970 + }, + { + "epoch": 1.64, + "learning_rate": 5.406511243069254e-05, + "loss": 0.0053, + "step": 324980 + }, + { + "epoch": 1.64, + "learning_rate": 5.405754473767853e-05, + "loss": 0.0056, + "step": 324990 + }, + { + "epoch": 1.64, + "learning_rate": 5.4049977044664525e-05, + "loss": 0.0063, + "step": 325000 + }, + { + "epoch": 1.64, + "eval_cer": 0.9144333808503969, + "eval_loss": 0.005062679760158062, + "eval_runtime": 116.3486, + "eval_samples_per_second": 17.19, + "eval_steps_per_second": 4.297, + "step": 325000 + }, + { + "epoch": 1.64, + "learning_rate": 5.404240935165051e-05, + "loss": 0.007, + "step": 325010 + }, + { + "epoch": 1.64, + "learning_rate": 5.40348416586365e-05, + "loss": 0.0077, + "step": 325020 + }, + { + "epoch": 1.64, + "learning_rate": 5.402727396562249e-05, + "loss": 0.0079, + "step": 325030 + }, + { + "epoch": 1.64, + "learning_rate": 5.4019706272608484e-05, + "loss": 0.0076, + "step": 325040 + }, + { + "epoch": 1.64, + "learning_rate": 5.401213857959447e-05, + "loss": 0.006, + "step": 325050 + }, + { + "epoch": 1.64, + "learning_rate": 5.400457088658046e-05, + "loss": 0.0066, + "step": 325060 + }, + { + "epoch": 1.64, + "learning_rate": 5.399700319356644e-05, + "loss": 0.0053, + "step": 325070 + }, + { + "epoch": 1.64, + "learning_rate": 5.398943550055243e-05, + "loss": 0.007, + "step": 325080 + }, + { + "epoch": 1.64, + "learning_rate": 5.3981867807538425e-05, + "loss": 0.0064, + "step": 325090 + }, + { + "epoch": 1.64, + "learning_rate": 5.3974300114524414e-05, + "loss": 0.0067, + "step": 325100 + }, + { + "epoch": 1.64, + "learning_rate": 5.39667324215104e-05, + "loss": 0.0075, + "step": 325110 + }, + { + "epoch": 1.64, + "learning_rate": 5.395916472849639e-05, + "loss": 0.0091, + "step": 325120 + }, + { + "epoch": 1.64, + "learning_rate": 5.3951597035482385e-05, + "loss": 0.0125, + "step": 325130 + }, + { + "epoch": 1.64, + "learning_rate": 5.394402934246837e-05, + "loss": 0.0075, + "step": 325140 + }, + { + "epoch": 1.64, + "learning_rate": 5.393646164945436e-05, + "loss": 0.006, + "step": 325150 + }, + { + "epoch": 1.64, + "learning_rate": 5.392889395644035e-05, + "loss": 0.0045, + "step": 325160 + }, + { + "epoch": 1.64, + "learning_rate": 5.3921326263426345e-05, + "loss": 0.0059, + "step": 325170 + }, + { + "epoch": 1.64, + "learning_rate": 5.391375857041233e-05, + "loss": 0.0058, + "step": 325180 + }, + { + "epoch": 1.64, + "learning_rate": 5.390619087739832e-05, + "loss": 0.0107, + "step": 325190 + }, + { + "epoch": 1.64, + "learning_rate": 5.389862318438431e-05, + "loss": 0.0068, + "step": 325200 + }, + { + "epoch": 1.64, + "learning_rate": 5.3891055491370304e-05, + "loss": 0.0062, + "step": 325210 + }, + { + "epoch": 1.64, + "learning_rate": 5.388348779835629e-05, + "loss": 0.0075, + "step": 325220 + }, + { + "epoch": 1.64, + "learning_rate": 5.387592010534228e-05, + "loss": 0.005, + "step": 325230 + }, + { + "epoch": 1.64, + "learning_rate": 5.386835241232827e-05, + "loss": 0.0049, + "step": 325240 + }, + { + "epoch": 1.64, + "learning_rate": 5.3860784719314264e-05, + "loss": 0.0078, + "step": 325250 + }, + { + "epoch": 1.64, + "learning_rate": 5.385321702630025e-05, + "loss": 0.0071, + "step": 325260 + }, + { + "epoch": 1.64, + "learning_rate": 5.384564933328624e-05, + "loss": 0.0063, + "step": 325270 + }, + { + "epoch": 1.64, + "learning_rate": 5.383808164027223e-05, + "loss": 0.0062, + "step": 325280 + }, + { + "epoch": 1.64, + "learning_rate": 5.3830513947258224e-05, + "loss": 0.0057, + "step": 325290 + }, + { + "epoch": 1.64, + "learning_rate": 5.382294625424421e-05, + "loss": 0.0052, + "step": 325300 + }, + { + "epoch": 1.64, + "learning_rate": 5.38153785612302e-05, + "loss": 0.0066, + "step": 325310 + }, + { + "epoch": 1.64, + "learning_rate": 5.3807810868216195e-05, + "loss": 0.0076, + "step": 325320 + }, + { + "epoch": 1.64, + "learning_rate": 5.380024317520218e-05, + "loss": 0.0061, + "step": 325330 + }, + { + "epoch": 1.64, + "learning_rate": 5.379267548218817e-05, + "loss": 0.0056, + "step": 325340 + }, + { + "epoch": 1.64, + "learning_rate": 5.378510778917416e-05, + "loss": 0.0062, + "step": 325350 + }, + { + "epoch": 1.64, + "learning_rate": 5.3777540096160155e-05, + "loss": 0.0065, + "step": 325360 + }, + { + "epoch": 1.64, + "learning_rate": 5.376997240314614e-05, + "loss": 0.0066, + "step": 325370 + }, + { + "epoch": 1.64, + "learning_rate": 5.3762404710132124e-05, + "loss": 0.0066, + "step": 325380 + }, + { + "epoch": 1.64, + "learning_rate": 5.375483701711811e-05, + "loss": 0.0084, + "step": 325390 + }, + { + "epoch": 1.64, + "learning_rate": 5.37472693241041e-05, + "loss": 0.0073, + "step": 325400 + }, + { + "epoch": 1.64, + "learning_rate": 5.3739701631090096e-05, + "loss": 0.0084, + "step": 325410 + }, + { + "epoch": 1.64, + "learning_rate": 5.3732133938076084e-05, + "loss": 0.0061, + "step": 325420 + }, + { + "epoch": 1.64, + "learning_rate": 5.372456624506207e-05, + "loss": 0.0078, + "step": 325430 + }, + { + "epoch": 1.64, + "learning_rate": 5.371699855204806e-05, + "loss": 0.0065, + "step": 325440 + }, + { + "epoch": 1.64, + "learning_rate": 5.3709430859034055e-05, + "loss": 0.0085, + "step": 325450 + }, + { + "epoch": 1.64, + "learning_rate": 5.3701863166020044e-05, + "loss": 0.0056, + "step": 325460 + }, + { + "epoch": 1.64, + "learning_rate": 5.369429547300603e-05, + "loss": 0.0065, + "step": 325470 + }, + { + "epoch": 1.64, + "learning_rate": 5.368672777999202e-05, + "loss": 0.0058, + "step": 325480 + }, + { + "epoch": 1.64, + "learning_rate": 5.3679160086978015e-05, + "loss": 0.0061, + "step": 325490 + }, + { + "epoch": 1.64, + "learning_rate": 5.3671592393964e-05, + "loss": 0.0058, + "step": 325500 + }, + { + "epoch": 1.64, + "learning_rate": 5.366402470094999e-05, + "loss": 0.0066, + "step": 325510 + }, + { + "epoch": 1.64, + "learning_rate": 5.365645700793598e-05, + "loss": 0.006, + "step": 325520 + }, + { + "epoch": 1.64, + "learning_rate": 5.3648889314921975e-05, + "loss": 0.0062, + "step": 325530 + }, + { + "epoch": 1.64, + "learning_rate": 5.364132162190796e-05, + "loss": 0.0098, + "step": 325540 + }, + { + "epoch": 1.64, + "learning_rate": 5.363375392889395e-05, + "loss": 0.005, + "step": 325550 + }, + { + "epoch": 1.64, + "learning_rate": 5.362618623587994e-05, + "loss": 0.0064, + "step": 325560 + }, + { + "epoch": 1.64, + "learning_rate": 5.3618618542865934e-05, + "loss": 0.0107, + "step": 325570 + }, + { + "epoch": 1.64, + "learning_rate": 5.361105084985192e-05, + "loss": 0.0061, + "step": 325580 + }, + { + "epoch": 1.64, + "learning_rate": 5.360348315683791e-05, + "loss": 0.0074, + "step": 325590 + }, + { + "epoch": 1.64, + "learning_rate": 5.35959154638239e-05, + "loss": 0.0061, + "step": 325600 + }, + { + "epoch": 1.64, + "learning_rate": 5.3588347770809894e-05, + "loss": 0.0067, + "step": 325610 + }, + { + "epoch": 1.64, + "learning_rate": 5.358078007779588e-05, + "loss": 0.0098, + "step": 325620 + }, + { + "epoch": 1.64, + "learning_rate": 5.357321238478187e-05, + "loss": 0.0064, + "step": 325630 + }, + { + "epoch": 1.64, + "learning_rate": 5.356564469176786e-05, + "loss": 0.0078, + "step": 325640 + }, + { + "epoch": 1.64, + "learning_rate": 5.3558076998753854e-05, + "loss": 0.0058, + "step": 325650 + }, + { + "epoch": 1.64, + "learning_rate": 5.355050930573984e-05, + "loss": 0.0048, + "step": 325660 + }, + { + "epoch": 1.64, + "learning_rate": 5.354294161272583e-05, + "loss": 0.0049, + "step": 325670 + }, + { + "epoch": 1.64, + "learning_rate": 5.353537391971182e-05, + "loss": 0.0088, + "step": 325680 + }, + { + "epoch": 1.64, + "learning_rate": 5.3527806226697813e-05, + "loss": 0.0072, + "step": 325690 + }, + { + "epoch": 1.64, + "learning_rate": 5.3520238533683795e-05, + "loss": 0.0063, + "step": 325700 + }, + { + "epoch": 1.64, + "learning_rate": 5.351267084066978e-05, + "loss": 0.0052, + "step": 325710 + }, + { + "epoch": 1.64, + "learning_rate": 5.350510314765577e-05, + "loss": 0.006, + "step": 325720 + }, + { + "epoch": 1.64, + "learning_rate": 5.349753545464176e-05, + "loss": 0.0066, + "step": 325730 + }, + { + "epoch": 1.64, + "learning_rate": 5.3489967761627754e-05, + "loss": 0.0058, + "step": 325740 + }, + { + "epoch": 1.64, + "learning_rate": 5.348240006861374e-05, + "loss": 0.0047, + "step": 325750 + }, + { + "epoch": 1.64, + "learning_rate": 5.347483237559973e-05, + "loss": 0.0066, + "step": 325760 + }, + { + "epoch": 1.64, + "learning_rate": 5.3467264682585726e-05, + "loss": 0.0099, + "step": 325770 + }, + { + "epoch": 1.64, + "learning_rate": 5.3459696989571714e-05, + "loss": 0.0074, + "step": 325780 + }, + { + "epoch": 1.64, + "learning_rate": 5.34521292965577e-05, + "loss": 0.0064, + "step": 325790 + }, + { + "epoch": 1.64, + "learning_rate": 5.344456160354369e-05, + "loss": 0.006, + "step": 325800 + }, + { + "epoch": 1.64, + "learning_rate": 5.3436993910529686e-05, + "loss": 0.0066, + "step": 325810 + }, + { + "epoch": 1.64, + "learning_rate": 5.3429426217515674e-05, + "loss": 0.0056, + "step": 325820 + }, + { + "epoch": 1.64, + "learning_rate": 5.342185852450166e-05, + "loss": 0.0071, + "step": 325830 + }, + { + "epoch": 1.64, + "learning_rate": 5.341429083148765e-05, + "loss": 0.0056, + "step": 325840 + }, + { + "epoch": 1.64, + "learning_rate": 5.3406723138473645e-05, + "loss": 0.0098, + "step": 325850 + }, + { + "epoch": 1.64, + "learning_rate": 5.3399155445459633e-05, + "loss": 0.0076, + "step": 325860 + }, + { + "epoch": 1.64, + "learning_rate": 5.339158775244562e-05, + "loss": 0.0083, + "step": 325870 + }, + { + "epoch": 1.64, + "learning_rate": 5.338402005943161e-05, + "loss": 0.0071, + "step": 325880 + }, + { + "epoch": 1.64, + "learning_rate": 5.3376452366417605e-05, + "loss": 0.0045, + "step": 325890 + }, + { + "epoch": 1.64, + "learning_rate": 5.336888467340359e-05, + "loss": 0.0074, + "step": 325900 + }, + { + "epoch": 1.64, + "learning_rate": 5.336131698038958e-05, + "loss": 0.0057, + "step": 325910 + }, + { + "epoch": 1.64, + "learning_rate": 5.335374928737557e-05, + "loss": 0.0084, + "step": 325920 + }, + { + "epoch": 1.64, + "learning_rate": 5.3346181594361565e-05, + "loss": 0.0069, + "step": 325930 + }, + { + "epoch": 1.64, + "learning_rate": 5.333861390134755e-05, + "loss": 0.0058, + "step": 325940 + }, + { + "epoch": 1.64, + "learning_rate": 5.333104620833354e-05, + "loss": 0.0073, + "step": 325950 + }, + { + "epoch": 1.64, + "learning_rate": 5.332347851531953e-05, + "loss": 0.0063, + "step": 325960 + }, + { + "epoch": 1.64, + "learning_rate": 5.3315910822305524e-05, + "loss": 0.0053, + "step": 325970 + }, + { + "epoch": 1.64, + "learning_rate": 5.330834312929151e-05, + "loss": 0.0067, + "step": 325980 + }, + { + "epoch": 1.64, + "learning_rate": 5.33007754362775e-05, + "loss": 0.005, + "step": 325990 + }, + { + "epoch": 1.64, + "learning_rate": 5.329320774326349e-05, + "loss": 0.0066, + "step": 326000 + }, + { + "epoch": 1.64, + "eval_cer": 0.914412032135638, + "eval_loss": 0.004975411109626293, + "eval_runtime": 116.3509, + "eval_samples_per_second": 17.189, + "eval_steps_per_second": 4.297, + "step": 326000 + }, + { + "epoch": 1.64, + "learning_rate": 5.328564005024947e-05, + "loss": 0.011, + "step": 326010 + }, + { + "epoch": 1.64, + "learning_rate": 5.3278072357235465e-05, + "loss": 0.0051, + "step": 326020 + }, + { + "epoch": 1.64, + "learning_rate": 5.3270504664221453e-05, + "loss": 0.0072, + "step": 326030 + }, + { + "epoch": 1.64, + "learning_rate": 5.326293697120744e-05, + "loss": 0.0059, + "step": 326040 + }, + { + "epoch": 1.64, + "learning_rate": 5.325536927819343e-05, + "loss": 0.0075, + "step": 326050 + }, + { + "epoch": 1.65, + "learning_rate": 5.3247801585179425e-05, + "loss": 0.0085, + "step": 326060 + }, + { + "epoch": 1.65, + "learning_rate": 5.324023389216541e-05, + "loss": 0.0048, + "step": 326070 + }, + { + "epoch": 1.65, + "learning_rate": 5.32326661991514e-05, + "loss": 0.0082, + "step": 326080 + }, + { + "epoch": 1.65, + "learning_rate": 5.322509850613739e-05, + "loss": 0.0052, + "step": 326090 + }, + { + "epoch": 1.65, + "learning_rate": 5.3217530813123385e-05, + "loss": 0.0062, + "step": 326100 + }, + { + "epoch": 1.65, + "learning_rate": 5.320996312010937e-05, + "loss": 0.0062, + "step": 326110 + }, + { + "epoch": 1.65, + "learning_rate": 5.320239542709536e-05, + "loss": 0.0097, + "step": 326120 + }, + { + "epoch": 1.65, + "learning_rate": 5.319482773408135e-05, + "loss": 0.008, + "step": 326130 + }, + { + "epoch": 1.65, + "learning_rate": 5.3187260041067344e-05, + "loss": 0.0063, + "step": 326140 + }, + { + "epoch": 1.65, + "learning_rate": 5.317969234805333e-05, + "loss": 0.0053, + "step": 326150 + }, + { + "epoch": 1.65, + "learning_rate": 5.317212465503932e-05, + "loss": 0.0079, + "step": 326160 + }, + { + "epoch": 1.65, + "learning_rate": 5.316455696202531e-05, + "loss": 0.0066, + "step": 326170 + }, + { + "epoch": 1.65, + "learning_rate": 5.3156989269011304e-05, + "loss": 0.0106, + "step": 326180 + }, + { + "epoch": 1.65, + "learning_rate": 5.314942157599729e-05, + "loss": 0.0068, + "step": 326190 + }, + { + "epoch": 1.65, + "learning_rate": 5.314185388298328e-05, + "loss": 0.0056, + "step": 326200 + }, + { + "epoch": 1.65, + "learning_rate": 5.313428618996927e-05, + "loss": 0.0085, + "step": 326210 + }, + { + "epoch": 1.65, + "learning_rate": 5.3126718496955264e-05, + "loss": 0.0069, + "step": 326220 + }, + { + "epoch": 1.65, + "learning_rate": 5.311915080394125e-05, + "loss": 0.0075, + "step": 326230 + }, + { + "epoch": 1.65, + "learning_rate": 5.311158311092724e-05, + "loss": 0.0056, + "step": 326240 + }, + { + "epoch": 1.65, + "learning_rate": 5.310401541791323e-05, + "loss": 0.0067, + "step": 326250 + }, + { + "epoch": 1.65, + "learning_rate": 5.309644772489922e-05, + "loss": 0.0059, + "step": 326260 + }, + { + "epoch": 1.65, + "learning_rate": 5.308888003188521e-05, + "loss": 0.0073, + "step": 326270 + }, + { + "epoch": 1.65, + "learning_rate": 5.30813123388712e-05, + "loss": 0.0054, + "step": 326280 + }, + { + "epoch": 1.65, + "learning_rate": 5.3073744645857195e-05, + "loss": 0.0104, + "step": 326290 + }, + { + "epoch": 1.65, + "learning_rate": 5.306617695284318e-05, + "loss": 0.0088, + "step": 326300 + }, + { + "epoch": 1.65, + "learning_rate": 5.305860925982917e-05, + "loss": 0.0071, + "step": 326310 + }, + { + "epoch": 1.65, + "learning_rate": 5.305104156681515e-05, + "loss": 0.0067, + "step": 326320 + }, + { + "epoch": 1.65, + "learning_rate": 5.304347387380114e-05, + "loss": 0.0068, + "step": 326330 + }, + { + "epoch": 1.65, + "learning_rate": 5.3035906180787136e-05, + "loss": 0.0055, + "step": 326340 + }, + { + "epoch": 1.65, + "learning_rate": 5.3028338487773124e-05, + "loss": 0.0084, + "step": 326350 + }, + { + "epoch": 1.65, + "learning_rate": 5.302077079475911e-05, + "loss": 0.0065, + "step": 326360 + }, + { + "epoch": 1.65, + "learning_rate": 5.30132031017451e-05, + "loss": 0.0058, + "step": 326370 + }, + { + "epoch": 1.65, + "learning_rate": 5.3005635408731095e-05, + "loss": 0.0065, + "step": 326380 + }, + { + "epoch": 1.65, + "learning_rate": 5.2998067715717084e-05, + "loss": 0.0056, + "step": 326390 + }, + { + "epoch": 1.65, + "learning_rate": 5.299050002270307e-05, + "loss": 0.008, + "step": 326400 + }, + { + "epoch": 1.65, + "learning_rate": 5.298293232968906e-05, + "loss": 0.0062, + "step": 326410 + }, + { + "epoch": 1.65, + "learning_rate": 5.2975364636675055e-05, + "loss": 0.0047, + "step": 326420 + }, + { + "epoch": 1.65, + "learning_rate": 5.296779694366104e-05, + "loss": 0.0076, + "step": 326430 + }, + { + "epoch": 1.65, + "learning_rate": 5.296022925064703e-05, + "loss": 0.0056, + "step": 326440 + }, + { + "epoch": 1.65, + "learning_rate": 5.295266155763302e-05, + "loss": 0.0085, + "step": 326450 + }, + { + "epoch": 1.65, + "learning_rate": 5.2945093864619015e-05, + "loss": 0.0072, + "step": 326460 + }, + { + "epoch": 1.65, + "learning_rate": 5.2937526171605e-05, + "loss": 0.0063, + "step": 326470 + }, + { + "epoch": 1.65, + "learning_rate": 5.292995847859099e-05, + "loss": 0.0086, + "step": 326480 + }, + { + "epoch": 1.65, + "learning_rate": 5.292239078557698e-05, + "loss": 0.0087, + "step": 326490 + }, + { + "epoch": 1.65, + "learning_rate": 5.2914823092562974e-05, + "loss": 0.0062, + "step": 326500 + }, + { + "epoch": 1.65, + "learning_rate": 5.290725539954896e-05, + "loss": 0.0056, + "step": 326510 + }, + { + "epoch": 1.65, + "learning_rate": 5.289968770653495e-05, + "loss": 0.007, + "step": 326520 + }, + { + "epoch": 1.65, + "learning_rate": 5.289212001352094e-05, + "loss": 0.0064, + "step": 326530 + }, + { + "epoch": 1.65, + "learning_rate": 5.2884552320506934e-05, + "loss": 0.0077, + "step": 326540 + }, + { + "epoch": 1.65, + "learning_rate": 5.287698462749292e-05, + "loss": 0.0058, + "step": 326550 + }, + { + "epoch": 1.65, + "learning_rate": 5.286941693447891e-05, + "loss": 0.0064, + "step": 326560 + }, + { + "epoch": 1.65, + "learning_rate": 5.28618492414649e-05, + "loss": 0.005, + "step": 326570 + }, + { + "epoch": 1.65, + "learning_rate": 5.2854281548450894e-05, + "loss": 0.007, + "step": 326580 + }, + { + "epoch": 1.65, + "learning_rate": 5.284671385543688e-05, + "loss": 0.0078, + "step": 326590 + }, + { + "epoch": 1.65, + "learning_rate": 5.283914616242287e-05, + "loss": 0.0068, + "step": 326600 + }, + { + "epoch": 1.65, + "learning_rate": 5.283157846940886e-05, + "loss": 0.0074, + "step": 326610 + }, + { + "epoch": 1.65, + "learning_rate": 5.282401077639485e-05, + "loss": 0.0074, + "step": 326620 + }, + { + "epoch": 1.65, + "learning_rate": 5.281644308338084e-05, + "loss": 0.0056, + "step": 326630 + }, + { + "epoch": 1.65, + "learning_rate": 5.280887539036682e-05, + "loss": 0.0094, + "step": 326640 + }, + { + "epoch": 1.65, + "learning_rate": 5.280130769735281e-05, + "loss": 0.005, + "step": 326650 + }, + { + "epoch": 1.65, + "learning_rate": 5.27937400043388e-05, + "loss": 0.0063, + "step": 326660 + }, + { + "epoch": 1.65, + "learning_rate": 5.2786172311324794e-05, + "loss": 0.0066, + "step": 326670 + }, + { + "epoch": 1.65, + "learning_rate": 5.277860461831078e-05, + "loss": 0.006, + "step": 326680 + }, + { + "epoch": 1.65, + "learning_rate": 5.277103692529677e-05, + "loss": 0.0072, + "step": 326690 + }, + { + "epoch": 1.65, + "learning_rate": 5.276346923228276e-05, + "loss": 0.0085, + "step": 326700 + }, + { + "epoch": 1.65, + "learning_rate": 5.2755901539268754e-05, + "loss": 0.0073, + "step": 326710 + }, + { + "epoch": 1.65, + "learning_rate": 5.274833384625474e-05, + "loss": 0.0079, + "step": 326720 + }, + { + "epoch": 1.65, + "learning_rate": 5.274076615324073e-05, + "loss": 0.0054, + "step": 326730 + }, + { + "epoch": 1.65, + "learning_rate": 5.2733198460226725e-05, + "loss": 0.0058, + "step": 326740 + }, + { + "epoch": 1.65, + "learning_rate": 5.2725630767212714e-05, + "loss": 0.006, + "step": 326750 + }, + { + "epoch": 1.65, + "learning_rate": 5.27180630741987e-05, + "loss": 0.0063, + "step": 326760 + }, + { + "epoch": 1.65, + "learning_rate": 5.271049538118469e-05, + "loss": 0.0084, + "step": 326770 + }, + { + "epoch": 1.65, + "learning_rate": 5.2702927688170685e-05, + "loss": 0.0062, + "step": 326780 + }, + { + "epoch": 1.65, + "learning_rate": 5.269535999515667e-05, + "loss": 0.0049, + "step": 326790 + }, + { + "epoch": 1.65, + "learning_rate": 5.268779230214266e-05, + "loss": 0.005, + "step": 326800 + }, + { + "epoch": 1.65, + "learning_rate": 5.268022460912865e-05, + "loss": 0.0072, + "step": 326810 + }, + { + "epoch": 1.65, + "learning_rate": 5.2672656916114645e-05, + "loss": 0.0053, + "step": 326820 + }, + { + "epoch": 1.65, + "learning_rate": 5.266508922310063e-05, + "loss": 0.0061, + "step": 326830 + }, + { + "epoch": 1.65, + "learning_rate": 5.265752153008662e-05, + "loss": 0.0073, + "step": 326840 + }, + { + "epoch": 1.65, + "learning_rate": 5.264995383707261e-05, + "loss": 0.0075, + "step": 326850 + }, + { + "epoch": 1.65, + "learning_rate": 5.2642386144058604e-05, + "loss": 0.0065, + "step": 326860 + }, + { + "epoch": 1.65, + "learning_rate": 5.263481845104459e-05, + "loss": 0.0069, + "step": 326870 + }, + { + "epoch": 1.65, + "learning_rate": 5.262725075803058e-05, + "loss": 0.0062, + "step": 326880 + }, + { + "epoch": 1.65, + "learning_rate": 5.261968306501657e-05, + "loss": 0.0064, + "step": 326890 + }, + { + "epoch": 1.65, + "learning_rate": 5.2612115372002564e-05, + "loss": 0.0066, + "step": 326900 + }, + { + "epoch": 1.65, + "learning_rate": 5.260454767898855e-05, + "loss": 0.0084, + "step": 326910 + }, + { + "epoch": 1.65, + "learning_rate": 5.259697998597454e-05, + "loss": 0.0079, + "step": 326920 + }, + { + "epoch": 1.65, + "learning_rate": 5.258941229296053e-05, + "loss": 0.0051, + "step": 326930 + }, + { + "epoch": 1.65, + "learning_rate": 5.2581844599946524e-05, + "loss": 0.0061, + "step": 326940 + }, + { + "epoch": 1.65, + "learning_rate": 5.2574276906932505e-05, + "loss": 0.0071, + "step": 326950 + }, + { + "epoch": 1.65, + "learning_rate": 5.256670921391849e-05, + "loss": 0.0057, + "step": 326960 + }, + { + "epoch": 1.65, + "learning_rate": 5.255914152090448e-05, + "loss": 0.007, + "step": 326970 + }, + { + "epoch": 1.65, + "learning_rate": 5.255157382789047e-05, + "loss": 0.0067, + "step": 326980 + }, + { + "epoch": 1.65, + "learning_rate": 5.2544006134876465e-05, + "loss": 0.0071, + "step": 326990 + }, + { + "epoch": 1.65, + "learning_rate": 5.253643844186245e-05, + "loss": 0.0055, + "step": 327000 + }, + { + "epoch": 1.65, + "eval_cer": 0.9144285288697699, + "eval_loss": 0.004966360051184893, + "eval_runtime": 116.3822, + "eval_samples_per_second": 17.185, + "eval_steps_per_second": 4.296, + "step": 327000 + }, + { + "epoch": 1.65, + "learning_rate": 5.252887074884844e-05, + "loss": 0.0079, + "step": 327010 + }, + { + "epoch": 1.65, + "learning_rate": 5.252130305583443e-05, + "loss": 0.0102, + "step": 327020 + }, + { + "epoch": 1.65, + "learning_rate": 5.2513735362820424e-05, + "loss": 0.0109, + "step": 327030 + }, + { + "epoch": 1.65, + "learning_rate": 5.250616766980641e-05, + "loss": 0.0065, + "step": 327040 + }, + { + "epoch": 1.65, + "learning_rate": 5.24985999767924e-05, + "loss": 0.0065, + "step": 327050 + }, + { + "epoch": 1.65, + "learning_rate": 5.249103228377839e-05, + "loss": 0.0087, + "step": 327060 + }, + { + "epoch": 1.65, + "learning_rate": 5.2483464590764384e-05, + "loss": 0.0074, + "step": 327070 + }, + { + "epoch": 1.65, + "learning_rate": 5.247589689775037e-05, + "loss": 0.0052, + "step": 327080 + }, + { + "epoch": 1.65, + "learning_rate": 5.246832920473636e-05, + "loss": 0.007, + "step": 327090 + }, + { + "epoch": 1.65, + "learning_rate": 5.246076151172235e-05, + "loss": 0.0056, + "step": 327100 + }, + { + "epoch": 1.65, + "learning_rate": 5.2453193818708344e-05, + "loss": 0.0069, + "step": 327110 + }, + { + "epoch": 1.65, + "learning_rate": 5.244562612569433e-05, + "loss": 0.0079, + "step": 327120 + }, + { + "epoch": 1.65, + "learning_rate": 5.243805843268032e-05, + "loss": 0.0064, + "step": 327130 + }, + { + "epoch": 1.65, + "learning_rate": 5.243049073966631e-05, + "loss": 0.0081, + "step": 327140 + }, + { + "epoch": 1.65, + "learning_rate": 5.2422923046652303e-05, + "loss": 0.007, + "step": 327150 + }, + { + "epoch": 1.65, + "learning_rate": 5.241535535363829e-05, + "loss": 0.0039, + "step": 327160 + }, + { + "epoch": 1.65, + "learning_rate": 5.240778766062428e-05, + "loss": 0.009, + "step": 327170 + }, + { + "epoch": 1.65, + "learning_rate": 5.240021996761027e-05, + "loss": 0.0051, + "step": 327180 + }, + { + "epoch": 1.65, + "learning_rate": 5.239265227459626e-05, + "loss": 0.0056, + "step": 327190 + }, + { + "epoch": 1.65, + "learning_rate": 5.238508458158225e-05, + "loss": 0.0177, + "step": 327200 + }, + { + "epoch": 1.65, + "learning_rate": 5.237751688856824e-05, + "loss": 0.0072, + "step": 327210 + }, + { + "epoch": 1.65, + "learning_rate": 5.236994919555423e-05, + "loss": 0.0075, + "step": 327220 + }, + { + "epoch": 1.65, + "learning_rate": 5.236238150254022e-05, + "loss": 0.0069, + "step": 327230 + }, + { + "epoch": 1.65, + "learning_rate": 5.235481380952621e-05, + "loss": 0.0094, + "step": 327240 + }, + { + "epoch": 1.65, + "learning_rate": 5.23472461165122e-05, + "loss": 0.007, + "step": 327250 + }, + { + "epoch": 1.65, + "learning_rate": 5.2339678423498194e-05, + "loss": 0.0071, + "step": 327260 + }, + { + "epoch": 1.65, + "learning_rate": 5.2332110730484176e-05, + "loss": 0.0079, + "step": 327270 + }, + { + "epoch": 1.65, + "learning_rate": 5.2324543037470164e-05, + "loss": 0.0082, + "step": 327280 + }, + { + "epoch": 1.65, + "learning_rate": 5.231697534445615e-05, + "loss": 0.0086, + "step": 327290 + }, + { + "epoch": 1.65, + "learning_rate": 5.230940765144214e-05, + "loss": 0.0068, + "step": 327300 + }, + { + "epoch": 1.65, + "learning_rate": 5.2301839958428135e-05, + "loss": 0.0058, + "step": 327310 + }, + { + "epoch": 1.65, + "learning_rate": 5.2294272265414123e-05, + "loss": 0.0074, + "step": 327320 + }, + { + "epoch": 1.65, + "learning_rate": 5.228670457240011e-05, + "loss": 0.006, + "step": 327330 + }, + { + "epoch": 1.65, + "learning_rate": 5.22791368793861e-05, + "loss": 0.0045, + "step": 327340 + }, + { + "epoch": 1.65, + "learning_rate": 5.2271569186372095e-05, + "loss": 0.0054, + "step": 327350 + }, + { + "epoch": 1.65, + "learning_rate": 5.226400149335808e-05, + "loss": 0.0073, + "step": 327360 + }, + { + "epoch": 1.65, + "learning_rate": 5.225643380034407e-05, + "loss": 0.007, + "step": 327370 + }, + { + "epoch": 1.65, + "learning_rate": 5.224886610733006e-05, + "loss": 0.0062, + "step": 327380 + }, + { + "epoch": 1.65, + "learning_rate": 5.2241298414316055e-05, + "loss": 0.0051, + "step": 327390 + }, + { + "epoch": 1.65, + "learning_rate": 5.223373072130204e-05, + "loss": 0.0068, + "step": 327400 + }, + { + "epoch": 1.65, + "learning_rate": 5.222616302828803e-05, + "loss": 0.0075, + "step": 327410 + }, + { + "epoch": 1.65, + "learning_rate": 5.221859533527402e-05, + "loss": 0.006, + "step": 327420 + }, + { + "epoch": 1.65, + "learning_rate": 5.2211027642260014e-05, + "loss": 0.0065, + "step": 327430 + }, + { + "epoch": 1.65, + "learning_rate": 5.2203459949246e-05, + "loss": 0.0067, + "step": 327440 + }, + { + "epoch": 1.65, + "learning_rate": 5.219589225623199e-05, + "loss": 0.0053, + "step": 327450 + }, + { + "epoch": 1.65, + "learning_rate": 5.218832456321798e-05, + "loss": 0.006, + "step": 327460 + }, + { + "epoch": 1.65, + "learning_rate": 5.2180756870203974e-05, + "loss": 0.0081, + "step": 327470 + }, + { + "epoch": 1.65, + "learning_rate": 5.217318917718996e-05, + "loss": 0.0066, + "step": 327480 + }, + { + "epoch": 1.65, + "learning_rate": 5.216562148417595e-05, + "loss": 0.0057, + "step": 327490 + }, + { + "epoch": 1.65, + "learning_rate": 5.215805379116194e-05, + "loss": 0.0068, + "step": 327500 + }, + { + "epoch": 1.65, + "learning_rate": 5.2150486098147933e-05, + "loss": 0.0053, + "step": 327510 + }, + { + "epoch": 1.65, + "learning_rate": 5.214291840513392e-05, + "loss": 0.0056, + "step": 327520 + }, + { + "epoch": 1.65, + "learning_rate": 5.213535071211991e-05, + "loss": 0.0052, + "step": 327530 + }, + { + "epoch": 1.65, + "learning_rate": 5.21277830191059e-05, + "loss": 0.0065, + "step": 327540 + }, + { + "epoch": 1.65, + "learning_rate": 5.212021532609189e-05, + "loss": 0.0069, + "step": 327550 + }, + { + "epoch": 1.65, + "learning_rate": 5.211264763307788e-05, + "loss": 0.0082, + "step": 327560 + }, + { + "epoch": 1.65, + "learning_rate": 5.210507994006387e-05, + "loss": 0.0077, + "step": 327570 + }, + { + "epoch": 1.65, + "learning_rate": 5.209751224704985e-05, + "loss": 0.0063, + "step": 327580 + }, + { + "epoch": 1.65, + "learning_rate": 5.208994455403584e-05, + "loss": 0.0051, + "step": 327590 + }, + { + "epoch": 1.65, + "learning_rate": 5.2082376861021834e-05, + "loss": 0.0084, + "step": 327600 + }, + { + "epoch": 1.65, + "learning_rate": 5.207480916800782e-05, + "loss": 0.0051, + "step": 327610 + }, + { + "epoch": 1.65, + "learning_rate": 5.206724147499381e-05, + "loss": 0.0061, + "step": 327620 + }, + { + "epoch": 1.65, + "learning_rate": 5.20596737819798e-05, + "loss": 0.0087, + "step": 327630 + }, + { + "epoch": 1.65, + "learning_rate": 5.2052106088965794e-05, + "loss": 0.0055, + "step": 327640 + }, + { + "epoch": 1.65, + "learning_rate": 5.204453839595178e-05, + "loss": 0.009, + "step": 327650 + }, + { + "epoch": 1.65, + "learning_rate": 5.203697070293777e-05, + "loss": 0.0076, + "step": 327660 + }, + { + "epoch": 1.65, + "learning_rate": 5.202940300992376e-05, + "loss": 0.0053, + "step": 327670 + }, + { + "epoch": 1.65, + "learning_rate": 5.2021835316909754e-05, + "loss": 0.005, + "step": 327680 + }, + { + "epoch": 1.65, + "learning_rate": 5.201426762389574e-05, + "loss": 0.007, + "step": 327690 + }, + { + "epoch": 1.65, + "learning_rate": 5.200669993088173e-05, + "loss": 0.008, + "step": 327700 + }, + { + "epoch": 1.65, + "learning_rate": 5.1999132237867725e-05, + "loss": 0.0068, + "step": 327710 + }, + { + "epoch": 1.65, + "learning_rate": 5.199156454485371e-05, + "loss": 0.0075, + "step": 327720 + }, + { + "epoch": 1.65, + "learning_rate": 5.19839968518397e-05, + "loss": 0.007, + "step": 327730 + }, + { + "epoch": 1.65, + "learning_rate": 5.197642915882569e-05, + "loss": 0.0112, + "step": 327740 + }, + { + "epoch": 1.65, + "learning_rate": 5.1968861465811685e-05, + "loss": 0.0058, + "step": 327750 + }, + { + "epoch": 1.65, + "learning_rate": 5.196129377279767e-05, + "loss": 0.0075, + "step": 327760 + }, + { + "epoch": 1.65, + "learning_rate": 5.195372607978366e-05, + "loss": 0.0057, + "step": 327770 + }, + { + "epoch": 1.65, + "learning_rate": 5.194615838676965e-05, + "loss": 0.0113, + "step": 327780 + }, + { + "epoch": 1.65, + "learning_rate": 5.1938590693755644e-05, + "loss": 0.0053, + "step": 327790 + }, + { + "epoch": 1.65, + "learning_rate": 5.193102300074163e-05, + "loss": 0.0079, + "step": 327800 + }, + { + "epoch": 1.65, + "learning_rate": 5.192345530772762e-05, + "loss": 0.0062, + "step": 327810 + }, + { + "epoch": 1.65, + "learning_rate": 5.191588761471361e-05, + "loss": 0.0065, + "step": 327820 + }, + { + "epoch": 1.65, + "learning_rate": 5.1908319921699604e-05, + "loss": 0.0099, + "step": 327830 + }, + { + "epoch": 1.65, + "learning_rate": 5.190075222868559e-05, + "loss": 0.0071, + "step": 327840 + }, + { + "epoch": 1.65, + "learning_rate": 5.189318453567158e-05, + "loss": 0.0053, + "step": 327850 + }, + { + "epoch": 1.65, + "learning_rate": 5.188561684265757e-05, + "loss": 0.0043, + "step": 327860 + }, + { + "epoch": 1.65, + "learning_rate": 5.1878049149643564e-05, + "loss": 0.0089, + "step": 327870 + }, + { + "epoch": 1.65, + "learning_rate": 5.187048145662955e-05, + "loss": 0.0082, + "step": 327880 + }, + { + "epoch": 1.65, + "learning_rate": 5.186291376361554e-05, + "loss": 0.0058, + "step": 327890 + }, + { + "epoch": 1.65, + "learning_rate": 5.185534607060152e-05, + "loss": 0.0063, + "step": 327900 + }, + { + "epoch": 1.65, + "learning_rate": 5.184777837758751e-05, + "loss": 0.0061, + "step": 327910 + }, + { + "epoch": 1.65, + "learning_rate": 5.1840210684573505e-05, + "loss": 0.007, + "step": 327920 + }, + { + "epoch": 1.65, + "learning_rate": 5.183264299155949e-05, + "loss": 0.0065, + "step": 327930 + }, + { + "epoch": 1.65, + "learning_rate": 5.182507529854548e-05, + "loss": 0.0063, + "step": 327940 + }, + { + "epoch": 1.65, + "learning_rate": 5.181750760553147e-05, + "loss": 0.005, + "step": 327950 + }, + { + "epoch": 1.65, + "learning_rate": 5.1809939912517464e-05, + "loss": 0.0075, + "step": 327960 + }, + { + "epoch": 1.65, + "learning_rate": 5.180237221950345e-05, + "loss": 0.0065, + "step": 327970 + }, + { + "epoch": 1.65, + "learning_rate": 5.179480452648944e-05, + "loss": 0.0056, + "step": 327980 + }, + { + "epoch": 1.65, + "learning_rate": 5.178723683347543e-05, + "loss": 0.0077, + "step": 327990 + }, + { + "epoch": 1.65, + "learning_rate": 5.1779669140461424e-05, + "loss": 0.0089, + "step": 328000 + }, + { + "epoch": 1.65, + "eval_cer": 0.9144556999612812, + "eval_loss": 0.0049345288425683975, + "eval_runtime": 116.3068, + "eval_samples_per_second": 17.196, + "eval_steps_per_second": 4.299, + "step": 328000 + }, + { + "epoch": 1.65, + "learning_rate": 5.177210144744741e-05, + "loss": 0.0068, + "step": 328010 + }, + { + "epoch": 1.65, + "learning_rate": 5.17645337544334e-05, + "loss": 0.0093, + "step": 328020 + }, + { + "epoch": 1.65, + "learning_rate": 5.175696606141939e-05, + "loss": 0.0074, + "step": 328030 + }, + { + "epoch": 1.65, + "learning_rate": 5.1749398368405384e-05, + "loss": 0.006, + "step": 328040 + }, + { + "epoch": 1.66, + "learning_rate": 5.174183067539137e-05, + "loss": 0.0054, + "step": 328050 + }, + { + "epoch": 1.66, + "learning_rate": 5.173426298237736e-05, + "loss": 0.0055, + "step": 328060 + }, + { + "epoch": 1.66, + "learning_rate": 5.172669528936335e-05, + "loss": 0.0067, + "step": 328070 + }, + { + "epoch": 1.66, + "learning_rate": 5.171912759634934e-05, + "loss": 0.0064, + "step": 328080 + }, + { + "epoch": 1.66, + "learning_rate": 5.171155990333533e-05, + "loss": 0.0057, + "step": 328090 + }, + { + "epoch": 1.66, + "learning_rate": 5.170399221032132e-05, + "loss": 0.0059, + "step": 328100 + }, + { + "epoch": 1.66, + "learning_rate": 5.169642451730731e-05, + "loss": 0.0055, + "step": 328110 + }, + { + "epoch": 1.66, + "learning_rate": 5.16888568242933e-05, + "loss": 0.0057, + "step": 328120 + }, + { + "epoch": 1.66, + "learning_rate": 5.168128913127929e-05, + "loss": 0.0062, + "step": 328130 + }, + { + "epoch": 1.66, + "learning_rate": 5.167372143826528e-05, + "loss": 0.008, + "step": 328140 + }, + { + "epoch": 1.66, + "learning_rate": 5.166615374525127e-05, + "loss": 0.0073, + "step": 328150 + }, + { + "epoch": 1.66, + "learning_rate": 5.165858605223726e-05, + "loss": 0.005, + "step": 328160 + }, + { + "epoch": 1.66, + "learning_rate": 5.165101835922325e-05, + "loss": 0.0052, + "step": 328170 + }, + { + "epoch": 1.66, + "learning_rate": 5.164345066620924e-05, + "loss": 0.0042, + "step": 328180 + }, + { + "epoch": 1.66, + "learning_rate": 5.163588297319523e-05, + "loss": 0.0054, + "step": 328190 + }, + { + "epoch": 1.66, + "learning_rate": 5.162831528018122e-05, + "loss": 0.007, + "step": 328200 + }, + { + "epoch": 1.66, + "learning_rate": 5.1620747587167204e-05, + "loss": 0.0072, + "step": 328210 + }, + { + "epoch": 1.66, + "learning_rate": 5.161317989415319e-05, + "loss": 0.0086, + "step": 328220 + }, + { + "epoch": 1.66, + "learning_rate": 5.160561220113918e-05, + "loss": 0.0044, + "step": 328230 + }, + { + "epoch": 1.66, + "learning_rate": 5.1598044508125175e-05, + "loss": 0.0058, + "step": 328240 + }, + { + "epoch": 1.66, + "learning_rate": 5.159047681511116e-05, + "loss": 0.0049, + "step": 328250 + }, + { + "epoch": 1.66, + "learning_rate": 5.158290912209715e-05, + "loss": 0.0066, + "step": 328260 + }, + { + "epoch": 1.66, + "learning_rate": 5.157534142908314e-05, + "loss": 0.0059, + "step": 328270 + }, + { + "epoch": 1.66, + "learning_rate": 5.1567773736069135e-05, + "loss": 0.0073, + "step": 328280 + }, + { + "epoch": 1.66, + "learning_rate": 5.156020604305512e-05, + "loss": 0.0068, + "step": 328290 + }, + { + "epoch": 1.66, + "learning_rate": 5.155263835004111e-05, + "loss": 0.008, + "step": 328300 + }, + { + "epoch": 1.66, + "learning_rate": 5.15450706570271e-05, + "loss": 0.0054, + "step": 328310 + }, + { + "epoch": 1.66, + "learning_rate": 5.1537502964013094e-05, + "loss": 0.0054, + "step": 328320 + }, + { + "epoch": 1.66, + "learning_rate": 5.152993527099908e-05, + "loss": 0.0074, + "step": 328330 + }, + { + "epoch": 1.66, + "learning_rate": 5.152236757798507e-05, + "loss": 0.0094, + "step": 328340 + }, + { + "epoch": 1.66, + "learning_rate": 5.151479988497106e-05, + "loss": 0.0084, + "step": 328350 + }, + { + "epoch": 1.66, + "learning_rate": 5.1507232191957054e-05, + "loss": 0.0069, + "step": 328360 + }, + { + "epoch": 1.66, + "learning_rate": 5.149966449894304e-05, + "loss": 0.005, + "step": 328370 + }, + { + "epoch": 1.66, + "learning_rate": 5.149209680592903e-05, + "loss": 0.0066, + "step": 328380 + }, + { + "epoch": 1.66, + "learning_rate": 5.148452911291502e-05, + "loss": 0.0059, + "step": 328390 + }, + { + "epoch": 1.66, + "learning_rate": 5.1476961419901014e-05, + "loss": 0.0079, + "step": 328400 + }, + { + "epoch": 1.66, + "learning_rate": 5.1469393726887e-05, + "loss": 0.0079, + "step": 328410 + }, + { + "epoch": 1.66, + "learning_rate": 5.146182603387299e-05, + "loss": 0.0074, + "step": 328420 + }, + { + "epoch": 1.66, + "learning_rate": 5.145425834085898e-05, + "loss": 0.0066, + "step": 328430 + }, + { + "epoch": 1.66, + "learning_rate": 5.144669064784497e-05, + "loss": 0.0048, + "step": 328440 + }, + { + "epoch": 1.66, + "learning_rate": 5.143912295483096e-05, + "loss": 0.0058, + "step": 328450 + }, + { + "epoch": 1.66, + "learning_rate": 5.143155526181695e-05, + "loss": 0.0061, + "step": 328460 + }, + { + "epoch": 1.66, + "learning_rate": 5.142398756880294e-05, + "loss": 0.0051, + "step": 328470 + }, + { + "epoch": 1.66, + "learning_rate": 5.141641987578893e-05, + "loss": 0.006, + "step": 328480 + }, + { + "epoch": 1.66, + "learning_rate": 5.140885218277492e-05, + "loss": 0.006, + "step": 328490 + }, + { + "epoch": 1.66, + "learning_rate": 5.140128448976091e-05, + "loss": 0.0077, + "step": 328500 + }, + { + "epoch": 1.66, + "learning_rate": 5.13937167967469e-05, + "loss": 0.0054, + "step": 328510 + }, + { + "epoch": 1.66, + "learning_rate": 5.138614910373288e-05, + "loss": 0.0043, + "step": 328520 + }, + { + "epoch": 1.66, + "learning_rate": 5.1378581410718874e-05, + "loss": 0.0055, + "step": 328530 + }, + { + "epoch": 1.66, + "learning_rate": 5.137101371770486e-05, + "loss": 0.0091, + "step": 328540 + }, + { + "epoch": 1.66, + "learning_rate": 5.136344602469085e-05, + "loss": 0.0063, + "step": 328550 + }, + { + "epoch": 1.66, + "learning_rate": 5.135587833167684e-05, + "loss": 0.0076, + "step": 328560 + }, + { + "epoch": 1.66, + "learning_rate": 5.1348310638662834e-05, + "loss": 0.0081, + "step": 328570 + }, + { + "epoch": 1.66, + "learning_rate": 5.134074294564882e-05, + "loss": 0.0067, + "step": 328580 + }, + { + "epoch": 1.66, + "learning_rate": 5.133317525263481e-05, + "loss": 0.0059, + "step": 328590 + }, + { + "epoch": 1.66, + "learning_rate": 5.13256075596208e-05, + "loss": 0.0071, + "step": 328600 + }, + { + "epoch": 1.66, + "learning_rate": 5.1318039866606793e-05, + "loss": 0.007, + "step": 328610 + }, + { + "epoch": 1.66, + "learning_rate": 5.131047217359278e-05, + "loss": 0.0085, + "step": 328620 + }, + { + "epoch": 1.66, + "learning_rate": 5.130290448057877e-05, + "loss": 0.0058, + "step": 328630 + }, + { + "epoch": 1.66, + "learning_rate": 5.129533678756476e-05, + "loss": 0.0056, + "step": 328640 + }, + { + "epoch": 1.66, + "learning_rate": 5.128776909455075e-05, + "loss": 0.0051, + "step": 328650 + }, + { + "epoch": 1.66, + "learning_rate": 5.128020140153674e-05, + "loss": 0.005, + "step": 328660 + }, + { + "epoch": 1.66, + "learning_rate": 5.127263370852273e-05, + "loss": 0.0089, + "step": 328670 + }, + { + "epoch": 1.66, + "learning_rate": 5.1265066015508724e-05, + "loss": 0.0107, + "step": 328680 + }, + { + "epoch": 1.66, + "learning_rate": 5.125749832249471e-05, + "loss": 0.0069, + "step": 328690 + }, + { + "epoch": 1.66, + "learning_rate": 5.12499306294807e-05, + "loss": 0.0051, + "step": 328700 + }, + { + "epoch": 1.66, + "learning_rate": 5.124236293646669e-05, + "loss": 0.006, + "step": 328710 + }, + { + "epoch": 1.66, + "learning_rate": 5.1234795243452684e-05, + "loss": 0.0064, + "step": 328720 + }, + { + "epoch": 1.66, + "learning_rate": 5.122722755043867e-05, + "loss": 0.0046, + "step": 328730 + }, + { + "epoch": 1.66, + "learning_rate": 5.121965985742466e-05, + "loss": 0.0052, + "step": 328740 + }, + { + "epoch": 1.66, + "learning_rate": 5.121209216441065e-05, + "loss": 0.0061, + "step": 328750 + }, + { + "epoch": 1.66, + "learning_rate": 5.1204524471396644e-05, + "loss": 0.0053, + "step": 328760 + }, + { + "epoch": 1.66, + "learning_rate": 5.119695677838263e-05, + "loss": 0.0052, + "step": 328770 + }, + { + "epoch": 1.66, + "learning_rate": 5.118938908536862e-05, + "loss": 0.0067, + "step": 328780 + }, + { + "epoch": 1.66, + "learning_rate": 5.118182139235461e-05, + "loss": 0.0086, + "step": 328790 + }, + { + "epoch": 1.66, + "learning_rate": 5.1174253699340603e-05, + "loss": 0.0061, + "step": 328800 + }, + { + "epoch": 1.66, + "learning_rate": 5.116668600632659e-05, + "loss": 0.0055, + "step": 328810 + }, + { + "epoch": 1.66, + "learning_rate": 5.115911831331258e-05, + "loss": 0.0063, + "step": 328820 + }, + { + "epoch": 1.66, + "learning_rate": 5.115155062029857e-05, + "loss": 0.006, + "step": 328830 + }, + { + "epoch": 1.66, + "learning_rate": 5.114398292728455e-05, + "loss": 0.005, + "step": 328840 + }, + { + "epoch": 1.66, + "learning_rate": 5.1136415234270545e-05, + "loss": 0.0048, + "step": 328850 + }, + { + "epoch": 1.66, + "learning_rate": 5.112884754125653e-05, + "loss": 0.0061, + "step": 328860 + }, + { + "epoch": 1.66, + "learning_rate": 5.112127984824252e-05, + "loss": 0.0079, + "step": 328870 + }, + { + "epoch": 1.66, + "learning_rate": 5.111371215522851e-05, + "loss": 0.0086, + "step": 328880 + }, + { + "epoch": 1.66, + "learning_rate": 5.1106144462214504e-05, + "loss": 0.0037, + "step": 328890 + }, + { + "epoch": 1.66, + "learning_rate": 5.109857676920049e-05, + "loss": 0.0052, + "step": 328900 + }, + { + "epoch": 1.66, + "learning_rate": 5.109100907618648e-05, + "loss": 0.0073, + "step": 328910 + }, + { + "epoch": 1.66, + "learning_rate": 5.108344138317247e-05, + "loss": 0.0055, + "step": 328920 + }, + { + "epoch": 1.66, + "learning_rate": 5.1075873690158464e-05, + "loss": 0.0083, + "step": 328930 + }, + { + "epoch": 1.66, + "learning_rate": 5.106830599714445e-05, + "loss": 0.0063, + "step": 328940 + }, + { + "epoch": 1.66, + "learning_rate": 5.106073830413044e-05, + "loss": 0.0069, + "step": 328950 + }, + { + "epoch": 1.66, + "learning_rate": 5.105317061111643e-05, + "loss": 0.0074, + "step": 328960 + }, + { + "epoch": 1.66, + "learning_rate": 5.1045602918102423e-05, + "loss": 0.006, + "step": 328970 + }, + { + "epoch": 1.66, + "learning_rate": 5.103803522508841e-05, + "loss": 0.0075, + "step": 328980 + }, + { + "epoch": 1.66, + "learning_rate": 5.10304675320744e-05, + "loss": 0.0056, + "step": 328990 + }, + { + "epoch": 1.66, + "learning_rate": 5.102289983906039e-05, + "loss": 0.0058, + "step": 329000 + }, + { + "epoch": 1.66, + "eval_cer": 0.914447936792278, + "eval_loss": 0.004932132083922625, + "eval_runtime": 116.3131, + "eval_samples_per_second": 17.195, + "eval_steps_per_second": 4.299, + "step": 329000 + }, + { + "epoch": 1.66, + "learning_rate": 5.101533214604638e-05, + "loss": 0.0061, + "step": 329010 + }, + { + "epoch": 1.66, + "learning_rate": 5.100776445303237e-05, + "loss": 0.0075, + "step": 329020 + }, + { + "epoch": 1.66, + "learning_rate": 5.100019676001836e-05, + "loss": 0.0103, + "step": 329030 + }, + { + "epoch": 1.66, + "learning_rate": 5.099262906700435e-05, + "loss": 0.0059, + "step": 329040 + }, + { + "epoch": 1.66, + "learning_rate": 5.098506137399034e-05, + "loss": 0.0064, + "step": 329050 + }, + { + "epoch": 1.66, + "learning_rate": 5.097749368097633e-05, + "loss": 0.0049, + "step": 329060 + }, + { + "epoch": 1.66, + "learning_rate": 5.096992598796232e-05, + "loss": 0.0054, + "step": 329070 + }, + { + "epoch": 1.66, + "learning_rate": 5.096235829494831e-05, + "loss": 0.007, + "step": 329080 + }, + { + "epoch": 1.66, + "learning_rate": 5.09547906019343e-05, + "loss": 0.0062, + "step": 329090 + }, + { + "epoch": 1.66, + "learning_rate": 5.094722290892029e-05, + "loss": 0.0097, + "step": 329100 + }, + { + "epoch": 1.66, + "learning_rate": 5.093965521590628e-05, + "loss": 0.0046, + "step": 329110 + }, + { + "epoch": 1.66, + "learning_rate": 5.093208752289227e-05, + "loss": 0.0081, + "step": 329120 + }, + { + "epoch": 1.66, + "learning_rate": 5.092451982987826e-05, + "loss": 0.0062, + "step": 329130 + }, + { + "epoch": 1.66, + "learning_rate": 5.091695213686425e-05, + "loss": 0.0056, + "step": 329140 + }, + { + "epoch": 1.66, + "learning_rate": 5.090938444385023e-05, + "loss": 0.0063, + "step": 329150 + }, + { + "epoch": 1.66, + "learning_rate": 5.090181675083622e-05, + "loss": 0.0051, + "step": 329160 + }, + { + "epoch": 1.66, + "learning_rate": 5.0894249057822215e-05, + "loss": 0.0069, + "step": 329170 + }, + { + "epoch": 1.66, + "learning_rate": 5.08866813648082e-05, + "loss": 0.0091, + "step": 329180 + }, + { + "epoch": 1.66, + "learning_rate": 5.087911367179419e-05, + "loss": 0.0064, + "step": 329190 + }, + { + "epoch": 1.66, + "learning_rate": 5.087154597878018e-05, + "loss": 0.0076, + "step": 329200 + }, + { + "epoch": 1.66, + "learning_rate": 5.0863978285766175e-05, + "loss": 0.0081, + "step": 329210 + }, + { + "epoch": 1.66, + "learning_rate": 5.085641059275216e-05, + "loss": 0.0079, + "step": 329220 + }, + { + "epoch": 1.66, + "learning_rate": 5.084884289973815e-05, + "loss": 0.0092, + "step": 329230 + }, + { + "epoch": 1.66, + "learning_rate": 5.084127520672414e-05, + "loss": 0.0064, + "step": 329240 + }, + { + "epoch": 1.66, + "learning_rate": 5.0833707513710134e-05, + "loss": 0.0042, + "step": 329250 + }, + { + "epoch": 1.66, + "learning_rate": 5.082613982069612e-05, + "loss": 0.0072, + "step": 329260 + }, + { + "epoch": 1.66, + "learning_rate": 5.081857212768211e-05, + "loss": 0.0075, + "step": 329270 + }, + { + "epoch": 1.66, + "learning_rate": 5.08110044346681e-05, + "loss": 0.0083, + "step": 329280 + }, + { + "epoch": 1.66, + "learning_rate": 5.0803436741654094e-05, + "loss": 0.0065, + "step": 329290 + }, + { + "epoch": 1.66, + "learning_rate": 5.079586904864008e-05, + "loss": 0.0045, + "step": 329300 + }, + { + "epoch": 1.66, + "learning_rate": 5.078830135562607e-05, + "loss": 0.0063, + "step": 329310 + }, + { + "epoch": 1.66, + "learning_rate": 5.078073366261206e-05, + "loss": 0.0064, + "step": 329320 + }, + { + "epoch": 1.66, + "learning_rate": 5.0773165969598054e-05, + "loss": 0.0069, + "step": 329330 + }, + { + "epoch": 1.66, + "learning_rate": 5.076559827658404e-05, + "loss": 0.0073, + "step": 329340 + }, + { + "epoch": 1.66, + "learning_rate": 5.075803058357003e-05, + "loss": 0.0062, + "step": 329350 + }, + { + "epoch": 1.66, + "learning_rate": 5.075046289055602e-05, + "loss": 0.0078, + "step": 329360 + }, + { + "epoch": 1.66, + "learning_rate": 5.074289519754201e-05, + "loss": 0.0059, + "step": 329370 + }, + { + "epoch": 1.66, + "learning_rate": 5.0735327504528e-05, + "loss": 0.0109, + "step": 329380 + }, + { + "epoch": 1.66, + "learning_rate": 5.072775981151399e-05, + "loss": 0.0044, + "step": 329390 + }, + { + "epoch": 1.66, + "learning_rate": 5.072019211849998e-05, + "loss": 0.0061, + "step": 329400 + }, + { + "epoch": 1.66, + "learning_rate": 5.071262442548597e-05, + "loss": 0.0076, + "step": 329410 + }, + { + "epoch": 1.66, + "learning_rate": 5.070505673247196e-05, + "loss": 0.0054, + "step": 329420 + }, + { + "epoch": 1.66, + "learning_rate": 5.069748903945795e-05, + "loss": 0.0061, + "step": 329430 + }, + { + "epoch": 1.66, + "learning_rate": 5.068992134644394e-05, + "loss": 0.0068, + "step": 329440 + }, + { + "epoch": 1.66, + "learning_rate": 5.068235365342993e-05, + "loss": 0.0077, + "step": 329450 + }, + { + "epoch": 1.66, + "learning_rate": 5.067478596041592e-05, + "loss": 0.008, + "step": 329460 + }, + { + "epoch": 1.66, + "learning_rate": 5.06672182674019e-05, + "loss": 0.0062, + "step": 329470 + }, + { + "epoch": 1.66, + "learning_rate": 5.065965057438789e-05, + "loss": 0.0064, + "step": 329480 + }, + { + "epoch": 1.66, + "learning_rate": 5.065208288137388e-05, + "loss": 0.0072, + "step": 329490 + }, + { + "epoch": 1.66, + "learning_rate": 5.0644515188359874e-05, + "loss": 0.0054, + "step": 329500 + }, + { + "epoch": 1.66, + "learning_rate": 5.063694749534586e-05, + "loss": 0.0047, + "step": 329510 + }, + { + "epoch": 1.66, + "learning_rate": 5.062937980233185e-05, + "loss": 0.0085, + "step": 329520 + }, + { + "epoch": 1.66, + "learning_rate": 5.062181210931784e-05, + "loss": 0.007, + "step": 329530 + }, + { + "epoch": 1.66, + "learning_rate": 5.061424441630383e-05, + "loss": 0.0064, + "step": 329540 + }, + { + "epoch": 1.66, + "learning_rate": 5.060667672328982e-05, + "loss": 0.0057, + "step": 329550 + }, + { + "epoch": 1.66, + "learning_rate": 5.059910903027581e-05, + "loss": 0.0054, + "step": 329560 + }, + { + "epoch": 1.66, + "learning_rate": 5.05915413372618e-05, + "loss": 0.0071, + "step": 329570 + }, + { + "epoch": 1.66, + "learning_rate": 5.058397364424779e-05, + "loss": 0.0069, + "step": 329580 + }, + { + "epoch": 1.66, + "learning_rate": 5.057640595123378e-05, + "loss": 0.0068, + "step": 329590 + }, + { + "epoch": 1.66, + "learning_rate": 5.056883825821977e-05, + "loss": 0.0047, + "step": 329600 + }, + { + "epoch": 1.66, + "learning_rate": 5.056127056520576e-05, + "loss": 0.006, + "step": 329610 + }, + { + "epoch": 1.66, + "learning_rate": 5.055370287219175e-05, + "loss": 0.0069, + "step": 329620 + }, + { + "epoch": 1.66, + "learning_rate": 5.054613517917774e-05, + "loss": 0.0072, + "step": 329630 + }, + { + "epoch": 1.66, + "learning_rate": 5.053856748616373e-05, + "loss": 0.0065, + "step": 329640 + }, + { + "epoch": 1.66, + "learning_rate": 5.0530999793149724e-05, + "loss": 0.0072, + "step": 329650 + }, + { + "epoch": 1.66, + "learning_rate": 5.052343210013571e-05, + "loss": 0.0083, + "step": 329660 + }, + { + "epoch": 1.66, + "learning_rate": 5.05158644071217e-05, + "loss": 0.0061, + "step": 329670 + }, + { + "epoch": 1.66, + "learning_rate": 5.050829671410769e-05, + "loss": 0.0061, + "step": 329680 + }, + { + "epoch": 1.66, + "learning_rate": 5.0500729021093684e-05, + "loss": 0.0079, + "step": 329690 + }, + { + "epoch": 1.66, + "learning_rate": 5.049316132807967e-05, + "loss": 0.0057, + "step": 329700 + }, + { + "epoch": 1.66, + "learning_rate": 5.048559363506566e-05, + "loss": 0.0061, + "step": 329710 + }, + { + "epoch": 1.66, + "learning_rate": 5.047802594205165e-05, + "loss": 0.0071, + "step": 329720 + }, + { + "epoch": 1.66, + "learning_rate": 5.047045824903764e-05, + "loss": 0.0062, + "step": 329730 + }, + { + "epoch": 1.66, + "learning_rate": 5.046289055602363e-05, + "loss": 0.0075, + "step": 329740 + }, + { + "epoch": 1.66, + "learning_rate": 5.045532286300962e-05, + "loss": 0.0062, + "step": 329750 + }, + { + "epoch": 1.66, + "learning_rate": 5.044775516999561e-05, + "loss": 0.0061, + "step": 329760 + }, + { + "epoch": 1.66, + "learning_rate": 5.04401874769816e-05, + "loss": 0.0073, + "step": 329770 + }, + { + "epoch": 1.66, + "learning_rate": 5.0432619783967584e-05, + "loss": 0.0082, + "step": 329780 + }, + { + "epoch": 1.66, + "learning_rate": 5.042505209095357e-05, + "loss": 0.0096, + "step": 329790 + }, + { + "epoch": 1.66, + "learning_rate": 5.041748439793956e-05, + "loss": 0.0054, + "step": 329800 + }, + { + "epoch": 1.66, + "learning_rate": 5.040991670492555e-05, + "loss": 0.0064, + "step": 329810 + }, + { + "epoch": 1.66, + "learning_rate": 5.0402349011911544e-05, + "loss": 0.0067, + "step": 329820 + }, + { + "epoch": 1.66, + "learning_rate": 5.039478131889753e-05, + "loss": 0.0074, + "step": 329830 + }, + { + "epoch": 1.66, + "learning_rate": 5.038721362588352e-05, + "loss": 0.0054, + "step": 329840 + }, + { + "epoch": 1.66, + "learning_rate": 5.037964593286951e-05, + "loss": 0.006, + "step": 329850 + }, + { + "epoch": 1.66, + "learning_rate": 5.0372078239855504e-05, + "loss": 0.0051, + "step": 329860 + }, + { + "epoch": 1.66, + "learning_rate": 5.036451054684149e-05, + "loss": 0.0104, + "step": 329870 + }, + { + "epoch": 1.66, + "learning_rate": 5.035694285382748e-05, + "loss": 0.0092, + "step": 329880 + }, + { + "epoch": 1.66, + "learning_rate": 5.034937516081347e-05, + "loss": 0.0056, + "step": 329890 + }, + { + "epoch": 1.66, + "learning_rate": 5.034180746779946e-05, + "loss": 0.0066, + "step": 329900 + }, + { + "epoch": 1.66, + "learning_rate": 5.033423977478545e-05, + "loss": 0.0043, + "step": 329910 + }, + { + "epoch": 1.66, + "learning_rate": 5.032667208177144e-05, + "loss": 0.0056, + "step": 329920 + }, + { + "epoch": 1.66, + "learning_rate": 5.031910438875743e-05, + "loss": 0.0056, + "step": 329930 + }, + { + "epoch": 1.66, + "learning_rate": 5.031153669574342e-05, + "loss": 0.0047, + "step": 329940 + }, + { + "epoch": 1.66, + "learning_rate": 5.030396900272941e-05, + "loss": 0.0059, + "step": 329950 + }, + { + "epoch": 1.66, + "learning_rate": 5.02964013097154e-05, + "loss": 0.0065, + "step": 329960 + }, + { + "epoch": 1.66, + "learning_rate": 5.028883361670139e-05, + "loss": 0.0067, + "step": 329970 + }, + { + "epoch": 1.66, + "learning_rate": 5.028126592368738e-05, + "loss": 0.0058, + "step": 329980 + }, + { + "epoch": 1.66, + "learning_rate": 5.027369823067337e-05, + "loss": 0.0065, + "step": 329990 + }, + { + "epoch": 1.66, + "learning_rate": 5.026613053765936e-05, + "loss": 0.0077, + "step": 330000 + }, + { + "epoch": 1.66, + "eval_cer": 0.9144411440194001, + "eval_loss": 0.0048608663491904736, + "eval_runtime": 116.3415, + "eval_samples_per_second": 17.191, + "eval_steps_per_second": 4.298, + "step": 330000 + }, + { + "epoch": 1.66, + "learning_rate": 5.025856284464535e-05, + "loss": 0.0047, + "step": 330010 + }, + { + "epoch": 1.66, + "learning_rate": 5.025099515163134e-05, + "loss": 0.0089, + "step": 330020 + }, + { + "epoch": 1.67, + "learning_rate": 5.024342745861733e-05, + "loss": 0.0044, + "step": 330030 + }, + { + "epoch": 1.67, + "learning_rate": 5.023585976560332e-05, + "loss": 0.0054, + "step": 330040 + }, + { + "epoch": 1.67, + "learning_rate": 5.022829207258931e-05, + "loss": 0.0054, + "step": 330050 + }, + { + "epoch": 1.67, + "learning_rate": 5.02207243795753e-05, + "loss": 0.0059, + "step": 330060 + }, + { + "epoch": 1.67, + "learning_rate": 5.021315668656129e-05, + "loss": 0.0058, + "step": 330070 + }, + { + "epoch": 1.67, + "learning_rate": 5.020558899354728e-05, + "loss": 0.0048, + "step": 330080 + }, + { + "epoch": 1.67, + "learning_rate": 5.019802130053326e-05, + "loss": 0.0071, + "step": 330090 + }, + { + "epoch": 1.67, + "learning_rate": 5.0190453607519255e-05, + "loss": 0.0059, + "step": 330100 + }, + { + "epoch": 1.67, + "learning_rate": 5.018288591450524e-05, + "loss": 0.0076, + "step": 330110 + }, + { + "epoch": 1.67, + "learning_rate": 5.017531822149123e-05, + "loss": 0.0066, + "step": 330120 + }, + { + "epoch": 1.67, + "learning_rate": 5.016775052847722e-05, + "loss": 0.0075, + "step": 330130 + }, + { + "epoch": 1.67, + "learning_rate": 5.0160182835463214e-05, + "loss": 0.007, + "step": 330140 + }, + { + "epoch": 1.67, + "learning_rate": 5.01526151424492e-05, + "loss": 0.01, + "step": 330150 + }, + { + "epoch": 1.67, + "learning_rate": 5.014504744943519e-05, + "loss": 0.0053, + "step": 330160 + }, + { + "epoch": 1.67, + "learning_rate": 5.013747975642118e-05, + "loss": 0.0063, + "step": 330170 + }, + { + "epoch": 1.67, + "learning_rate": 5.0129912063407174e-05, + "loss": 0.0064, + "step": 330180 + }, + { + "epoch": 1.67, + "learning_rate": 5.012234437039316e-05, + "loss": 0.0063, + "step": 330190 + }, + { + "epoch": 1.67, + "learning_rate": 5.011477667737915e-05, + "loss": 0.0055, + "step": 330200 + }, + { + "epoch": 1.67, + "learning_rate": 5.010720898436514e-05, + "loss": 0.0057, + "step": 330210 + }, + { + "epoch": 1.67, + "learning_rate": 5.0099641291351134e-05, + "loss": 0.0065, + "step": 330220 + }, + { + "epoch": 1.67, + "learning_rate": 5.009207359833712e-05, + "loss": 0.0079, + "step": 330230 + }, + { + "epoch": 1.67, + "learning_rate": 5.008450590532311e-05, + "loss": 0.0063, + "step": 330240 + }, + { + "epoch": 1.67, + "learning_rate": 5.00769382123091e-05, + "loss": 0.005, + "step": 330250 + }, + { + "epoch": 1.67, + "learning_rate": 5.0069370519295093e-05, + "loss": 0.0066, + "step": 330260 + }, + { + "epoch": 1.67, + "learning_rate": 5.006180282628108e-05, + "loss": 0.0073, + "step": 330270 + }, + { + "epoch": 1.67, + "learning_rate": 5.005423513326707e-05, + "loss": 0.0053, + "step": 330280 + }, + { + "epoch": 1.67, + "learning_rate": 5.004666744025306e-05, + "loss": 0.0074, + "step": 330290 + }, + { + "epoch": 1.67, + "learning_rate": 5.003909974723905e-05, + "loss": 0.006, + "step": 330300 + }, + { + "epoch": 1.67, + "learning_rate": 5.003153205422504e-05, + "loss": 0.0068, + "step": 330310 + }, + { + "epoch": 1.67, + "learning_rate": 5.002396436121103e-05, + "loss": 0.006, + "step": 330320 + }, + { + "epoch": 1.67, + "learning_rate": 5.001639666819702e-05, + "loss": 0.0099, + "step": 330330 + }, + { + "epoch": 1.67, + "learning_rate": 5.000882897518301e-05, + "loss": 0.0059, + "step": 330340 + }, + { + "epoch": 1.67, + "learning_rate": 5.0001261282169e-05, + "loss": 0.0059, + "step": 330350 + }, + { + "epoch": 1.67, + "learning_rate": 4.999369358915499e-05, + "loss": 0.0065, + "step": 330360 + }, + { + "epoch": 1.67, + "learning_rate": 4.998612589614098e-05, + "loss": 0.0073, + "step": 330370 + }, + { + "epoch": 1.67, + "learning_rate": 4.997855820312697e-05, + "loss": 0.0072, + "step": 330380 + }, + { + "epoch": 1.67, + "learning_rate": 4.997099051011296e-05, + "loss": 0.0075, + "step": 330390 + }, + { + "epoch": 1.67, + "learning_rate": 4.996342281709895e-05, + "loss": 0.0042, + "step": 330400 + }, + { + "epoch": 1.67, + "learning_rate": 4.995585512408493e-05, + "loss": 0.0054, + "step": 330410 + }, + { + "epoch": 1.67, + "learning_rate": 4.994828743107092e-05, + "loss": 0.0071, + "step": 330420 + }, + { + "epoch": 1.67, + "learning_rate": 4.9940719738056913e-05, + "loss": 0.0069, + "step": 330430 + }, + { + "epoch": 1.67, + "learning_rate": 4.99331520450429e-05, + "loss": 0.0085, + "step": 330440 + }, + { + "epoch": 1.67, + "learning_rate": 4.992558435202889e-05, + "loss": 0.0114, + "step": 330450 + }, + { + "epoch": 1.67, + "learning_rate": 4.991801665901488e-05, + "loss": 0.0063, + "step": 330460 + }, + { + "epoch": 1.67, + "learning_rate": 4.991044896600087e-05, + "loss": 0.0049, + "step": 330470 + }, + { + "epoch": 1.67, + "learning_rate": 4.990288127298686e-05, + "loss": 0.0147, + "step": 330480 + }, + { + "epoch": 1.67, + "learning_rate": 4.989531357997285e-05, + "loss": 0.0079, + "step": 330490 + }, + { + "epoch": 1.67, + "learning_rate": 4.988774588695884e-05, + "loss": 0.0078, + "step": 330500 + }, + { + "epoch": 1.67, + "learning_rate": 4.988017819394483e-05, + "loss": 0.0068, + "step": 330510 + }, + { + "epoch": 1.67, + "learning_rate": 4.987261050093082e-05, + "loss": 0.0068, + "step": 330520 + }, + { + "epoch": 1.67, + "learning_rate": 4.986504280791681e-05, + "loss": 0.0074, + "step": 330530 + }, + { + "epoch": 1.67, + "learning_rate": 4.98574751149028e-05, + "loss": 0.0063, + "step": 330540 + }, + { + "epoch": 1.67, + "learning_rate": 4.984990742188879e-05, + "loss": 0.0065, + "step": 330550 + }, + { + "epoch": 1.67, + "learning_rate": 4.984233972887478e-05, + "loss": 0.0055, + "step": 330560 + }, + { + "epoch": 1.67, + "learning_rate": 4.983477203586077e-05, + "loss": 0.0076, + "step": 330570 + }, + { + "epoch": 1.67, + "learning_rate": 4.982720434284676e-05, + "loss": 0.0055, + "step": 330580 + }, + { + "epoch": 1.67, + "learning_rate": 4.981963664983275e-05, + "loss": 0.0046, + "step": 330590 + }, + { + "epoch": 1.67, + "learning_rate": 4.981206895681874e-05, + "loss": 0.0068, + "step": 330600 + }, + { + "epoch": 1.67, + "learning_rate": 4.980450126380473e-05, + "loss": 0.0074, + "step": 330610 + }, + { + "epoch": 1.67, + "learning_rate": 4.9796933570790724e-05, + "loss": 0.006, + "step": 330620 + }, + { + "epoch": 1.67, + "learning_rate": 4.978936587777671e-05, + "loss": 0.0085, + "step": 330630 + }, + { + "epoch": 1.67, + "learning_rate": 4.97817981847627e-05, + "loss": 0.0052, + "step": 330640 + }, + { + "epoch": 1.67, + "learning_rate": 4.977423049174869e-05, + "loss": 0.0072, + "step": 330650 + }, + { + "epoch": 1.67, + "learning_rate": 4.976666279873468e-05, + "loss": 0.0066, + "step": 330660 + }, + { + "epoch": 1.67, + "learning_rate": 4.975909510572067e-05, + "loss": 0.0069, + "step": 330670 + }, + { + "epoch": 1.67, + "learning_rate": 4.975152741270666e-05, + "loss": 0.0071, + "step": 330680 + }, + { + "epoch": 1.67, + "learning_rate": 4.974395971969265e-05, + "loss": 0.0065, + "step": 330690 + }, + { + "epoch": 1.67, + "learning_rate": 4.973639202667864e-05, + "loss": 0.0071, + "step": 330700 + }, + { + "epoch": 1.67, + "learning_rate": 4.972882433366463e-05, + "loss": 0.0089, + "step": 330710 + }, + { + "epoch": 1.67, + "learning_rate": 4.972125664065061e-05, + "loss": 0.0071, + "step": 330720 + }, + { + "epoch": 1.67, + "learning_rate": 4.97136889476366e-05, + "loss": 0.0068, + "step": 330730 + }, + { + "epoch": 1.67, + "learning_rate": 4.970612125462259e-05, + "loss": 0.0069, + "step": 330740 + }, + { + "epoch": 1.67, + "learning_rate": 4.9698553561608584e-05, + "loss": 0.0073, + "step": 330750 + }, + { + "epoch": 1.67, + "learning_rate": 4.969098586859457e-05, + "loss": 0.005, + "step": 330760 + }, + { + "epoch": 1.67, + "learning_rate": 4.968341817558056e-05, + "loss": 0.0039, + "step": 330770 + }, + { + "epoch": 1.67, + "learning_rate": 4.967585048256655e-05, + "loss": 0.0102, + "step": 330780 + }, + { + "epoch": 1.67, + "learning_rate": 4.9668282789552544e-05, + "loss": 0.0076, + "step": 330790 + }, + { + "epoch": 1.67, + "learning_rate": 4.966071509653853e-05, + "loss": 0.006, + "step": 330800 + }, + { + "epoch": 1.67, + "learning_rate": 4.965314740352452e-05, + "loss": 0.0046, + "step": 330810 + }, + { + "epoch": 1.67, + "learning_rate": 4.964557971051051e-05, + "loss": 0.0051, + "step": 330820 + }, + { + "epoch": 1.67, + "learning_rate": 4.96380120174965e-05, + "loss": 0.0071, + "step": 330830 + }, + { + "epoch": 1.67, + "learning_rate": 4.963044432448249e-05, + "loss": 0.0065, + "step": 330840 + }, + { + "epoch": 1.67, + "learning_rate": 4.962287663146848e-05, + "loss": 0.0063, + "step": 330850 + }, + { + "epoch": 1.67, + "learning_rate": 4.961530893845447e-05, + "loss": 0.0069, + "step": 330860 + }, + { + "epoch": 1.67, + "learning_rate": 4.960774124544046e-05, + "loss": 0.0075, + "step": 330870 + }, + { + "epoch": 1.67, + "learning_rate": 4.960017355242645e-05, + "loss": 0.0052, + "step": 330880 + }, + { + "epoch": 1.67, + "learning_rate": 4.959260585941244e-05, + "loss": 0.0052, + "step": 330890 + }, + { + "epoch": 1.67, + "learning_rate": 4.958503816639843e-05, + "loss": 0.0063, + "step": 330900 + }, + { + "epoch": 1.67, + "learning_rate": 4.957747047338442e-05, + "loss": 0.0069, + "step": 330910 + }, + { + "epoch": 1.67, + "learning_rate": 4.956990278037041e-05, + "loss": 0.007, + "step": 330920 + }, + { + "epoch": 1.67, + "learning_rate": 4.95623350873564e-05, + "loss": 0.0081, + "step": 330930 + }, + { + "epoch": 1.67, + "learning_rate": 4.955476739434239e-05, + "loss": 0.0058, + "step": 330940 + }, + { + "epoch": 1.67, + "learning_rate": 4.954719970132838e-05, + "loss": 0.0089, + "step": 330950 + }, + { + "epoch": 1.67, + "learning_rate": 4.953963200831437e-05, + "loss": 0.007, + "step": 330960 + }, + { + "epoch": 1.67, + "learning_rate": 4.953206431530036e-05, + "loss": 0.006, + "step": 330970 + }, + { + "epoch": 1.67, + "learning_rate": 4.952449662228635e-05, + "loss": 0.0066, + "step": 330980 + }, + { + "epoch": 1.67, + "learning_rate": 4.951692892927234e-05, + "loss": 0.0059, + "step": 330990 + }, + { + "epoch": 1.67, + "learning_rate": 4.950936123625833e-05, + "loss": 0.0054, + "step": 331000 + }, + { + "epoch": 1.67, + "eval_cer": 0.9144440552077764, + "eval_loss": 0.004910916555672884, + "eval_runtime": 116.3705, + "eval_samples_per_second": 17.186, + "eval_steps_per_second": 4.297, + "step": 331000 + }, + { + "epoch": 1.67, + "learning_rate": 4.950179354324432e-05, + "loss": 0.0073, + "step": 331010 + }, + { + "epoch": 1.67, + "learning_rate": 4.9494225850230306e-05, + "loss": 0.0054, + "step": 331020 + }, + { + "epoch": 1.67, + "learning_rate": 4.94866581572163e-05, + "loss": 0.0066, + "step": 331030 + }, + { + "epoch": 1.67, + "learning_rate": 4.947909046420228e-05, + "loss": 0.0073, + "step": 331040 + }, + { + "epoch": 1.67, + "learning_rate": 4.947152277118827e-05, + "loss": 0.0093, + "step": 331050 + }, + { + "epoch": 1.67, + "learning_rate": 4.946395507817426e-05, + "loss": 0.0066, + "step": 331060 + }, + { + "epoch": 1.67, + "learning_rate": 4.9456387385160254e-05, + "loss": 0.0041, + "step": 331070 + }, + { + "epoch": 1.67, + "learning_rate": 4.944881969214624e-05, + "loss": 0.0065, + "step": 331080 + }, + { + "epoch": 1.67, + "learning_rate": 4.944125199913223e-05, + "loss": 0.005, + "step": 331090 + }, + { + "epoch": 1.67, + "learning_rate": 4.943368430611822e-05, + "loss": 0.0068, + "step": 331100 + }, + { + "epoch": 1.67, + "learning_rate": 4.9426116613104214e-05, + "loss": 0.0081, + "step": 331110 + }, + { + "epoch": 1.67, + "learning_rate": 4.94185489200902e-05, + "loss": 0.006, + "step": 331120 + }, + { + "epoch": 1.67, + "learning_rate": 4.941098122707619e-05, + "loss": 0.0072, + "step": 331130 + }, + { + "epoch": 1.67, + "learning_rate": 4.940341353406218e-05, + "loss": 0.0058, + "step": 331140 + }, + { + "epoch": 1.67, + "learning_rate": 4.9395845841048174e-05, + "loss": 0.0077, + "step": 331150 + }, + { + "epoch": 1.67, + "learning_rate": 4.938827814803416e-05, + "loss": 0.005, + "step": 331160 + }, + { + "epoch": 1.67, + "learning_rate": 4.938071045502015e-05, + "loss": 0.0091, + "step": 331170 + }, + { + "epoch": 1.67, + "learning_rate": 4.937314276200614e-05, + "loss": 0.006, + "step": 331180 + }, + { + "epoch": 1.67, + "learning_rate": 4.936557506899213e-05, + "loss": 0.0051, + "step": 331190 + }, + { + "epoch": 1.67, + "learning_rate": 4.935800737597812e-05, + "loss": 0.0047, + "step": 331200 + }, + { + "epoch": 1.67, + "learning_rate": 4.935043968296411e-05, + "loss": 0.006, + "step": 331210 + }, + { + "epoch": 1.67, + "learning_rate": 4.93428719899501e-05, + "loss": 0.0071, + "step": 331220 + }, + { + "epoch": 1.67, + "learning_rate": 4.933530429693609e-05, + "loss": 0.0066, + "step": 331230 + }, + { + "epoch": 1.67, + "learning_rate": 4.932773660392208e-05, + "loss": 0.0072, + "step": 331240 + }, + { + "epoch": 1.67, + "learning_rate": 4.932016891090807e-05, + "loss": 0.0072, + "step": 331250 + }, + { + "epoch": 1.67, + "learning_rate": 4.931260121789406e-05, + "loss": 0.0077, + "step": 331260 + }, + { + "epoch": 1.67, + "learning_rate": 4.930503352488005e-05, + "loss": 0.0057, + "step": 331270 + }, + { + "epoch": 1.67, + "learning_rate": 4.929746583186604e-05, + "loss": 0.0063, + "step": 331280 + }, + { + "epoch": 1.67, + "learning_rate": 4.928989813885203e-05, + "loss": 0.0064, + "step": 331290 + }, + { + "epoch": 1.67, + "learning_rate": 4.928233044583802e-05, + "loss": 0.0052, + "step": 331300 + }, + { + "epoch": 1.67, + "learning_rate": 4.927476275282401e-05, + "loss": 0.008, + "step": 331310 + }, + { + "epoch": 1.67, + "learning_rate": 4.926719505981e-05, + "loss": 0.0098, + "step": 331320 + }, + { + "epoch": 1.67, + "learning_rate": 4.925962736679599e-05, + "loss": 0.0051, + "step": 331330 + }, + { + "epoch": 1.67, + "learning_rate": 4.925205967378198e-05, + "loss": 0.0079, + "step": 331340 + }, + { + "epoch": 1.67, + "learning_rate": 4.924449198076796e-05, + "loss": 0.0053, + "step": 331350 + }, + { + "epoch": 1.67, + "learning_rate": 4.923692428775395e-05, + "loss": 0.0054, + "step": 331360 + }, + { + "epoch": 1.67, + "learning_rate": 4.922935659473994e-05, + "loss": 0.0062, + "step": 331370 + }, + { + "epoch": 1.67, + "learning_rate": 4.922178890172593e-05, + "loss": 0.0085, + "step": 331380 + }, + { + "epoch": 1.67, + "learning_rate": 4.921422120871192e-05, + "loss": 0.0054, + "step": 331390 + }, + { + "epoch": 1.67, + "learning_rate": 4.920665351569791e-05, + "loss": 0.006, + "step": 331400 + }, + { + "epoch": 1.67, + "learning_rate": 4.91990858226839e-05, + "loss": 0.007, + "step": 331410 + }, + { + "epoch": 1.67, + "learning_rate": 4.919151812966989e-05, + "loss": 0.0071, + "step": 331420 + }, + { + "epoch": 1.67, + "learning_rate": 4.918395043665588e-05, + "loss": 0.0067, + "step": 331430 + }, + { + "epoch": 1.67, + "learning_rate": 4.917638274364187e-05, + "loss": 0.0056, + "step": 331440 + }, + { + "epoch": 1.67, + "learning_rate": 4.916881505062786e-05, + "loss": 0.005, + "step": 331450 + }, + { + "epoch": 1.67, + "learning_rate": 4.916124735761385e-05, + "loss": 0.0062, + "step": 331460 + }, + { + "epoch": 1.67, + "learning_rate": 4.915367966459984e-05, + "loss": 0.0053, + "step": 331470 + }, + { + "epoch": 1.67, + "learning_rate": 4.914611197158583e-05, + "loss": 0.0065, + "step": 331480 + }, + { + "epoch": 1.67, + "learning_rate": 4.913854427857182e-05, + "loss": 0.0052, + "step": 331490 + }, + { + "epoch": 1.67, + "learning_rate": 4.913097658555781e-05, + "loss": 0.0074, + "step": 331500 + }, + { + "epoch": 1.67, + "learning_rate": 4.91234088925438e-05, + "loss": 0.0082, + "step": 331510 + }, + { + "epoch": 1.67, + "learning_rate": 4.911584119952979e-05, + "loss": 0.0073, + "step": 331520 + }, + { + "epoch": 1.67, + "learning_rate": 4.910827350651578e-05, + "loss": 0.0059, + "step": 331530 + }, + { + "epoch": 1.67, + "learning_rate": 4.910070581350177e-05, + "loss": 0.0064, + "step": 331540 + }, + { + "epoch": 1.67, + "learning_rate": 4.909313812048776e-05, + "loss": 0.0079, + "step": 331550 + }, + { + "epoch": 1.67, + "learning_rate": 4.908557042747375e-05, + "loss": 0.0069, + "step": 331560 + }, + { + "epoch": 1.67, + "learning_rate": 4.907800273445974e-05, + "loss": 0.0056, + "step": 331570 + }, + { + "epoch": 1.67, + "learning_rate": 4.907043504144573e-05, + "loss": 0.0063, + "step": 331580 + }, + { + "epoch": 1.67, + "learning_rate": 4.906286734843172e-05, + "loss": 0.0058, + "step": 331590 + }, + { + "epoch": 1.67, + "learning_rate": 4.905529965541771e-05, + "loss": 0.0055, + "step": 331600 + }, + { + "epoch": 1.67, + "learning_rate": 4.90477319624037e-05, + "loss": 0.0057, + "step": 331610 + }, + { + "epoch": 1.67, + "learning_rate": 4.904016426938969e-05, + "loss": 0.0061, + "step": 331620 + }, + { + "epoch": 1.67, + "learning_rate": 4.903259657637568e-05, + "loss": 0.0098, + "step": 331630 + }, + { + "epoch": 1.67, + "learning_rate": 4.902502888336167e-05, + "loss": 0.0059, + "step": 331640 + }, + { + "epoch": 1.67, + "learning_rate": 4.901746119034766e-05, + "loss": 0.0063, + "step": 331650 + }, + { + "epoch": 1.67, + "learning_rate": 4.900989349733365e-05, + "loss": 0.0059, + "step": 331660 + }, + { + "epoch": 1.67, + "learning_rate": 4.900232580431963e-05, + "loss": 0.0053, + "step": 331670 + }, + { + "epoch": 1.67, + "learning_rate": 4.8994758111305624e-05, + "loss": 0.0057, + "step": 331680 + }, + { + "epoch": 1.67, + "learning_rate": 4.898719041829161e-05, + "loss": 0.0047, + "step": 331690 + }, + { + "epoch": 1.67, + "learning_rate": 4.89796227252776e-05, + "loss": 0.0072, + "step": 331700 + }, + { + "epoch": 1.67, + "learning_rate": 4.897205503226359e-05, + "loss": 0.0072, + "step": 331710 + }, + { + "epoch": 1.67, + "learning_rate": 4.8964487339249583e-05, + "loss": 0.006, + "step": 331720 + }, + { + "epoch": 1.67, + "learning_rate": 4.895691964623557e-05, + "loss": 0.0048, + "step": 331730 + }, + { + "epoch": 1.67, + "learning_rate": 4.894935195322156e-05, + "loss": 0.0062, + "step": 331740 + }, + { + "epoch": 1.67, + "learning_rate": 4.894178426020755e-05, + "loss": 0.0061, + "step": 331750 + }, + { + "epoch": 1.67, + "learning_rate": 4.893421656719354e-05, + "loss": 0.006, + "step": 331760 + }, + { + "epoch": 1.67, + "learning_rate": 4.892664887417953e-05, + "loss": 0.0085, + "step": 331770 + }, + { + "epoch": 1.67, + "learning_rate": 4.891908118116552e-05, + "loss": 0.007, + "step": 331780 + }, + { + "epoch": 1.67, + "learning_rate": 4.891151348815151e-05, + "loss": 0.0071, + "step": 331790 + }, + { + "epoch": 1.67, + "learning_rate": 4.89039457951375e-05, + "loss": 0.0085, + "step": 331800 + }, + { + "epoch": 1.67, + "learning_rate": 4.889637810212349e-05, + "loss": 0.0073, + "step": 331810 + }, + { + "epoch": 1.67, + "learning_rate": 4.888881040910948e-05, + "loss": 0.0093, + "step": 331820 + }, + { + "epoch": 1.67, + "learning_rate": 4.888124271609547e-05, + "loss": 0.0111, + "step": 331830 + }, + { + "epoch": 1.67, + "learning_rate": 4.887367502308146e-05, + "loss": 0.0066, + "step": 331840 + }, + { + "epoch": 1.67, + "learning_rate": 4.886610733006745e-05, + "loss": 0.0075, + "step": 331850 + }, + { + "epoch": 1.67, + "learning_rate": 4.885853963705344e-05, + "loss": 0.0053, + "step": 331860 + }, + { + "epoch": 1.67, + "learning_rate": 4.885097194403943e-05, + "loss": 0.008, + "step": 331870 + }, + { + "epoch": 1.67, + "learning_rate": 4.884340425102542e-05, + "loss": 0.0072, + "step": 331880 + }, + { + "epoch": 1.67, + "learning_rate": 4.883583655801141e-05, + "loss": 0.0046, + "step": 331890 + }, + { + "epoch": 1.67, + "learning_rate": 4.88282688649974e-05, + "loss": 0.0066, + "step": 331900 + }, + { + "epoch": 1.67, + "learning_rate": 4.882070117198339e-05, + "loss": 0.0073, + "step": 331910 + }, + { + "epoch": 1.67, + "learning_rate": 4.881313347896938e-05, + "loss": 0.0062, + "step": 331920 + }, + { + "epoch": 1.67, + "learning_rate": 4.880556578595537e-05, + "loss": 0.0063, + "step": 331930 + }, + { + "epoch": 1.67, + "learning_rate": 4.879799809294136e-05, + "loss": 0.0088, + "step": 331940 + }, + { + "epoch": 1.67, + "learning_rate": 4.8790430399927346e-05, + "loss": 0.0054, + "step": 331950 + }, + { + "epoch": 1.67, + "learning_rate": 4.878286270691334e-05, + "loss": 0.0048, + "step": 331960 + }, + { + "epoch": 1.67, + "learning_rate": 4.877529501389933e-05, + "loss": 0.0063, + "step": 331970 + }, + { + "epoch": 1.67, + "learning_rate": 4.876772732088531e-05, + "loss": 0.0073, + "step": 331980 + }, + { + "epoch": 1.67, + "learning_rate": 4.87601596278713e-05, + "loss": 0.0064, + "step": 331990 + }, + { + "epoch": 1.67, + "learning_rate": 4.875259193485729e-05, + "loss": 0.0059, + "step": 332000 + }, + { + "epoch": 1.67, + "eval_cer": 0.9144421144155256, + "eval_loss": 0.004793255589902401, + "eval_runtime": 116.2412, + "eval_samples_per_second": 17.206, + "eval_steps_per_second": 4.301, + "step": 332000 + }, + { + "epoch": 1.68, + "learning_rate": 4.874502424184328e-05, + "loss": 0.0078, + "step": 332010 + }, + { + "epoch": 1.68, + "learning_rate": 4.873745654882927e-05, + "loss": 0.0072, + "step": 332020 + }, + { + "epoch": 1.68, + "learning_rate": 4.872988885581526e-05, + "loss": 0.0064, + "step": 332030 + }, + { + "epoch": 1.68, + "learning_rate": 4.8722321162801254e-05, + "loss": 0.0058, + "step": 332040 + }, + { + "epoch": 1.68, + "learning_rate": 4.871475346978724e-05, + "loss": 0.0059, + "step": 332050 + }, + { + "epoch": 1.68, + "learning_rate": 4.870718577677323e-05, + "loss": 0.0055, + "step": 332060 + }, + { + "epoch": 1.68, + "learning_rate": 4.869961808375922e-05, + "loss": 0.0055, + "step": 332070 + }, + { + "epoch": 1.68, + "learning_rate": 4.8692050390745214e-05, + "loss": 0.0047, + "step": 332080 + }, + { + "epoch": 1.68, + "learning_rate": 4.86844826977312e-05, + "loss": 0.0085, + "step": 332090 + }, + { + "epoch": 1.68, + "learning_rate": 4.867691500471719e-05, + "loss": 0.0058, + "step": 332100 + }, + { + "epoch": 1.68, + "learning_rate": 4.866934731170318e-05, + "loss": 0.0076, + "step": 332110 + }, + { + "epoch": 1.68, + "learning_rate": 4.866177961868917e-05, + "loss": 0.0057, + "step": 332120 + }, + { + "epoch": 1.68, + "learning_rate": 4.865421192567516e-05, + "loss": 0.0072, + "step": 332130 + }, + { + "epoch": 1.68, + "learning_rate": 4.864664423266115e-05, + "loss": 0.0079, + "step": 332140 + }, + { + "epoch": 1.68, + "learning_rate": 4.863907653964714e-05, + "loss": 0.0051, + "step": 332150 + }, + { + "epoch": 1.68, + "learning_rate": 4.863150884663313e-05, + "loss": 0.0096, + "step": 332160 + }, + { + "epoch": 1.68, + "learning_rate": 4.862394115361912e-05, + "loss": 0.0077, + "step": 332170 + }, + { + "epoch": 1.68, + "learning_rate": 4.861637346060511e-05, + "loss": 0.0078, + "step": 332180 + }, + { + "epoch": 1.68, + "learning_rate": 4.86088057675911e-05, + "loss": 0.0073, + "step": 332190 + }, + { + "epoch": 1.68, + "learning_rate": 4.860123807457709e-05, + "loss": 0.006, + "step": 332200 + }, + { + "epoch": 1.68, + "learning_rate": 4.859367038156308e-05, + "loss": 0.007, + "step": 332210 + }, + { + "epoch": 1.68, + "learning_rate": 4.858610268854907e-05, + "loss": 0.006, + "step": 332220 + }, + { + "epoch": 1.68, + "learning_rate": 4.857853499553506e-05, + "loss": 0.0058, + "step": 332230 + }, + { + "epoch": 1.68, + "learning_rate": 4.857096730252105e-05, + "loss": 0.0128, + "step": 332240 + }, + { + "epoch": 1.68, + "learning_rate": 4.856339960950704e-05, + "loss": 0.0053, + "step": 332250 + }, + { + "epoch": 1.68, + "learning_rate": 4.855583191649303e-05, + "loss": 0.0079, + "step": 332260 + }, + { + "epoch": 1.68, + "learning_rate": 4.854826422347902e-05, + "loss": 0.0048, + "step": 332270 + }, + { + "epoch": 1.68, + "learning_rate": 4.854069653046501e-05, + "loss": 0.0041, + "step": 332280 + }, + { + "epoch": 1.68, + "learning_rate": 4.853312883745099e-05, + "loss": 0.0061, + "step": 332290 + }, + { + "epoch": 1.68, + "learning_rate": 4.852556114443698e-05, + "loss": 0.0059, + "step": 332300 + }, + { + "epoch": 1.68, + "learning_rate": 4.851799345142297e-05, + "loss": 0.0077, + "step": 332310 + }, + { + "epoch": 1.68, + "learning_rate": 4.851042575840896e-05, + "loss": 0.0062, + "step": 332320 + }, + { + "epoch": 1.68, + "learning_rate": 4.850285806539495e-05, + "loss": 0.0076, + "step": 332330 + }, + { + "epoch": 1.68, + "learning_rate": 4.849529037238094e-05, + "loss": 0.0054, + "step": 332340 + }, + { + "epoch": 1.68, + "learning_rate": 4.848772267936693e-05, + "loss": 0.0063, + "step": 332350 + }, + { + "epoch": 1.68, + "learning_rate": 4.848015498635292e-05, + "loss": 0.0049, + "step": 332360 + }, + { + "epoch": 1.68, + "learning_rate": 4.847258729333891e-05, + "loss": 0.0073, + "step": 332370 + }, + { + "epoch": 1.68, + "learning_rate": 4.84650196003249e-05, + "loss": 0.0047, + "step": 332380 + }, + { + "epoch": 1.68, + "learning_rate": 4.845745190731089e-05, + "loss": 0.0057, + "step": 332390 + }, + { + "epoch": 1.68, + "learning_rate": 4.844988421429688e-05, + "loss": 0.0062, + "step": 332400 + }, + { + "epoch": 1.68, + "learning_rate": 4.844231652128287e-05, + "loss": 0.0053, + "step": 332410 + }, + { + "epoch": 1.68, + "learning_rate": 4.843474882826886e-05, + "loss": 0.0067, + "step": 332420 + }, + { + "epoch": 1.68, + "learning_rate": 4.842718113525485e-05, + "loss": 0.0082, + "step": 332430 + }, + { + "epoch": 1.68, + "learning_rate": 4.841961344224084e-05, + "loss": 0.0077, + "step": 332440 + }, + { + "epoch": 1.68, + "learning_rate": 4.841204574922683e-05, + "loss": 0.0062, + "step": 332450 + }, + { + "epoch": 1.68, + "learning_rate": 4.840447805621282e-05, + "loss": 0.0062, + "step": 332460 + }, + { + "epoch": 1.68, + "learning_rate": 4.839691036319881e-05, + "loss": 0.0064, + "step": 332470 + }, + { + "epoch": 1.68, + "learning_rate": 4.8389342670184797e-05, + "loss": 0.0048, + "step": 332480 + }, + { + "epoch": 1.68, + "learning_rate": 4.838177497717079e-05, + "loss": 0.0069, + "step": 332490 + }, + { + "epoch": 1.68, + "learning_rate": 4.837420728415678e-05, + "loss": 0.0083, + "step": 332500 + }, + { + "epoch": 1.68, + "learning_rate": 4.836663959114277e-05, + "loss": 0.0052, + "step": 332510 + }, + { + "epoch": 1.68, + "learning_rate": 4.8359071898128756e-05, + "loss": 0.0063, + "step": 332520 + }, + { + "epoch": 1.68, + "learning_rate": 4.835150420511475e-05, + "loss": 0.0067, + "step": 332530 + }, + { + "epoch": 1.68, + "learning_rate": 4.834393651210074e-05, + "loss": 0.0063, + "step": 332540 + }, + { + "epoch": 1.68, + "learning_rate": 4.833636881908673e-05, + "loss": 0.0054, + "step": 332550 + }, + { + "epoch": 1.68, + "learning_rate": 4.832880112607272e-05, + "loss": 0.0073, + "step": 332560 + }, + { + "epoch": 1.68, + "learning_rate": 4.832123343305871e-05, + "loss": 0.0052, + "step": 332570 + }, + { + "epoch": 1.68, + "learning_rate": 4.83136657400447e-05, + "loss": 0.006, + "step": 332580 + }, + { + "epoch": 1.68, + "learning_rate": 4.830609804703069e-05, + "loss": 0.0072, + "step": 332590 + }, + { + "epoch": 1.68, + "learning_rate": 4.829853035401668e-05, + "loss": 0.0064, + "step": 332600 + }, + { + "epoch": 1.68, + "learning_rate": 4.8290962661002664e-05, + "loss": 0.0056, + "step": 332610 + }, + { + "epoch": 1.68, + "learning_rate": 4.828339496798865e-05, + "loss": 0.0087, + "step": 332620 + }, + { + "epoch": 1.68, + "learning_rate": 4.827582727497464e-05, + "loss": 0.0063, + "step": 332630 + }, + { + "epoch": 1.68, + "learning_rate": 4.826825958196063e-05, + "loss": 0.0065, + "step": 332640 + }, + { + "epoch": 1.68, + "learning_rate": 4.826069188894662e-05, + "loss": 0.0103, + "step": 332650 + }, + { + "epoch": 1.68, + "learning_rate": 4.825312419593261e-05, + "loss": 0.0067, + "step": 332660 + }, + { + "epoch": 1.68, + "learning_rate": 4.82455565029186e-05, + "loss": 0.0058, + "step": 332670 + }, + { + "epoch": 1.68, + "learning_rate": 4.823798880990459e-05, + "loss": 0.0103, + "step": 332680 + }, + { + "epoch": 1.68, + "learning_rate": 4.823042111689058e-05, + "loss": 0.0078, + "step": 332690 + }, + { + "epoch": 1.68, + "learning_rate": 4.822285342387657e-05, + "loss": 0.0063, + "step": 332700 + }, + { + "epoch": 1.68, + "learning_rate": 4.821528573086256e-05, + "loss": 0.0053, + "step": 332710 + }, + { + "epoch": 1.68, + "learning_rate": 4.820771803784855e-05, + "loss": 0.0062, + "step": 332720 + }, + { + "epoch": 1.68, + "learning_rate": 4.820015034483454e-05, + "loss": 0.006, + "step": 332730 + }, + { + "epoch": 1.68, + "learning_rate": 4.819258265182053e-05, + "loss": 0.0092, + "step": 332740 + }, + { + "epoch": 1.68, + "learning_rate": 4.818501495880652e-05, + "loss": 0.0075, + "step": 332750 + }, + { + "epoch": 1.68, + "learning_rate": 4.817744726579251e-05, + "loss": 0.0056, + "step": 332760 + }, + { + "epoch": 1.68, + "learning_rate": 4.81698795727785e-05, + "loss": 0.0045, + "step": 332770 + }, + { + "epoch": 1.68, + "learning_rate": 4.816231187976449e-05, + "loss": 0.0064, + "step": 332780 + }, + { + "epoch": 1.68, + "learning_rate": 4.815474418675048e-05, + "loss": 0.0082, + "step": 332790 + }, + { + "epoch": 1.68, + "learning_rate": 4.814717649373647e-05, + "loss": 0.0057, + "step": 332800 + }, + { + "epoch": 1.68, + "learning_rate": 4.813960880072246e-05, + "loss": 0.0071, + "step": 332810 + }, + { + "epoch": 1.68, + "learning_rate": 4.813204110770845e-05, + "loss": 0.0075, + "step": 332820 + }, + { + "epoch": 1.68, + "learning_rate": 4.812447341469444e-05, + "loss": 0.0053, + "step": 332830 + }, + { + "epoch": 1.68, + "learning_rate": 4.8116905721680427e-05, + "loss": 0.0061, + "step": 332840 + }, + { + "epoch": 1.68, + "learning_rate": 4.810933802866642e-05, + "loss": 0.0057, + "step": 332850 + }, + { + "epoch": 1.68, + "learning_rate": 4.810177033565241e-05, + "loss": 0.0053, + "step": 332860 + }, + { + "epoch": 1.68, + "learning_rate": 4.80942026426384e-05, + "loss": 0.0063, + "step": 332870 + }, + { + "epoch": 1.68, + "learning_rate": 4.8086634949624386e-05, + "loss": 0.0077, + "step": 332880 + }, + { + "epoch": 1.68, + "learning_rate": 4.807906725661038e-05, + "loss": 0.0077, + "step": 332890 + }, + { + "epoch": 1.68, + "learning_rate": 4.807149956359637e-05, + "loss": 0.0059, + "step": 332900 + }, + { + "epoch": 1.68, + "learning_rate": 4.806393187058236e-05, + "loss": 0.0076, + "step": 332910 + }, + { + "epoch": 1.68, + "learning_rate": 4.805636417756834e-05, + "loss": 0.0043, + "step": 332920 + }, + { + "epoch": 1.68, + "learning_rate": 4.804879648455433e-05, + "loss": 0.0062, + "step": 332930 + }, + { + "epoch": 1.68, + "learning_rate": 4.804122879154032e-05, + "loss": 0.0071, + "step": 332940 + }, + { + "epoch": 1.68, + "learning_rate": 4.803366109852631e-05, + "loss": 0.0102, + "step": 332950 + }, + { + "epoch": 1.68, + "learning_rate": 4.80260934055123e-05, + "loss": 0.0053, + "step": 332960 + }, + { + "epoch": 1.68, + "learning_rate": 4.801852571249829e-05, + "loss": 0.0071, + "step": 332970 + }, + { + "epoch": 1.68, + "learning_rate": 4.801095801948428e-05, + "loss": 0.005, + "step": 332980 + }, + { + "epoch": 1.68, + "learning_rate": 4.800339032647027e-05, + "loss": 0.0076, + "step": 332990 + }, + { + "epoch": 1.68, + "learning_rate": 4.799582263345626e-05, + "loss": 0.0072, + "step": 333000 + }, + { + "epoch": 1.68, + "eval_cer": 0.9144343512465224, + "eval_loss": 0.004823221359401941, + "eval_runtime": 116.4518, + "eval_samples_per_second": 17.174, + "eval_steps_per_second": 4.294, + "step": 333000 + }, + { + "epoch": 1.68, + "learning_rate": 4.7988254940442253e-05, + "loss": 0.0063, + "step": 333010 + }, + { + "epoch": 1.68, + "learning_rate": 4.798068724742824e-05, + "loss": 0.0085, + "step": 333020 + }, + { + "epoch": 1.68, + "learning_rate": 4.797311955441423e-05, + "loss": 0.0098, + "step": 333030 + }, + { + "epoch": 1.68, + "learning_rate": 4.796555186140022e-05, + "loss": 0.0063, + "step": 333040 + }, + { + "epoch": 1.68, + "learning_rate": 4.795798416838621e-05, + "loss": 0.007, + "step": 333050 + }, + { + "epoch": 1.68, + "learning_rate": 4.79504164753722e-05, + "loss": 0.0047, + "step": 333060 + }, + { + "epoch": 1.68, + "learning_rate": 4.794284878235819e-05, + "loss": 0.0058, + "step": 333070 + }, + { + "epoch": 1.68, + "learning_rate": 4.793528108934418e-05, + "loss": 0.0054, + "step": 333080 + }, + { + "epoch": 1.68, + "learning_rate": 4.792771339633017e-05, + "loss": 0.005, + "step": 333090 + }, + { + "epoch": 1.68, + "learning_rate": 4.792014570331616e-05, + "loss": 0.0067, + "step": 333100 + }, + { + "epoch": 1.68, + "learning_rate": 4.791257801030215e-05, + "loss": 0.0078, + "step": 333110 + }, + { + "epoch": 1.68, + "learning_rate": 4.790501031728814e-05, + "loss": 0.0058, + "step": 333120 + }, + { + "epoch": 1.68, + "learning_rate": 4.789744262427413e-05, + "loss": 0.0052, + "step": 333130 + }, + { + "epoch": 1.68, + "learning_rate": 4.788987493126012e-05, + "loss": 0.0071, + "step": 333140 + }, + { + "epoch": 1.68, + "learning_rate": 4.788230723824611e-05, + "loss": 0.0071, + "step": 333150 + }, + { + "epoch": 1.68, + "learning_rate": 4.78747395452321e-05, + "loss": 0.0076, + "step": 333160 + }, + { + "epoch": 1.68, + "learning_rate": 4.786717185221809e-05, + "loss": 0.0059, + "step": 333170 + }, + { + "epoch": 1.68, + "learning_rate": 4.785960415920408e-05, + "loss": 0.0061, + "step": 333180 + }, + { + "epoch": 1.68, + "learning_rate": 4.785203646619007e-05, + "loss": 0.0063, + "step": 333190 + }, + { + "epoch": 1.68, + "learning_rate": 4.784446877317606e-05, + "loss": 0.0068, + "step": 333200 + }, + { + "epoch": 1.68, + "learning_rate": 4.783690108016205e-05, + "loss": 0.0064, + "step": 333210 + }, + { + "epoch": 1.68, + "learning_rate": 4.782933338714804e-05, + "loss": 0.0055, + "step": 333220 + }, + { + "epoch": 1.68, + "learning_rate": 4.782176569413403e-05, + "loss": 0.009, + "step": 333230 + }, + { + "epoch": 1.68, + "learning_rate": 4.781419800112001e-05, + "loss": 0.0056, + "step": 333240 + }, + { + "epoch": 1.68, + "learning_rate": 4.7806630308106e-05, + "loss": 0.0065, + "step": 333250 + }, + { + "epoch": 1.68, + "learning_rate": 4.779906261509199e-05, + "loss": 0.0059, + "step": 333260 + }, + { + "epoch": 1.68, + "learning_rate": 4.779149492207798e-05, + "loss": 0.0052, + "step": 333270 + }, + { + "epoch": 1.68, + "learning_rate": 4.778392722906397e-05, + "loss": 0.007, + "step": 333280 + }, + { + "epoch": 1.68, + "learning_rate": 4.777635953604996e-05, + "loss": 0.0054, + "step": 333290 + }, + { + "epoch": 1.68, + "learning_rate": 4.776879184303595e-05, + "loss": 0.0061, + "step": 333300 + }, + { + "epoch": 1.68, + "learning_rate": 4.776122415002194e-05, + "loss": 0.0083, + "step": 333310 + }, + { + "epoch": 1.68, + "learning_rate": 4.775365645700793e-05, + "loss": 0.0088, + "step": 333320 + }, + { + "epoch": 1.68, + "learning_rate": 4.774608876399392e-05, + "loss": 0.0064, + "step": 333330 + }, + { + "epoch": 1.68, + "learning_rate": 4.773852107097991e-05, + "loss": 0.0067, + "step": 333340 + }, + { + "epoch": 1.68, + "learning_rate": 4.77309533779659e-05, + "loss": 0.0057, + "step": 333350 + }, + { + "epoch": 1.68, + "learning_rate": 4.772338568495189e-05, + "loss": 0.0064, + "step": 333360 + }, + { + "epoch": 1.68, + "learning_rate": 4.771581799193788e-05, + "loss": 0.0083, + "step": 333370 + }, + { + "epoch": 1.68, + "learning_rate": 4.770825029892387e-05, + "loss": 0.0071, + "step": 333380 + }, + { + "epoch": 1.68, + "learning_rate": 4.770068260590986e-05, + "loss": 0.007, + "step": 333390 + }, + { + "epoch": 1.68, + "learning_rate": 4.769311491289585e-05, + "loss": 0.0073, + "step": 333400 + }, + { + "epoch": 1.68, + "learning_rate": 4.7685547219881836e-05, + "loss": 0.0054, + "step": 333410 + }, + { + "epoch": 1.68, + "learning_rate": 4.767797952686783e-05, + "loss": 0.0053, + "step": 333420 + }, + { + "epoch": 1.68, + "learning_rate": 4.767041183385382e-05, + "loss": 0.0076, + "step": 333430 + }, + { + "epoch": 1.68, + "learning_rate": 4.766284414083981e-05, + "loss": 0.0068, + "step": 333440 + }, + { + "epoch": 1.68, + "learning_rate": 4.7655276447825796e-05, + "loss": 0.0053, + "step": 333450 + }, + { + "epoch": 1.68, + "learning_rate": 4.764770875481179e-05, + "loss": 0.0062, + "step": 333460 + }, + { + "epoch": 1.68, + "learning_rate": 4.764014106179778e-05, + "loss": 0.0041, + "step": 333470 + }, + { + "epoch": 1.68, + "learning_rate": 4.763257336878377e-05, + "loss": 0.0063, + "step": 333480 + }, + { + "epoch": 1.68, + "learning_rate": 4.7625005675769756e-05, + "loss": 0.0047, + "step": 333490 + }, + { + "epoch": 1.68, + "learning_rate": 4.761743798275575e-05, + "loss": 0.0067, + "step": 333500 + }, + { + "epoch": 1.68, + "learning_rate": 4.760987028974174e-05, + "loss": 0.0066, + "step": 333510 + }, + { + "epoch": 1.68, + "learning_rate": 4.760230259672773e-05, + "loss": 0.0079, + "step": 333520 + }, + { + "epoch": 1.68, + "learning_rate": 4.759473490371372e-05, + "loss": 0.0053, + "step": 333530 + }, + { + "epoch": 1.68, + "learning_rate": 4.758716721069971e-05, + "loss": 0.0076, + "step": 333540 + }, + { + "epoch": 1.68, + "learning_rate": 4.757959951768569e-05, + "loss": 0.0054, + "step": 333550 + }, + { + "epoch": 1.68, + "learning_rate": 4.757203182467168e-05, + "loss": 0.0064, + "step": 333560 + }, + { + "epoch": 1.68, + "learning_rate": 4.756446413165767e-05, + "loss": 0.0072, + "step": 333570 + }, + { + "epoch": 1.68, + "learning_rate": 4.755689643864366e-05, + "loss": 0.0075, + "step": 333580 + }, + { + "epoch": 1.68, + "learning_rate": 4.754932874562965e-05, + "loss": 0.0073, + "step": 333590 + }, + { + "epoch": 1.68, + "learning_rate": 4.754176105261564e-05, + "loss": 0.005, + "step": 333600 + }, + { + "epoch": 1.68, + "learning_rate": 4.753419335960163e-05, + "loss": 0.0054, + "step": 333610 + }, + { + "epoch": 1.68, + "learning_rate": 4.752662566658762e-05, + "loss": 0.0049, + "step": 333620 + }, + { + "epoch": 1.68, + "learning_rate": 4.751905797357361e-05, + "loss": 0.0068, + "step": 333630 + }, + { + "epoch": 1.68, + "learning_rate": 4.75114902805596e-05, + "loss": 0.0076, + "step": 333640 + }, + { + "epoch": 1.68, + "learning_rate": 4.750392258754559e-05, + "loss": 0.0063, + "step": 333650 + }, + { + "epoch": 1.68, + "learning_rate": 4.749635489453158e-05, + "loss": 0.006, + "step": 333660 + }, + { + "epoch": 1.68, + "learning_rate": 4.748878720151757e-05, + "loss": 0.0072, + "step": 333670 + }, + { + "epoch": 1.68, + "learning_rate": 4.748121950850356e-05, + "loss": 0.0076, + "step": 333680 + }, + { + "epoch": 1.68, + "learning_rate": 4.747365181548955e-05, + "loss": 0.0061, + "step": 333690 + }, + { + "epoch": 1.68, + "learning_rate": 4.746608412247554e-05, + "loss": 0.0067, + "step": 333700 + }, + { + "epoch": 1.68, + "learning_rate": 4.745851642946153e-05, + "loss": 0.0062, + "step": 333710 + }, + { + "epoch": 1.68, + "learning_rate": 4.745094873644752e-05, + "loss": 0.0057, + "step": 333720 + }, + { + "epoch": 1.68, + "learning_rate": 4.744338104343351e-05, + "loss": 0.006, + "step": 333730 + }, + { + "epoch": 1.68, + "learning_rate": 4.74358133504195e-05, + "loss": 0.0053, + "step": 333740 + }, + { + "epoch": 1.68, + "learning_rate": 4.742824565740549e-05, + "loss": 0.0064, + "step": 333750 + }, + { + "epoch": 1.68, + "learning_rate": 4.742067796439148e-05, + "loss": 0.0058, + "step": 333760 + }, + { + "epoch": 1.68, + "learning_rate": 4.7413110271377466e-05, + "loss": 0.0072, + "step": 333770 + }, + { + "epoch": 1.68, + "learning_rate": 4.740554257836346e-05, + "loss": 0.0066, + "step": 333780 + }, + { + "epoch": 1.68, + "learning_rate": 4.739797488534945e-05, + "loss": 0.0058, + "step": 333790 + }, + { + "epoch": 1.68, + "learning_rate": 4.739040719233544e-05, + "loss": 0.0045, + "step": 333800 + }, + { + "epoch": 1.68, + "learning_rate": 4.7382839499321426e-05, + "loss": 0.0066, + "step": 333810 + }, + { + "epoch": 1.68, + "learning_rate": 4.737527180630742e-05, + "loss": 0.0061, + "step": 333820 + }, + { + "epoch": 1.68, + "learning_rate": 4.736770411329341e-05, + "loss": 0.0084, + "step": 333830 + }, + { + "epoch": 1.68, + "learning_rate": 4.73601364202794e-05, + "loss": 0.0077, + "step": 333840 + }, + { + "epoch": 1.68, + "learning_rate": 4.7352568727265386e-05, + "loss": 0.0063, + "step": 333850 + }, + { + "epoch": 1.68, + "learning_rate": 4.734500103425138e-05, + "loss": 0.0057, + "step": 333860 + }, + { + "epoch": 1.68, + "learning_rate": 4.733743334123736e-05, + "loss": 0.0069, + "step": 333870 + }, + { + "epoch": 1.68, + "learning_rate": 4.732986564822335e-05, + "loss": 0.0082, + "step": 333880 + }, + { + "epoch": 1.68, + "learning_rate": 4.732229795520934e-05, + "loss": 0.0067, + "step": 333890 + }, + { + "epoch": 1.68, + "learning_rate": 4.731473026219533e-05, + "loss": 0.0067, + "step": 333900 + }, + { + "epoch": 1.68, + "learning_rate": 4.730716256918132e-05, + "loss": 0.0056, + "step": 333910 + }, + { + "epoch": 1.68, + "learning_rate": 4.729959487616731e-05, + "loss": 0.0071, + "step": 333920 + }, + { + "epoch": 1.68, + "learning_rate": 4.72920271831533e-05, + "loss": 0.0055, + "step": 333930 + }, + { + "epoch": 1.68, + "learning_rate": 4.7284459490139287e-05, + "loss": 0.0058, + "step": 333940 + }, + { + "epoch": 1.68, + "learning_rate": 4.727689179712528e-05, + "loss": 0.0054, + "step": 333950 + }, + { + "epoch": 1.68, + "learning_rate": 4.726932410411127e-05, + "loss": 0.0055, + "step": 333960 + }, + { + "epoch": 1.68, + "learning_rate": 4.726175641109726e-05, + "loss": 0.0065, + "step": 333970 + }, + { + "epoch": 1.68, + "learning_rate": 4.725418871808325e-05, + "loss": 0.0061, + "step": 333980 + }, + { + "epoch": 1.69, + "learning_rate": 4.724662102506924e-05, + "loss": 0.0064, + "step": 333990 + }, + { + "epoch": 1.69, + "learning_rate": 4.723905333205523e-05, + "loss": 0.0081, + "step": 334000 + }, + { + "epoch": 1.69, + "eval_cer": 0.9144139729278888, + "eval_loss": 0.004758420865982771, + "eval_runtime": 116.3871, + "eval_samples_per_second": 17.184, + "eval_steps_per_second": 4.296, + "step": 334000 + }, + { + "epoch": 1.69, + "learning_rate": 4.723148563904122e-05, + "loss": 0.0067, + "step": 334010 + }, + { + "epoch": 1.69, + "learning_rate": 4.722391794602721e-05, + "loss": 0.0079, + "step": 334020 + }, + { + "epoch": 1.69, + "learning_rate": 4.72163502530132e-05, + "loss": 0.0056, + "step": 334030 + }, + { + "epoch": 1.69, + "learning_rate": 4.720878255999919e-05, + "loss": 0.0057, + "step": 334040 + }, + { + "epoch": 1.69, + "learning_rate": 4.720121486698518e-05, + "loss": 0.0066, + "step": 334050 + }, + { + "epoch": 1.69, + "learning_rate": 4.719364717397117e-05, + "loss": 0.0047, + "step": 334060 + }, + { + "epoch": 1.69, + "learning_rate": 4.718607948095716e-05, + "loss": 0.0055, + "step": 334070 + }, + { + "epoch": 1.69, + "learning_rate": 4.717851178794315e-05, + "loss": 0.0054, + "step": 334080 + }, + { + "epoch": 1.69, + "learning_rate": 4.717094409492914e-05, + "loss": 0.0056, + "step": 334090 + }, + { + "epoch": 1.69, + "learning_rate": 4.716337640191513e-05, + "loss": 0.0063, + "step": 334100 + }, + { + "epoch": 1.69, + "learning_rate": 4.715580870890112e-05, + "loss": 0.0049, + "step": 334110 + }, + { + "epoch": 1.69, + "learning_rate": 4.714824101588711e-05, + "loss": 0.0084, + "step": 334120 + }, + { + "epoch": 1.69, + "learning_rate": 4.7140673322873097e-05, + "loss": 0.0062, + "step": 334130 + }, + { + "epoch": 1.69, + "learning_rate": 4.713310562985909e-05, + "loss": 0.0079, + "step": 334140 + }, + { + "epoch": 1.69, + "learning_rate": 4.712553793684508e-05, + "loss": 0.0068, + "step": 334150 + }, + { + "epoch": 1.69, + "learning_rate": 4.711797024383107e-05, + "loss": 0.005, + "step": 334160 + }, + { + "epoch": 1.69, + "learning_rate": 4.7110402550817056e-05, + "loss": 0.0062, + "step": 334170 + }, + { + "epoch": 1.69, + "learning_rate": 4.710283485780304e-05, + "loss": 0.0061, + "step": 334180 + }, + { + "epoch": 1.69, + "learning_rate": 4.709526716478903e-05, + "loss": 0.0077, + "step": 334190 + }, + { + "epoch": 1.69, + "learning_rate": 4.708769947177502e-05, + "loss": 0.0071, + "step": 334200 + }, + { + "epoch": 1.69, + "learning_rate": 4.708013177876101e-05, + "loss": 0.0054, + "step": 334210 + }, + { + "epoch": 1.69, + "learning_rate": 4.7072564085747e-05, + "loss": 0.0055, + "step": 334220 + }, + { + "epoch": 1.69, + "learning_rate": 4.706499639273299e-05, + "loss": 0.0054, + "step": 334230 + }, + { + "epoch": 1.69, + "learning_rate": 4.705742869971898e-05, + "loss": 0.0063, + "step": 334240 + }, + { + "epoch": 1.69, + "learning_rate": 4.704986100670497e-05, + "loss": 0.0072, + "step": 334250 + }, + { + "epoch": 1.69, + "learning_rate": 4.704229331369096e-05, + "loss": 0.0065, + "step": 334260 + }, + { + "epoch": 1.69, + "learning_rate": 4.703472562067695e-05, + "loss": 0.0057, + "step": 334270 + }, + { + "epoch": 1.69, + "learning_rate": 4.702715792766294e-05, + "loss": 0.007, + "step": 334280 + }, + { + "epoch": 1.69, + "learning_rate": 4.701959023464893e-05, + "loss": 0.0077, + "step": 334290 + }, + { + "epoch": 1.69, + "learning_rate": 4.7012022541634917e-05, + "loss": 0.0053, + "step": 334300 + }, + { + "epoch": 1.69, + "learning_rate": 4.700445484862091e-05, + "loss": 0.0077, + "step": 334310 + }, + { + "epoch": 1.69, + "learning_rate": 4.69968871556069e-05, + "loss": 0.006, + "step": 334320 + }, + { + "epoch": 1.69, + "learning_rate": 4.698931946259289e-05, + "loss": 0.0054, + "step": 334330 + }, + { + "epoch": 1.69, + "learning_rate": 4.6981751769578876e-05, + "loss": 0.007, + "step": 334340 + }, + { + "epoch": 1.69, + "learning_rate": 4.697418407656487e-05, + "loss": 0.0092, + "step": 334350 + }, + { + "epoch": 1.69, + "learning_rate": 4.696661638355086e-05, + "loss": 0.0062, + "step": 334360 + }, + { + "epoch": 1.69, + "learning_rate": 4.695904869053685e-05, + "loss": 0.0054, + "step": 334370 + }, + { + "epoch": 1.69, + "learning_rate": 4.6951480997522836e-05, + "loss": 0.0071, + "step": 334380 + }, + { + "epoch": 1.69, + "learning_rate": 4.694391330450883e-05, + "loss": 0.0065, + "step": 334390 + }, + { + "epoch": 1.69, + "learning_rate": 4.693634561149482e-05, + "loss": 0.0054, + "step": 334400 + }, + { + "epoch": 1.69, + "learning_rate": 4.692877791848081e-05, + "loss": 0.0058, + "step": 334410 + }, + { + "epoch": 1.69, + "learning_rate": 4.6921210225466796e-05, + "loss": 0.0064, + "step": 334420 + }, + { + "epoch": 1.69, + "learning_rate": 4.691364253245279e-05, + "loss": 0.0092, + "step": 334430 + }, + { + "epoch": 1.69, + "learning_rate": 4.690607483943878e-05, + "loss": 0.0063, + "step": 334440 + }, + { + "epoch": 1.69, + "learning_rate": 4.689850714642477e-05, + "loss": 0.007, + "step": 334450 + }, + { + "epoch": 1.69, + "learning_rate": 4.6890939453410755e-05, + "loss": 0.008, + "step": 334460 + }, + { + "epoch": 1.69, + "learning_rate": 4.688337176039675e-05, + "loss": 0.0057, + "step": 334470 + }, + { + "epoch": 1.69, + "learning_rate": 4.687580406738274e-05, + "loss": 0.0063, + "step": 334480 + }, + { + "epoch": 1.69, + "learning_rate": 4.686823637436872e-05, + "loss": 0.007, + "step": 334490 + }, + { + "epoch": 1.69, + "learning_rate": 4.686066868135471e-05, + "loss": 0.005, + "step": 334500 + }, + { + "epoch": 1.69, + "learning_rate": 4.68531009883407e-05, + "loss": 0.0052, + "step": 334510 + }, + { + "epoch": 1.69, + "learning_rate": 4.684553329532669e-05, + "loss": 0.0083, + "step": 334520 + }, + { + "epoch": 1.69, + "learning_rate": 4.683796560231268e-05, + "loss": 0.0053, + "step": 334530 + }, + { + "epoch": 1.69, + "learning_rate": 4.683039790929867e-05, + "loss": 0.0062, + "step": 334540 + }, + { + "epoch": 1.69, + "learning_rate": 4.682283021628466e-05, + "loss": 0.0061, + "step": 334550 + }, + { + "epoch": 1.69, + "learning_rate": 4.681526252327065e-05, + "loss": 0.0077, + "step": 334560 + }, + { + "epoch": 1.69, + "learning_rate": 4.680769483025664e-05, + "loss": 0.0069, + "step": 334570 + }, + { + "epoch": 1.69, + "learning_rate": 4.680012713724263e-05, + "loss": 0.0068, + "step": 334580 + }, + { + "epoch": 1.69, + "learning_rate": 4.679255944422862e-05, + "loss": 0.0057, + "step": 334590 + }, + { + "epoch": 1.69, + "learning_rate": 4.678499175121461e-05, + "loss": 0.0062, + "step": 334600 + }, + { + "epoch": 1.69, + "learning_rate": 4.67774240582006e-05, + "loss": 0.0063, + "step": 334610 + }, + { + "epoch": 1.69, + "learning_rate": 4.676985636518659e-05, + "loss": 0.0067, + "step": 334620 + }, + { + "epoch": 1.69, + "learning_rate": 4.676228867217258e-05, + "loss": 0.0064, + "step": 334630 + }, + { + "epoch": 1.69, + "learning_rate": 4.675472097915857e-05, + "loss": 0.0065, + "step": 334640 + }, + { + "epoch": 1.69, + "learning_rate": 4.674715328614456e-05, + "loss": 0.0052, + "step": 334650 + }, + { + "epoch": 1.69, + "learning_rate": 4.673958559313055e-05, + "loss": 0.0077, + "step": 334660 + }, + { + "epoch": 1.69, + "learning_rate": 4.673201790011654e-05, + "loss": 0.0085, + "step": 334670 + }, + { + "epoch": 1.69, + "learning_rate": 4.672445020710253e-05, + "loss": 0.0051, + "step": 334680 + }, + { + "epoch": 1.69, + "learning_rate": 4.671688251408852e-05, + "loss": 0.0065, + "step": 334690 + }, + { + "epoch": 1.69, + "learning_rate": 4.6709314821074506e-05, + "loss": 0.0103, + "step": 334700 + }, + { + "epoch": 1.69, + "learning_rate": 4.67017471280605e-05, + "loss": 0.006, + "step": 334710 + }, + { + "epoch": 1.69, + "learning_rate": 4.669417943504649e-05, + "loss": 0.0038, + "step": 334720 + }, + { + "epoch": 1.69, + "learning_rate": 4.668661174203248e-05, + "loss": 0.0072, + "step": 334730 + }, + { + "epoch": 1.69, + "learning_rate": 4.6679044049018466e-05, + "loss": 0.0054, + "step": 334740 + }, + { + "epoch": 1.69, + "learning_rate": 4.667147635600446e-05, + "loss": 0.0074, + "step": 334750 + }, + { + "epoch": 1.69, + "learning_rate": 4.666390866299045e-05, + "loss": 0.0067, + "step": 334760 + }, + { + "epoch": 1.69, + "learning_rate": 4.665634096997644e-05, + "loss": 0.006, + "step": 334770 + }, + { + "epoch": 1.69, + "learning_rate": 4.6648773276962426e-05, + "loss": 0.0057, + "step": 334780 + }, + { + "epoch": 1.69, + "learning_rate": 4.664120558394842e-05, + "loss": 0.007, + "step": 334790 + }, + { + "epoch": 1.69, + "learning_rate": 4.663363789093441e-05, + "loss": 0.0046, + "step": 334800 + }, + { + "epoch": 1.69, + "learning_rate": 4.662607019792039e-05, + "loss": 0.0064, + "step": 334810 + }, + { + "epoch": 1.69, + "learning_rate": 4.661850250490638e-05, + "loss": 0.0055, + "step": 334820 + }, + { + "epoch": 1.69, + "learning_rate": 4.661093481189237e-05, + "loss": 0.0067, + "step": 334830 + }, + { + "epoch": 1.69, + "learning_rate": 4.660336711887836e-05, + "loss": 0.006, + "step": 334840 + }, + { + "epoch": 1.69, + "learning_rate": 4.659579942586435e-05, + "loss": 0.008, + "step": 334850 + }, + { + "epoch": 1.69, + "learning_rate": 4.658823173285034e-05, + "loss": 0.0054, + "step": 334860 + }, + { + "epoch": 1.69, + "learning_rate": 4.6580664039836326e-05, + "loss": 0.0061, + "step": 334870 + }, + { + "epoch": 1.69, + "learning_rate": 4.657309634682232e-05, + "loss": 0.0051, + "step": 334880 + }, + { + "epoch": 1.69, + "learning_rate": 4.656552865380831e-05, + "loss": 0.0077, + "step": 334890 + }, + { + "epoch": 1.69, + "learning_rate": 4.65579609607943e-05, + "loss": 0.0082, + "step": 334900 + }, + { + "epoch": 1.69, + "learning_rate": 4.6550393267780286e-05, + "loss": 0.0065, + "step": 334910 + }, + { + "epoch": 1.69, + "learning_rate": 4.654282557476628e-05, + "loss": 0.0058, + "step": 334920 + }, + { + "epoch": 1.69, + "learning_rate": 4.653525788175227e-05, + "loss": 0.0081, + "step": 334930 + }, + { + "epoch": 1.69, + "learning_rate": 4.652769018873826e-05, + "loss": 0.0062, + "step": 334940 + }, + { + "epoch": 1.69, + "learning_rate": 4.652012249572425e-05, + "loss": 0.0059, + "step": 334950 + }, + { + "epoch": 1.69, + "learning_rate": 4.651255480271024e-05, + "loss": 0.006, + "step": 334960 + }, + { + "epoch": 1.69, + "learning_rate": 4.650498710969623e-05, + "loss": 0.0077, + "step": 334970 + }, + { + "epoch": 1.69, + "learning_rate": 4.649741941668222e-05, + "loss": 0.0078, + "step": 334980 + }, + { + "epoch": 1.69, + "learning_rate": 4.648985172366821e-05, + "loss": 0.0055, + "step": 334990 + }, + { + "epoch": 1.69, + "learning_rate": 4.64822840306542e-05, + "loss": 0.0063, + "step": 335000 + }, + { + "epoch": 1.69, + "eval_cer": 0.914412032135638, + "eval_loss": 0.004865641705691814, + "eval_runtime": 116.3195, + "eval_samples_per_second": 17.194, + "eval_steps_per_second": 4.299, + "step": 335000 + }, + { + "epoch": 1.69, + "learning_rate": 4.647471633764019e-05, + "loss": 0.0069, + "step": 335010 + }, + { + "epoch": 1.69, + "learning_rate": 4.646714864462618e-05, + "loss": 0.0059, + "step": 335020 + }, + { + "epoch": 1.69, + "learning_rate": 4.645958095161217e-05, + "loss": 0.0082, + "step": 335030 + }, + { + "epoch": 1.69, + "learning_rate": 4.645201325859816e-05, + "loss": 0.0048, + "step": 335040 + }, + { + "epoch": 1.69, + "learning_rate": 4.644444556558415e-05, + "loss": 0.0066, + "step": 335050 + }, + { + "epoch": 1.69, + "learning_rate": 4.6436877872570136e-05, + "loss": 0.0062, + "step": 335060 + }, + { + "epoch": 1.69, + "learning_rate": 4.642931017955613e-05, + "loss": 0.0057, + "step": 335070 + }, + { + "epoch": 1.69, + "learning_rate": 4.642174248654212e-05, + "loss": 0.0091, + "step": 335080 + }, + { + "epoch": 1.69, + "learning_rate": 4.641417479352811e-05, + "loss": 0.0062, + "step": 335090 + }, + { + "epoch": 1.69, + "learning_rate": 4.6406607100514096e-05, + "loss": 0.0069, + "step": 335100 + }, + { + "epoch": 1.69, + "learning_rate": 4.639903940750009e-05, + "loss": 0.0076, + "step": 335110 + }, + { + "epoch": 1.69, + "learning_rate": 4.639147171448607e-05, + "loss": 0.0059, + "step": 335120 + }, + { + "epoch": 1.69, + "learning_rate": 4.638390402147206e-05, + "loss": 0.0074, + "step": 335130 + }, + { + "epoch": 1.69, + "learning_rate": 4.637633632845805e-05, + "loss": 0.0059, + "step": 335140 + }, + { + "epoch": 1.69, + "learning_rate": 4.636876863544404e-05, + "loss": 0.0051, + "step": 335150 + }, + { + "epoch": 1.69, + "learning_rate": 4.636120094243003e-05, + "loss": 0.0076, + "step": 335160 + }, + { + "epoch": 1.69, + "learning_rate": 4.635363324941602e-05, + "loss": 0.0045, + "step": 335170 + }, + { + "epoch": 1.69, + "learning_rate": 4.634606555640201e-05, + "loss": 0.0079, + "step": 335180 + }, + { + "epoch": 1.69, + "learning_rate": 4.6338497863388e-05, + "loss": 0.0068, + "step": 335190 + }, + { + "epoch": 1.69, + "learning_rate": 4.633093017037399e-05, + "loss": 0.0057, + "step": 335200 + }, + { + "epoch": 1.69, + "learning_rate": 4.632336247735998e-05, + "loss": 0.0059, + "step": 335210 + }, + { + "epoch": 1.69, + "learning_rate": 4.631579478434597e-05, + "loss": 0.0055, + "step": 335220 + }, + { + "epoch": 1.69, + "learning_rate": 4.6308227091331956e-05, + "loss": 0.006, + "step": 335230 + }, + { + "epoch": 1.69, + "learning_rate": 4.630065939831795e-05, + "loss": 0.0073, + "step": 335240 + }, + { + "epoch": 1.69, + "learning_rate": 4.629309170530394e-05, + "loss": 0.0068, + "step": 335250 + }, + { + "epoch": 1.69, + "learning_rate": 4.628552401228993e-05, + "loss": 0.0061, + "step": 335260 + }, + { + "epoch": 1.69, + "learning_rate": 4.6277956319275916e-05, + "loss": 0.006, + "step": 335270 + }, + { + "epoch": 1.69, + "learning_rate": 4.627038862626191e-05, + "loss": 0.0042, + "step": 335280 + }, + { + "epoch": 1.69, + "learning_rate": 4.62628209332479e-05, + "loss": 0.0061, + "step": 335290 + }, + { + "epoch": 1.69, + "learning_rate": 4.625525324023389e-05, + "loss": 0.0066, + "step": 335300 + }, + { + "epoch": 1.69, + "learning_rate": 4.6247685547219876e-05, + "loss": 0.0051, + "step": 335310 + }, + { + "epoch": 1.69, + "learning_rate": 4.624011785420587e-05, + "loss": 0.0057, + "step": 335320 + }, + { + "epoch": 1.69, + "learning_rate": 4.623255016119186e-05, + "loss": 0.0054, + "step": 335330 + }, + { + "epoch": 1.69, + "learning_rate": 4.622498246817785e-05, + "loss": 0.0044, + "step": 335340 + }, + { + "epoch": 1.69, + "learning_rate": 4.6217414775163835e-05, + "loss": 0.0059, + "step": 335350 + }, + { + "epoch": 1.69, + "learning_rate": 4.620984708214983e-05, + "loss": 0.0078, + "step": 335360 + }, + { + "epoch": 1.69, + "learning_rate": 4.620227938913582e-05, + "loss": 0.0073, + "step": 335370 + }, + { + "epoch": 1.69, + "learning_rate": 4.619471169612181e-05, + "loss": 0.0075, + "step": 335380 + }, + { + "epoch": 1.69, + "learning_rate": 4.6187144003107795e-05, + "loss": 0.0086, + "step": 335390 + }, + { + "epoch": 1.69, + "learning_rate": 4.617957631009379e-05, + "loss": 0.0073, + "step": 335400 + }, + { + "epoch": 1.69, + "learning_rate": 4.617200861707978e-05, + "loss": 0.0049, + "step": 335410 + }, + { + "epoch": 1.69, + "learning_rate": 4.6164440924065767e-05, + "loss": 0.0059, + "step": 335420 + }, + { + "epoch": 1.69, + "learning_rate": 4.6156873231051755e-05, + "loss": 0.0082, + "step": 335430 + }, + { + "epoch": 1.69, + "learning_rate": 4.614930553803774e-05, + "loss": 0.0066, + "step": 335440 + }, + { + "epoch": 1.69, + "learning_rate": 4.614173784502373e-05, + "loss": 0.0059, + "step": 335450 + }, + { + "epoch": 1.69, + "learning_rate": 4.613417015200972e-05, + "loss": 0.0082, + "step": 335460 + }, + { + "epoch": 1.69, + "learning_rate": 4.612660245899571e-05, + "loss": 0.0087, + "step": 335470 + }, + { + "epoch": 1.69, + "learning_rate": 4.61190347659817e-05, + "loss": 0.0059, + "step": 335480 + }, + { + "epoch": 1.69, + "learning_rate": 4.611146707296769e-05, + "loss": 0.0066, + "step": 335490 + }, + { + "epoch": 1.69, + "learning_rate": 4.610389937995368e-05, + "loss": 0.0058, + "step": 335500 + }, + { + "epoch": 1.69, + "learning_rate": 4.609633168693967e-05, + "loss": 0.0061, + "step": 335510 + }, + { + "epoch": 1.69, + "learning_rate": 4.608876399392566e-05, + "loss": 0.0069, + "step": 335520 + }, + { + "epoch": 1.69, + "learning_rate": 4.608119630091165e-05, + "loss": 0.0057, + "step": 335530 + }, + { + "epoch": 1.69, + "learning_rate": 4.607362860789764e-05, + "loss": 0.0062, + "step": 335540 + }, + { + "epoch": 1.69, + "learning_rate": 4.606606091488363e-05, + "loss": 0.0069, + "step": 335550 + }, + { + "epoch": 1.69, + "learning_rate": 4.605849322186962e-05, + "loss": 0.0059, + "step": 335560 + }, + { + "epoch": 1.69, + "learning_rate": 4.605092552885561e-05, + "loss": 0.0071, + "step": 335570 + }, + { + "epoch": 1.69, + "learning_rate": 4.60433578358416e-05, + "loss": 0.0059, + "step": 335580 + }, + { + "epoch": 1.69, + "learning_rate": 4.6035790142827587e-05, + "loss": 0.0078, + "step": 335590 + }, + { + "epoch": 1.69, + "learning_rate": 4.602822244981358e-05, + "loss": 0.007, + "step": 335600 + }, + { + "epoch": 1.69, + "learning_rate": 4.602065475679957e-05, + "loss": 0.0075, + "step": 335610 + }, + { + "epoch": 1.69, + "learning_rate": 4.601308706378556e-05, + "loss": 0.005, + "step": 335620 + }, + { + "epoch": 1.69, + "learning_rate": 4.6005519370771546e-05, + "loss": 0.0069, + "step": 335630 + }, + { + "epoch": 1.69, + "learning_rate": 4.599795167775754e-05, + "loss": 0.0056, + "step": 335640 + }, + { + "epoch": 1.69, + "learning_rate": 4.599038398474353e-05, + "loss": 0.0063, + "step": 335650 + }, + { + "epoch": 1.69, + "learning_rate": 4.598281629172952e-05, + "loss": 0.0057, + "step": 335660 + }, + { + "epoch": 1.69, + "learning_rate": 4.5975248598715506e-05, + "loss": 0.0081, + "step": 335670 + }, + { + "epoch": 1.69, + "learning_rate": 4.59676809057015e-05, + "loss": 0.0072, + "step": 335680 + }, + { + "epoch": 1.69, + "learning_rate": 4.596011321268749e-05, + "loss": 0.0059, + "step": 335690 + }, + { + "epoch": 1.69, + "learning_rate": 4.595254551967348e-05, + "loss": 0.0053, + "step": 335700 + }, + { + "epoch": 1.69, + "learning_rate": 4.5944977826659466e-05, + "loss": 0.0068, + "step": 335710 + }, + { + "epoch": 1.69, + "learning_rate": 4.593741013364546e-05, + "loss": 0.0073, + "step": 335720 + }, + { + "epoch": 1.69, + "learning_rate": 4.592984244063145e-05, + "loss": 0.0072, + "step": 335730 + }, + { + "epoch": 1.69, + "learning_rate": 4.592227474761744e-05, + "loss": 0.0061, + "step": 335740 + }, + { + "epoch": 1.69, + "learning_rate": 4.591470705460342e-05, + "loss": 0.0065, + "step": 335750 + }, + { + "epoch": 1.69, + "learning_rate": 4.5907139361589407e-05, + "loss": 0.0057, + "step": 335760 + }, + { + "epoch": 1.69, + "learning_rate": 4.58995716685754e-05, + "loss": 0.0083, + "step": 335770 + }, + { + "epoch": 1.69, + "learning_rate": 4.589200397556139e-05, + "loss": 0.0059, + "step": 335780 + }, + { + "epoch": 1.69, + "learning_rate": 4.588443628254738e-05, + "loss": 0.0071, + "step": 335790 + }, + { + "epoch": 1.69, + "learning_rate": 4.5876868589533366e-05, + "loss": 0.0055, + "step": 335800 + }, + { + "epoch": 1.69, + "learning_rate": 4.586930089651936e-05, + "loss": 0.0068, + "step": 335810 + }, + { + "epoch": 1.69, + "learning_rate": 4.586173320350535e-05, + "loss": 0.0072, + "step": 335820 + }, + { + "epoch": 1.69, + "learning_rate": 4.585416551049134e-05, + "loss": 0.0105, + "step": 335830 + }, + { + "epoch": 1.69, + "learning_rate": 4.5846597817477326e-05, + "loss": 0.0052, + "step": 335840 + }, + { + "epoch": 1.69, + "learning_rate": 4.583903012446332e-05, + "loss": 0.0067, + "step": 335850 + }, + { + "epoch": 1.69, + "learning_rate": 4.583146243144931e-05, + "loss": 0.0062, + "step": 335860 + }, + { + "epoch": 1.69, + "learning_rate": 4.58238947384353e-05, + "loss": 0.0067, + "step": 335870 + }, + { + "epoch": 1.69, + "learning_rate": 4.5816327045421286e-05, + "loss": 0.0083, + "step": 335880 + }, + { + "epoch": 1.69, + "learning_rate": 4.580875935240728e-05, + "loss": 0.0067, + "step": 335890 + }, + { + "epoch": 1.69, + "learning_rate": 4.580119165939327e-05, + "loss": 0.0049, + "step": 335900 + }, + { + "epoch": 1.69, + "learning_rate": 4.579362396637926e-05, + "loss": 0.0074, + "step": 335910 + }, + { + "epoch": 1.69, + "learning_rate": 4.578605627336525e-05, + "loss": 0.0057, + "step": 335920 + }, + { + "epoch": 1.69, + "learning_rate": 4.577848858035124e-05, + "loss": 0.0063, + "step": 335930 + }, + { + "epoch": 1.69, + "learning_rate": 4.577092088733723e-05, + "loss": 0.0054, + "step": 335940 + }, + { + "epoch": 1.69, + "learning_rate": 4.576335319432322e-05, + "loss": 0.0056, + "step": 335950 + }, + { + "epoch": 1.69, + "learning_rate": 4.575578550130921e-05, + "loss": 0.0079, + "step": 335960 + }, + { + "epoch": 1.7, + "learning_rate": 4.57482178082952e-05, + "loss": 0.0071, + "step": 335970 + }, + { + "epoch": 1.7, + "learning_rate": 4.574065011528119e-05, + "loss": 0.0078, + "step": 335980 + }, + { + "epoch": 1.7, + "learning_rate": 4.5733082422267176e-05, + "loss": 0.0053, + "step": 335990 + }, + { + "epoch": 1.7, + "learning_rate": 4.572551472925317e-05, + "loss": 0.0091, + "step": 336000 + }, + { + "epoch": 1.7, + "eval_cer": 0.9144372624348985, + "eval_loss": 0.004783105570822954, + "eval_runtime": 116.4347, + "eval_samples_per_second": 17.177, + "eval_steps_per_second": 4.294, + "step": 336000 + }, + { + "epoch": 1.7, + "learning_rate": 4.571794703623916e-05, + "loss": 0.0069, + "step": 336010 + }, + { + "epoch": 1.7, + "learning_rate": 4.571037934322515e-05, + "loss": 0.0058, + "step": 336020 + }, + { + "epoch": 1.7, + "learning_rate": 4.5702811650211136e-05, + "loss": 0.0051, + "step": 336030 + }, + { + "epoch": 1.7, + "learning_rate": 4.569524395719713e-05, + "loss": 0.0056, + "step": 336040 + }, + { + "epoch": 1.7, + "learning_rate": 4.568767626418312e-05, + "loss": 0.0051, + "step": 336050 + }, + { + "epoch": 1.7, + "learning_rate": 4.568010857116911e-05, + "loss": 0.0053, + "step": 336060 + }, + { + "epoch": 1.7, + "learning_rate": 4.567254087815509e-05, + "loss": 0.0045, + "step": 336070 + }, + { + "epoch": 1.7, + "learning_rate": 4.566497318514108e-05, + "loss": 0.0095, + "step": 336080 + }, + { + "epoch": 1.7, + "learning_rate": 4.565740549212707e-05, + "loss": 0.0062, + "step": 336090 + }, + { + "epoch": 1.7, + "learning_rate": 4.564983779911306e-05, + "loss": 0.0072, + "step": 336100 + }, + { + "epoch": 1.7, + "learning_rate": 4.564227010609905e-05, + "loss": 0.0063, + "step": 336110 + }, + { + "epoch": 1.7, + "learning_rate": 4.563470241308504e-05, + "loss": 0.0064, + "step": 336120 + }, + { + "epoch": 1.7, + "learning_rate": 4.562713472007103e-05, + "loss": 0.0051, + "step": 336130 + }, + { + "epoch": 1.7, + "learning_rate": 4.561956702705702e-05, + "loss": 0.0052, + "step": 336140 + }, + { + "epoch": 1.7, + "learning_rate": 4.561199933404301e-05, + "loss": 0.0054, + "step": 336150 + }, + { + "epoch": 1.7, + "learning_rate": 4.5604431641028996e-05, + "loss": 0.0078, + "step": 336160 + }, + { + "epoch": 1.7, + "learning_rate": 4.559686394801499e-05, + "loss": 0.0081, + "step": 336170 + }, + { + "epoch": 1.7, + "learning_rate": 4.558929625500098e-05, + "loss": 0.0054, + "step": 336180 + }, + { + "epoch": 1.7, + "learning_rate": 4.558172856198697e-05, + "loss": 0.0065, + "step": 336190 + }, + { + "epoch": 1.7, + "learning_rate": 4.5574160868972956e-05, + "loss": 0.0063, + "step": 336200 + }, + { + "epoch": 1.7, + "learning_rate": 4.556659317595895e-05, + "loss": 0.0074, + "step": 336210 + }, + { + "epoch": 1.7, + "learning_rate": 4.555902548294494e-05, + "loss": 0.006, + "step": 336220 + }, + { + "epoch": 1.7, + "learning_rate": 4.555145778993093e-05, + "loss": 0.0054, + "step": 336230 + }, + { + "epoch": 1.7, + "learning_rate": 4.5543890096916916e-05, + "loss": 0.0071, + "step": 336240 + }, + { + "epoch": 1.7, + "learning_rate": 4.553632240390291e-05, + "loss": 0.0063, + "step": 336250 + }, + { + "epoch": 1.7, + "learning_rate": 4.55287547108889e-05, + "loss": 0.008, + "step": 336260 + }, + { + "epoch": 1.7, + "learning_rate": 4.552118701787489e-05, + "loss": 0.0064, + "step": 336270 + }, + { + "epoch": 1.7, + "learning_rate": 4.5513619324860875e-05, + "loss": 0.0058, + "step": 336280 + }, + { + "epoch": 1.7, + "learning_rate": 4.550605163184687e-05, + "loss": 0.0053, + "step": 336290 + }, + { + "epoch": 1.7, + "learning_rate": 4.549848393883286e-05, + "loss": 0.0078, + "step": 336300 + }, + { + "epoch": 1.7, + "learning_rate": 4.549091624581885e-05, + "loss": 0.0067, + "step": 336310 + }, + { + "epoch": 1.7, + "learning_rate": 4.5483348552804835e-05, + "loss": 0.0065, + "step": 336320 + }, + { + "epoch": 1.7, + "learning_rate": 4.547578085979083e-05, + "loss": 0.0051, + "step": 336330 + }, + { + "epoch": 1.7, + "learning_rate": 4.546821316677682e-05, + "loss": 0.0046, + "step": 336340 + }, + { + "epoch": 1.7, + "learning_rate": 4.5460645473762806e-05, + "loss": 0.0062, + "step": 336350 + }, + { + "epoch": 1.7, + "learning_rate": 4.5453077780748795e-05, + "loss": 0.0053, + "step": 336360 + }, + { + "epoch": 1.7, + "learning_rate": 4.544551008773479e-05, + "loss": 0.0066, + "step": 336370 + }, + { + "epoch": 1.7, + "learning_rate": 4.543794239472077e-05, + "loss": 0.0047, + "step": 336380 + }, + { + "epoch": 1.7, + "learning_rate": 4.543037470170676e-05, + "loss": 0.0074, + "step": 336390 + }, + { + "epoch": 1.7, + "learning_rate": 4.542280700869275e-05, + "loss": 0.006, + "step": 336400 + }, + { + "epoch": 1.7, + "learning_rate": 4.541523931567874e-05, + "loss": 0.0055, + "step": 336410 + }, + { + "epoch": 1.7, + "learning_rate": 4.540767162266473e-05, + "loss": 0.0057, + "step": 336420 + }, + { + "epoch": 1.7, + "learning_rate": 4.540010392965072e-05, + "loss": 0.0078, + "step": 336430 + }, + { + "epoch": 1.7, + "learning_rate": 4.539253623663671e-05, + "loss": 0.0083, + "step": 336440 + }, + { + "epoch": 1.7, + "learning_rate": 4.53849685436227e-05, + "loss": 0.0073, + "step": 336450 + }, + { + "epoch": 1.7, + "learning_rate": 4.537740085060869e-05, + "loss": 0.0081, + "step": 336460 + }, + { + "epoch": 1.7, + "learning_rate": 4.536983315759468e-05, + "loss": 0.0101, + "step": 336470 + }, + { + "epoch": 1.7, + "learning_rate": 4.536226546458067e-05, + "loss": 0.0045, + "step": 336480 + }, + { + "epoch": 1.7, + "learning_rate": 4.535469777156666e-05, + "loss": 0.0062, + "step": 336490 + }, + { + "epoch": 1.7, + "learning_rate": 4.534713007855265e-05, + "loss": 0.0068, + "step": 336500 + }, + { + "epoch": 1.7, + "learning_rate": 4.533956238553864e-05, + "loss": 0.0059, + "step": 336510 + }, + { + "epoch": 1.7, + "learning_rate": 4.5331994692524626e-05, + "loss": 0.0054, + "step": 336520 + }, + { + "epoch": 1.7, + "learning_rate": 4.532442699951062e-05, + "loss": 0.0053, + "step": 336530 + }, + { + "epoch": 1.7, + "learning_rate": 4.531685930649661e-05, + "loss": 0.0053, + "step": 336540 + }, + { + "epoch": 1.7, + "learning_rate": 4.53092916134826e-05, + "loss": 0.0074, + "step": 336550 + }, + { + "epoch": 1.7, + "learning_rate": 4.5301723920468586e-05, + "loss": 0.006, + "step": 336560 + }, + { + "epoch": 1.7, + "learning_rate": 4.529415622745458e-05, + "loss": 0.0074, + "step": 336570 + }, + { + "epoch": 1.7, + "learning_rate": 4.528658853444057e-05, + "loss": 0.008, + "step": 336580 + }, + { + "epoch": 1.7, + "learning_rate": 4.527902084142656e-05, + "loss": 0.0058, + "step": 336590 + }, + { + "epoch": 1.7, + "learning_rate": 4.5271453148412546e-05, + "loss": 0.0074, + "step": 336600 + }, + { + "epoch": 1.7, + "learning_rate": 4.526388545539854e-05, + "loss": 0.0058, + "step": 336610 + }, + { + "epoch": 1.7, + "learning_rate": 4.525631776238453e-05, + "loss": 0.0071, + "step": 336620 + }, + { + "epoch": 1.7, + "learning_rate": 4.524875006937052e-05, + "loss": 0.0054, + "step": 336630 + }, + { + "epoch": 1.7, + "learning_rate": 4.5241182376356505e-05, + "loss": 0.006, + "step": 336640 + }, + { + "epoch": 1.7, + "learning_rate": 4.52336146833425e-05, + "loss": 0.0074, + "step": 336650 + }, + { + "epoch": 1.7, + "learning_rate": 4.522604699032849e-05, + "loss": 0.0057, + "step": 336660 + }, + { + "epoch": 1.7, + "learning_rate": 4.521847929731448e-05, + "loss": 0.0073, + "step": 336670 + }, + { + "epoch": 1.7, + "learning_rate": 4.5210911604300465e-05, + "loss": 0.006, + "step": 336680 + }, + { + "epoch": 1.7, + "learning_rate": 4.5203343911286446e-05, + "loss": 0.0101, + "step": 336690 + }, + { + "epoch": 1.7, + "learning_rate": 4.519577621827244e-05, + "loss": 0.0062, + "step": 336700 + }, + { + "epoch": 1.7, + "learning_rate": 4.518820852525843e-05, + "loss": 0.0059, + "step": 336710 + }, + { + "epoch": 1.7, + "learning_rate": 4.518064083224442e-05, + "loss": 0.0092, + "step": 336720 + }, + { + "epoch": 1.7, + "learning_rate": 4.5173073139230406e-05, + "loss": 0.0065, + "step": 336730 + }, + { + "epoch": 1.7, + "learning_rate": 4.51655054462164e-05, + "loss": 0.0066, + "step": 336740 + }, + { + "epoch": 1.7, + "learning_rate": 4.515793775320239e-05, + "loss": 0.0131, + "step": 336750 + }, + { + "epoch": 1.7, + "learning_rate": 4.515037006018838e-05, + "loss": 0.0071, + "step": 336760 + }, + { + "epoch": 1.7, + "learning_rate": 4.5142802367174366e-05, + "loss": 0.0053, + "step": 336770 + }, + { + "epoch": 1.7, + "learning_rate": 4.513523467416036e-05, + "loss": 0.0057, + "step": 336780 + }, + { + "epoch": 1.7, + "learning_rate": 4.512766698114635e-05, + "loss": 0.0061, + "step": 336790 + }, + { + "epoch": 1.7, + "learning_rate": 4.512009928813234e-05, + "loss": 0.006, + "step": 336800 + }, + { + "epoch": 1.7, + "learning_rate": 4.5112531595118325e-05, + "loss": 0.0052, + "step": 336810 + }, + { + "epoch": 1.7, + "learning_rate": 4.510496390210432e-05, + "loss": 0.0057, + "step": 336820 + }, + { + "epoch": 1.7, + "learning_rate": 4.509739620909031e-05, + "loss": 0.0076, + "step": 336830 + }, + { + "epoch": 1.7, + "learning_rate": 4.50898285160763e-05, + "loss": 0.0068, + "step": 336840 + }, + { + "epoch": 1.7, + "learning_rate": 4.5082260823062285e-05, + "loss": 0.0063, + "step": 336850 + }, + { + "epoch": 1.7, + "learning_rate": 4.507469313004828e-05, + "loss": 0.0075, + "step": 336860 + }, + { + "epoch": 1.7, + "learning_rate": 4.506712543703427e-05, + "loss": 0.0063, + "step": 336870 + }, + { + "epoch": 1.7, + "learning_rate": 4.5059557744020257e-05, + "loss": 0.0067, + "step": 336880 + }, + { + "epoch": 1.7, + "learning_rate": 4.505199005100625e-05, + "loss": 0.0069, + "step": 336890 + }, + { + "epoch": 1.7, + "learning_rate": 4.504442235799224e-05, + "loss": 0.0053, + "step": 336900 + }, + { + "epoch": 1.7, + "learning_rate": 4.503685466497823e-05, + "loss": 0.0047, + "step": 336910 + }, + { + "epoch": 1.7, + "learning_rate": 4.5029286971964216e-05, + "loss": 0.0073, + "step": 336920 + }, + { + "epoch": 1.7, + "learning_rate": 4.502171927895021e-05, + "loss": 0.006, + "step": 336930 + }, + { + "epoch": 1.7, + "learning_rate": 4.50141515859362e-05, + "loss": 0.0068, + "step": 336940 + }, + { + "epoch": 1.7, + "learning_rate": 4.500658389292219e-05, + "loss": 0.006, + "step": 336950 + }, + { + "epoch": 1.7, + "learning_rate": 4.4999016199908176e-05, + "loss": 0.0063, + "step": 336960 + }, + { + "epoch": 1.7, + "learning_rate": 4.499144850689417e-05, + "loss": 0.0073, + "step": 336970 + }, + { + "epoch": 1.7, + "learning_rate": 4.498388081388016e-05, + "loss": 0.0079, + "step": 336980 + }, + { + "epoch": 1.7, + "learning_rate": 4.497631312086615e-05, + "loss": 0.0066, + "step": 336990 + }, + { + "epoch": 1.7, + "learning_rate": 4.4968745427852135e-05, + "loss": 0.0093, + "step": 337000 + }, + { + "epoch": 1.7, + "eval_cer": 0.9144333808503969, + "eval_loss": 0.004760997835546732, + "eval_runtime": 116.4296, + "eval_samples_per_second": 17.178, + "eval_steps_per_second": 4.294, + "step": 337000 + }, + { + "epoch": 1.7, + "learning_rate": 4.496117773483812e-05, + "loss": 0.0047, + "step": 337010 + }, + { + "epoch": 1.7, + "learning_rate": 4.495361004182411e-05, + "loss": 0.0063, + "step": 337020 + }, + { + "epoch": 1.7, + "learning_rate": 4.49460423488101e-05, + "loss": 0.0046, + "step": 337030 + }, + { + "epoch": 1.7, + "learning_rate": 4.493847465579609e-05, + "loss": 0.0063, + "step": 337040 + }, + { + "epoch": 1.7, + "learning_rate": 4.4930906962782077e-05, + "loss": 0.0099, + "step": 337050 + }, + { + "epoch": 1.7, + "learning_rate": 4.492333926976807e-05, + "loss": 0.0069, + "step": 337060 + }, + { + "epoch": 1.7, + "learning_rate": 4.491577157675406e-05, + "loss": 0.0062, + "step": 337070 + }, + { + "epoch": 1.7, + "learning_rate": 4.490820388374005e-05, + "loss": 0.0075, + "step": 337080 + }, + { + "epoch": 1.7, + "learning_rate": 4.4900636190726036e-05, + "loss": 0.0078, + "step": 337090 + }, + { + "epoch": 1.7, + "learning_rate": 4.489306849771203e-05, + "loss": 0.0058, + "step": 337100 + }, + { + "epoch": 1.7, + "learning_rate": 4.488550080469802e-05, + "loss": 0.0065, + "step": 337110 + }, + { + "epoch": 1.7, + "learning_rate": 4.487793311168401e-05, + "loss": 0.0054, + "step": 337120 + }, + { + "epoch": 1.7, + "learning_rate": 4.4870365418669996e-05, + "loss": 0.0059, + "step": 337130 + }, + { + "epoch": 1.7, + "learning_rate": 4.486279772565599e-05, + "loss": 0.0052, + "step": 337140 + }, + { + "epoch": 1.7, + "learning_rate": 4.485523003264198e-05, + "loss": 0.007, + "step": 337150 + }, + { + "epoch": 1.7, + "learning_rate": 4.484766233962797e-05, + "loss": 0.0076, + "step": 337160 + }, + { + "epoch": 1.7, + "learning_rate": 4.4840094646613956e-05, + "loss": 0.0063, + "step": 337170 + }, + { + "epoch": 1.7, + "learning_rate": 4.483252695359995e-05, + "loss": 0.0064, + "step": 337180 + }, + { + "epoch": 1.7, + "learning_rate": 4.482495926058594e-05, + "loss": 0.0086, + "step": 337190 + }, + { + "epoch": 1.7, + "learning_rate": 4.481739156757193e-05, + "loss": 0.0061, + "step": 337200 + }, + { + "epoch": 1.7, + "learning_rate": 4.4809823874557915e-05, + "loss": 0.0081, + "step": 337210 + }, + { + "epoch": 1.7, + "learning_rate": 4.480225618154391e-05, + "loss": 0.0066, + "step": 337220 + }, + { + "epoch": 1.7, + "learning_rate": 4.47946884885299e-05, + "loss": 0.004, + "step": 337230 + }, + { + "epoch": 1.7, + "learning_rate": 4.4787120795515887e-05, + "loss": 0.0083, + "step": 337240 + }, + { + "epoch": 1.7, + "learning_rate": 4.4779553102501875e-05, + "loss": 0.0059, + "step": 337250 + }, + { + "epoch": 1.7, + "learning_rate": 4.477198540948787e-05, + "loss": 0.0072, + "step": 337260 + }, + { + "epoch": 1.7, + "learning_rate": 4.476441771647386e-05, + "loss": 0.0081, + "step": 337270 + }, + { + "epoch": 1.7, + "learning_rate": 4.4756850023459846e-05, + "loss": 0.0069, + "step": 337280 + }, + { + "epoch": 1.7, + "learning_rate": 4.4749282330445834e-05, + "loss": 0.0051, + "step": 337290 + }, + { + "epoch": 1.7, + "learning_rate": 4.474171463743183e-05, + "loss": 0.0052, + "step": 337300 + }, + { + "epoch": 1.7, + "learning_rate": 4.473414694441782e-05, + "loss": 0.0058, + "step": 337310 + }, + { + "epoch": 1.7, + "learning_rate": 4.47265792514038e-05, + "loss": 0.0069, + "step": 337320 + }, + { + "epoch": 1.7, + "learning_rate": 4.471901155838979e-05, + "loss": 0.0078, + "step": 337330 + }, + { + "epoch": 1.7, + "learning_rate": 4.4711443865375776e-05, + "loss": 0.0058, + "step": 337340 + }, + { + "epoch": 1.7, + "learning_rate": 4.470387617236177e-05, + "loss": 0.0075, + "step": 337350 + }, + { + "epoch": 1.7, + "learning_rate": 4.469630847934776e-05, + "loss": 0.0071, + "step": 337360 + }, + { + "epoch": 1.7, + "learning_rate": 4.468874078633375e-05, + "loss": 0.0091, + "step": 337370 + }, + { + "epoch": 1.7, + "learning_rate": 4.468117309331974e-05, + "loss": 0.0056, + "step": 337380 + }, + { + "epoch": 1.7, + "learning_rate": 4.467360540030573e-05, + "loss": 0.0069, + "step": 337390 + }, + { + "epoch": 1.7, + "learning_rate": 4.466603770729172e-05, + "loss": 0.0068, + "step": 337400 + }, + { + "epoch": 1.7, + "learning_rate": 4.465847001427771e-05, + "loss": 0.0066, + "step": 337410 + }, + { + "epoch": 1.7, + "learning_rate": 4.46509023212637e-05, + "loss": 0.0051, + "step": 337420 + }, + { + "epoch": 1.7, + "learning_rate": 4.464333462824969e-05, + "loss": 0.0067, + "step": 337430 + }, + { + "epoch": 1.7, + "learning_rate": 4.463576693523568e-05, + "loss": 0.0064, + "step": 337440 + }, + { + "epoch": 1.7, + "learning_rate": 4.4628199242221666e-05, + "loss": 0.0078, + "step": 337450 + }, + { + "epoch": 1.7, + "learning_rate": 4.462063154920766e-05, + "loss": 0.0059, + "step": 337460 + }, + { + "epoch": 1.7, + "learning_rate": 4.461306385619365e-05, + "loss": 0.0077, + "step": 337470 + }, + { + "epoch": 1.7, + "learning_rate": 4.460549616317964e-05, + "loss": 0.0059, + "step": 337480 + }, + { + "epoch": 1.7, + "learning_rate": 4.4597928470165626e-05, + "loss": 0.0067, + "step": 337490 + }, + { + "epoch": 1.7, + "learning_rate": 4.459036077715162e-05, + "loss": 0.0036, + "step": 337500 + }, + { + "epoch": 1.7, + "learning_rate": 4.458279308413761e-05, + "loss": 0.0088, + "step": 337510 + }, + { + "epoch": 1.7, + "learning_rate": 4.45752253911236e-05, + "loss": 0.0046, + "step": 337520 + }, + { + "epoch": 1.7, + "learning_rate": 4.4567657698109586e-05, + "loss": 0.006, + "step": 337530 + }, + { + "epoch": 1.7, + "learning_rate": 4.456009000509558e-05, + "loss": 0.0055, + "step": 337540 + }, + { + "epoch": 1.7, + "learning_rate": 4.455252231208157e-05, + "loss": 0.006, + "step": 337550 + }, + { + "epoch": 1.7, + "learning_rate": 4.454495461906756e-05, + "loss": 0.0061, + "step": 337560 + }, + { + "epoch": 1.7, + "learning_rate": 4.4537386926053545e-05, + "loss": 0.0077, + "step": 337570 + }, + { + "epoch": 1.7, + "learning_rate": 4.452981923303954e-05, + "loss": 0.0061, + "step": 337580 + }, + { + "epoch": 1.7, + "learning_rate": 4.452225154002553e-05, + "loss": 0.0047, + "step": 337590 + }, + { + "epoch": 1.7, + "learning_rate": 4.451468384701152e-05, + "loss": 0.0062, + "step": 337600 + }, + { + "epoch": 1.7, + "learning_rate": 4.4507116153997505e-05, + "loss": 0.0073, + "step": 337610 + }, + { + "epoch": 1.7, + "learning_rate": 4.44995484609835e-05, + "loss": 0.0052, + "step": 337620 + }, + { + "epoch": 1.7, + "learning_rate": 4.449198076796949e-05, + "loss": 0.0055, + "step": 337630 + }, + { + "epoch": 1.7, + "learning_rate": 4.448441307495547e-05, + "loss": 0.0051, + "step": 337640 + }, + { + "epoch": 1.7, + "learning_rate": 4.447684538194146e-05, + "loss": 0.0088, + "step": 337650 + }, + { + "epoch": 1.7, + "learning_rate": 4.4469277688927446e-05, + "loss": 0.0046, + "step": 337660 + }, + { + "epoch": 1.7, + "learning_rate": 4.446170999591344e-05, + "loss": 0.0065, + "step": 337670 + }, + { + "epoch": 1.7, + "learning_rate": 4.445414230289943e-05, + "loss": 0.0053, + "step": 337680 + }, + { + "epoch": 1.7, + "learning_rate": 4.444657460988542e-05, + "loss": 0.0069, + "step": 337690 + }, + { + "epoch": 1.7, + "learning_rate": 4.4439006916871406e-05, + "loss": 0.0086, + "step": 337700 + }, + { + "epoch": 1.7, + "learning_rate": 4.44314392238574e-05, + "loss": 0.0049, + "step": 337710 + }, + { + "epoch": 1.7, + "learning_rate": 4.442387153084339e-05, + "loss": 0.0051, + "step": 337720 + }, + { + "epoch": 1.7, + "learning_rate": 4.441630383782938e-05, + "loss": 0.0066, + "step": 337730 + }, + { + "epoch": 1.7, + "learning_rate": 4.4408736144815365e-05, + "loss": 0.0051, + "step": 337740 + }, + { + "epoch": 1.7, + "learning_rate": 4.440116845180136e-05, + "loss": 0.0081, + "step": 337750 + }, + { + "epoch": 1.7, + "learning_rate": 4.439360075878735e-05, + "loss": 0.0089, + "step": 337760 + }, + { + "epoch": 1.7, + "learning_rate": 4.438603306577334e-05, + "loss": 0.0074, + "step": 337770 + }, + { + "epoch": 1.7, + "learning_rate": 4.4378465372759325e-05, + "loss": 0.0059, + "step": 337780 + }, + { + "epoch": 1.7, + "learning_rate": 4.437089767974532e-05, + "loss": 0.0081, + "step": 337790 + }, + { + "epoch": 1.7, + "learning_rate": 4.436332998673131e-05, + "loss": 0.0053, + "step": 337800 + }, + { + "epoch": 1.7, + "learning_rate": 4.4355762293717296e-05, + "loss": 0.0054, + "step": 337810 + }, + { + "epoch": 1.7, + "learning_rate": 4.4348194600703285e-05, + "loss": 0.0073, + "step": 337820 + }, + { + "epoch": 1.7, + "learning_rate": 4.434062690768928e-05, + "loss": 0.0065, + "step": 337830 + }, + { + "epoch": 1.7, + "learning_rate": 4.433305921467527e-05, + "loss": 0.0059, + "step": 337840 + }, + { + "epoch": 1.7, + "learning_rate": 4.4325491521661256e-05, + "loss": 0.0074, + "step": 337850 + }, + { + "epoch": 1.7, + "learning_rate": 4.431792382864725e-05, + "loss": 0.0055, + "step": 337860 + }, + { + "epoch": 1.7, + "learning_rate": 4.431035613563324e-05, + "loss": 0.0066, + "step": 337870 + }, + { + "epoch": 1.7, + "learning_rate": 4.430278844261923e-05, + "loss": 0.0077, + "step": 337880 + }, + { + "epoch": 1.7, + "learning_rate": 4.4295220749605216e-05, + "loss": 0.0065, + "step": 337890 + }, + { + "epoch": 1.7, + "learning_rate": 4.428765305659121e-05, + "loss": 0.006, + "step": 337900 + }, + { + "epoch": 1.7, + "learning_rate": 4.42800853635772e-05, + "loss": 0.0057, + "step": 337910 + }, + { + "epoch": 1.7, + "learning_rate": 4.427251767056319e-05, + "loss": 0.0091, + "step": 337920 + }, + { + "epoch": 1.7, + "learning_rate": 4.4264949977549175e-05, + "loss": 0.005, + "step": 337930 + }, + { + "epoch": 1.7, + "learning_rate": 4.425738228453517e-05, + "loss": 0.0074, + "step": 337940 + }, + { + "epoch": 1.7, + "learning_rate": 4.424981459152115e-05, + "loss": 0.0055, + "step": 337950 + }, + { + "epoch": 1.71, + "learning_rate": 4.424224689850714e-05, + "loss": 0.0051, + "step": 337960 + }, + { + "epoch": 1.71, + "learning_rate": 4.423467920549313e-05, + "loss": 0.0061, + "step": 337970 + }, + { + "epoch": 1.71, + "learning_rate": 4.4227111512479116e-05, + "loss": 0.0051, + "step": 337980 + }, + { + "epoch": 1.71, + "learning_rate": 4.421954381946511e-05, + "loss": 0.0076, + "step": 337990 + }, + { + "epoch": 1.71, + "learning_rate": 4.42119761264511e-05, + "loss": 0.0061, + "step": 338000 + }, + { + "epoch": 1.71, + "eval_cer": 0.9144197953046413, + "eval_loss": 0.004835808649659157, + "eval_runtime": 116.338, + "eval_samples_per_second": 17.191, + "eval_steps_per_second": 4.298, + "step": 338000 + }, + { + "epoch": 1.71, + "learning_rate": 4.420440843343709e-05, + "loss": 0.0052, + "step": 338010 + }, + { + "epoch": 1.71, + "learning_rate": 4.4196840740423076e-05, + "loss": 0.0073, + "step": 338020 + }, + { + "epoch": 1.71, + "learning_rate": 4.418927304740907e-05, + "loss": 0.0061, + "step": 338030 + }, + { + "epoch": 1.71, + "learning_rate": 4.418170535439506e-05, + "loss": 0.0081, + "step": 338040 + }, + { + "epoch": 1.71, + "learning_rate": 4.417413766138105e-05, + "loss": 0.0062, + "step": 338050 + }, + { + "epoch": 1.71, + "learning_rate": 4.4166569968367036e-05, + "loss": 0.0063, + "step": 338060 + }, + { + "epoch": 1.71, + "learning_rate": 4.415900227535303e-05, + "loss": 0.0064, + "step": 338070 + }, + { + "epoch": 1.71, + "learning_rate": 4.415143458233902e-05, + "loss": 0.0085, + "step": 338080 + }, + { + "epoch": 1.71, + "learning_rate": 4.414386688932501e-05, + "loss": 0.0073, + "step": 338090 + }, + { + "epoch": 1.71, + "learning_rate": 4.4136299196310995e-05, + "loss": 0.0043, + "step": 338100 + }, + { + "epoch": 1.71, + "learning_rate": 4.412873150329699e-05, + "loss": 0.006, + "step": 338110 + }, + { + "epoch": 1.71, + "learning_rate": 4.412116381028298e-05, + "loss": 0.0068, + "step": 338120 + }, + { + "epoch": 1.71, + "learning_rate": 4.411359611726897e-05, + "loss": 0.0068, + "step": 338130 + }, + { + "epoch": 1.71, + "learning_rate": 4.4106028424254955e-05, + "loss": 0.007, + "step": 338140 + }, + { + "epoch": 1.71, + "learning_rate": 4.409846073124095e-05, + "loss": 0.0064, + "step": 338150 + }, + { + "epoch": 1.71, + "learning_rate": 4.409089303822694e-05, + "loss": 0.006, + "step": 338160 + }, + { + "epoch": 1.71, + "learning_rate": 4.4083325345212926e-05, + "loss": 0.0074, + "step": 338170 + }, + { + "epoch": 1.71, + "learning_rate": 4.4075757652198915e-05, + "loss": 0.0069, + "step": 338180 + }, + { + "epoch": 1.71, + "learning_rate": 4.406818995918491e-05, + "loss": 0.0075, + "step": 338190 + }, + { + "epoch": 1.71, + "learning_rate": 4.40606222661709e-05, + "loss": 0.007, + "step": 338200 + }, + { + "epoch": 1.71, + "learning_rate": 4.4053054573156886e-05, + "loss": 0.0054, + "step": 338210 + }, + { + "epoch": 1.71, + "learning_rate": 4.4045486880142874e-05, + "loss": 0.0054, + "step": 338220 + }, + { + "epoch": 1.71, + "learning_rate": 4.403791918712887e-05, + "loss": 0.0064, + "step": 338230 + }, + { + "epoch": 1.71, + "learning_rate": 4.403035149411486e-05, + "loss": 0.0067, + "step": 338240 + }, + { + "epoch": 1.71, + "learning_rate": 4.4022783801100846e-05, + "loss": 0.0066, + "step": 338250 + }, + { + "epoch": 1.71, + "learning_rate": 4.401521610808683e-05, + "loss": 0.0067, + "step": 338260 + }, + { + "epoch": 1.71, + "learning_rate": 4.4007648415072815e-05, + "loss": 0.0086, + "step": 338270 + }, + { + "epoch": 1.71, + "learning_rate": 4.400008072205881e-05, + "loss": 0.0064, + "step": 338280 + }, + { + "epoch": 1.71, + "learning_rate": 4.39925130290448e-05, + "loss": 0.0062, + "step": 338290 + }, + { + "epoch": 1.71, + "learning_rate": 4.398494533603079e-05, + "loss": 0.0055, + "step": 338300 + }, + { + "epoch": 1.71, + "learning_rate": 4.3977377643016775e-05, + "loss": 0.0065, + "step": 338310 + }, + { + "epoch": 1.71, + "learning_rate": 4.396980995000277e-05, + "loss": 0.0056, + "step": 338320 + }, + { + "epoch": 1.71, + "learning_rate": 4.396224225698876e-05, + "loss": 0.0073, + "step": 338330 + }, + { + "epoch": 1.71, + "learning_rate": 4.3954674563974747e-05, + "loss": 0.0077, + "step": 338340 + }, + { + "epoch": 1.71, + "learning_rate": 4.394710687096074e-05, + "loss": 0.0057, + "step": 338350 + }, + { + "epoch": 1.71, + "learning_rate": 4.393953917794673e-05, + "loss": 0.0068, + "step": 338360 + }, + { + "epoch": 1.71, + "learning_rate": 4.393197148493272e-05, + "loss": 0.0055, + "step": 338370 + }, + { + "epoch": 1.71, + "learning_rate": 4.3924403791918706e-05, + "loss": 0.0074, + "step": 338380 + }, + { + "epoch": 1.71, + "learning_rate": 4.39168360989047e-05, + "loss": 0.0068, + "step": 338390 + }, + { + "epoch": 1.71, + "learning_rate": 4.390926840589069e-05, + "loss": 0.0083, + "step": 338400 + }, + { + "epoch": 1.71, + "learning_rate": 4.390170071287668e-05, + "loss": 0.0039, + "step": 338410 + }, + { + "epoch": 1.71, + "learning_rate": 4.3894133019862666e-05, + "loss": 0.0062, + "step": 338420 + }, + { + "epoch": 1.71, + "learning_rate": 4.388656532684866e-05, + "loss": 0.006, + "step": 338430 + }, + { + "epoch": 1.71, + "learning_rate": 4.387899763383465e-05, + "loss": 0.0053, + "step": 338440 + }, + { + "epoch": 1.71, + "learning_rate": 4.387142994082064e-05, + "loss": 0.0062, + "step": 338450 + }, + { + "epoch": 1.71, + "learning_rate": 4.3863862247806625e-05, + "loss": 0.0075, + "step": 338460 + }, + { + "epoch": 1.71, + "learning_rate": 4.385629455479262e-05, + "loss": 0.0064, + "step": 338470 + }, + { + "epoch": 1.71, + "learning_rate": 4.384872686177861e-05, + "loss": 0.0044, + "step": 338480 + }, + { + "epoch": 1.71, + "learning_rate": 4.38411591687646e-05, + "loss": 0.0056, + "step": 338490 + }, + { + "epoch": 1.71, + "learning_rate": 4.3833591475750585e-05, + "loss": 0.0052, + "step": 338500 + }, + { + "epoch": 1.71, + "learning_rate": 4.382602378273658e-05, + "loss": 0.0062, + "step": 338510 + }, + { + "epoch": 1.71, + "learning_rate": 4.381845608972257e-05, + "loss": 0.0057, + "step": 338520 + }, + { + "epoch": 1.71, + "learning_rate": 4.3810888396708557e-05, + "loss": 0.0059, + "step": 338530 + }, + { + "epoch": 1.71, + "learning_rate": 4.3803320703694545e-05, + "loss": 0.0097, + "step": 338540 + }, + { + "epoch": 1.71, + "learning_rate": 4.379575301068054e-05, + "loss": 0.0064, + "step": 338550 + }, + { + "epoch": 1.71, + "learning_rate": 4.378818531766653e-05, + "loss": 0.0055, + "step": 338560 + }, + { + "epoch": 1.71, + "learning_rate": 4.3780617624652516e-05, + "loss": 0.0067, + "step": 338570 + }, + { + "epoch": 1.71, + "learning_rate": 4.37730499316385e-05, + "loss": 0.0058, + "step": 338580 + }, + { + "epoch": 1.71, + "learning_rate": 4.3765482238624486e-05, + "loss": 0.0065, + "step": 338590 + }, + { + "epoch": 1.71, + "learning_rate": 4.375791454561048e-05, + "loss": 0.005, + "step": 338600 + }, + { + "epoch": 1.71, + "learning_rate": 4.375034685259647e-05, + "loss": 0.0068, + "step": 338610 + }, + { + "epoch": 1.71, + "learning_rate": 4.374277915958246e-05, + "loss": 0.0063, + "step": 338620 + }, + { + "epoch": 1.71, + "learning_rate": 4.3735211466568446e-05, + "loss": 0.0051, + "step": 338630 + }, + { + "epoch": 1.71, + "learning_rate": 4.372764377355444e-05, + "loss": 0.0058, + "step": 338640 + }, + { + "epoch": 1.71, + "learning_rate": 4.372007608054043e-05, + "loss": 0.0053, + "step": 338650 + }, + { + "epoch": 1.71, + "learning_rate": 4.371250838752642e-05, + "loss": 0.005, + "step": 338660 + }, + { + "epoch": 1.71, + "learning_rate": 4.3704940694512405e-05, + "loss": 0.0071, + "step": 338670 + }, + { + "epoch": 1.71, + "learning_rate": 4.36973730014984e-05, + "loss": 0.006, + "step": 338680 + }, + { + "epoch": 1.71, + "learning_rate": 4.368980530848439e-05, + "loss": 0.008, + "step": 338690 + }, + { + "epoch": 1.71, + "learning_rate": 4.3682237615470377e-05, + "loss": 0.0083, + "step": 338700 + }, + { + "epoch": 1.71, + "learning_rate": 4.3674669922456365e-05, + "loss": 0.0058, + "step": 338710 + }, + { + "epoch": 1.71, + "learning_rate": 4.366710222944236e-05, + "loss": 0.0097, + "step": 338720 + }, + { + "epoch": 1.71, + "learning_rate": 4.365953453642835e-05, + "loss": 0.0068, + "step": 338730 + }, + { + "epoch": 1.71, + "learning_rate": 4.3651966843414336e-05, + "loss": 0.0063, + "step": 338740 + }, + { + "epoch": 1.71, + "learning_rate": 4.3644399150400324e-05, + "loss": 0.0063, + "step": 338750 + }, + { + "epoch": 1.71, + "learning_rate": 4.363683145738632e-05, + "loss": 0.0098, + "step": 338760 + }, + { + "epoch": 1.71, + "learning_rate": 4.362926376437231e-05, + "loss": 0.0066, + "step": 338770 + }, + { + "epoch": 1.71, + "learning_rate": 4.3621696071358296e-05, + "loss": 0.0088, + "step": 338780 + }, + { + "epoch": 1.71, + "learning_rate": 4.3614128378344284e-05, + "loss": 0.0079, + "step": 338790 + }, + { + "epoch": 1.71, + "learning_rate": 4.360656068533028e-05, + "loss": 0.0072, + "step": 338800 + }, + { + "epoch": 1.71, + "learning_rate": 4.359899299231627e-05, + "loss": 0.0053, + "step": 338810 + }, + { + "epoch": 1.71, + "learning_rate": 4.3591425299302256e-05, + "loss": 0.0056, + "step": 338820 + }, + { + "epoch": 1.71, + "learning_rate": 4.358385760628825e-05, + "loss": 0.0082, + "step": 338830 + }, + { + "epoch": 1.71, + "learning_rate": 4.357628991327424e-05, + "loss": 0.0049, + "step": 338840 + }, + { + "epoch": 1.71, + "learning_rate": 4.356872222026023e-05, + "loss": 0.0061, + "step": 338850 + }, + { + "epoch": 1.71, + "learning_rate": 4.3561154527246215e-05, + "loss": 0.005, + "step": 338860 + }, + { + "epoch": 1.71, + "learning_rate": 4.355358683423221e-05, + "loss": 0.0063, + "step": 338870 + }, + { + "epoch": 1.71, + "learning_rate": 4.35460191412182e-05, + "loss": 0.0066, + "step": 338880 + }, + { + "epoch": 1.71, + "learning_rate": 4.353845144820418e-05, + "loss": 0.0061, + "step": 338890 + }, + { + "epoch": 1.71, + "learning_rate": 4.353088375519017e-05, + "loss": 0.0038, + "step": 338900 + }, + { + "epoch": 1.71, + "learning_rate": 4.3523316062176156e-05, + "loss": 0.006, + "step": 338910 + }, + { + "epoch": 1.71, + "learning_rate": 4.351574836916215e-05, + "loss": 0.0068, + "step": 338920 + }, + { + "epoch": 1.71, + "learning_rate": 4.350818067614814e-05, + "loss": 0.0049, + "step": 338930 + }, + { + "epoch": 1.71, + "learning_rate": 4.350061298313413e-05, + "loss": 0.0044, + "step": 338940 + }, + { + "epoch": 1.71, + "learning_rate": 4.3493045290120116e-05, + "loss": 0.0057, + "step": 338950 + }, + { + "epoch": 1.71, + "learning_rate": 4.348547759710611e-05, + "loss": 0.008, + "step": 338960 + }, + { + "epoch": 1.71, + "learning_rate": 4.34779099040921e-05, + "loss": 0.0053, + "step": 338970 + }, + { + "epoch": 1.71, + "learning_rate": 4.347034221107809e-05, + "loss": 0.0043, + "step": 338980 + }, + { + "epoch": 1.71, + "learning_rate": 4.3462774518064076e-05, + "loss": 0.0088, + "step": 338990 + }, + { + "epoch": 1.71, + "learning_rate": 4.345520682505007e-05, + "loss": 0.0057, + "step": 339000 + }, + { + "epoch": 1.71, + "eval_cer": 0.9144285288697699, + "eval_loss": 0.0047121611423790455, + "eval_runtime": 116.4797, + "eval_samples_per_second": 17.17, + "eval_steps_per_second": 4.293, + "step": 339000 + }, + { + "epoch": 1.71, + "learning_rate": 4.344763913203606e-05, + "loss": 0.0056, + "step": 339010 + }, + { + "epoch": 1.71, + "learning_rate": 4.344007143902205e-05, + "loss": 0.0057, + "step": 339020 + }, + { + "epoch": 1.71, + "learning_rate": 4.3432503746008035e-05, + "loss": 0.0096, + "step": 339030 + }, + { + "epoch": 1.71, + "learning_rate": 4.342493605299403e-05, + "loss": 0.0079, + "step": 339040 + }, + { + "epoch": 1.71, + "learning_rate": 4.341736835998002e-05, + "loss": 0.0053, + "step": 339050 + }, + { + "epoch": 1.71, + "learning_rate": 4.340980066696601e-05, + "loss": 0.0053, + "step": 339060 + }, + { + "epoch": 1.71, + "learning_rate": 4.3402232973951995e-05, + "loss": 0.0061, + "step": 339070 + }, + { + "epoch": 1.71, + "learning_rate": 4.339466528093799e-05, + "loss": 0.0059, + "step": 339080 + }, + { + "epoch": 1.71, + "learning_rate": 4.338709758792398e-05, + "loss": 0.0054, + "step": 339090 + }, + { + "epoch": 1.71, + "learning_rate": 4.3379529894909966e-05, + "loss": 0.006, + "step": 339100 + }, + { + "epoch": 1.71, + "learning_rate": 4.3371962201895955e-05, + "loss": 0.006, + "step": 339110 + }, + { + "epoch": 1.71, + "learning_rate": 4.336439450888195e-05, + "loss": 0.0072, + "step": 339120 + }, + { + "epoch": 1.71, + "learning_rate": 4.335682681586794e-05, + "loss": 0.0068, + "step": 339130 + }, + { + "epoch": 1.71, + "learning_rate": 4.3349259122853926e-05, + "loss": 0.0074, + "step": 339140 + }, + { + "epoch": 1.71, + "learning_rate": 4.3341691429839914e-05, + "loss": 0.006, + "step": 339150 + }, + { + "epoch": 1.71, + "learning_rate": 4.333412373682591e-05, + "loss": 0.0088, + "step": 339160 + }, + { + "epoch": 1.71, + "learning_rate": 4.33265560438119e-05, + "loss": 0.0069, + "step": 339170 + }, + { + "epoch": 1.71, + "learning_rate": 4.3318988350797886e-05, + "loss": 0.0055, + "step": 339180 + }, + { + "epoch": 1.71, + "learning_rate": 4.3311420657783874e-05, + "loss": 0.0068, + "step": 339190 + }, + { + "epoch": 1.71, + "learning_rate": 4.330385296476987e-05, + "loss": 0.0065, + "step": 339200 + }, + { + "epoch": 1.71, + "learning_rate": 4.329628527175585e-05, + "loss": 0.0048, + "step": 339210 + }, + { + "epoch": 1.71, + "learning_rate": 4.328871757874184e-05, + "loss": 0.0055, + "step": 339220 + }, + { + "epoch": 1.71, + "learning_rate": 4.328114988572783e-05, + "loss": 0.0065, + "step": 339230 + }, + { + "epoch": 1.71, + "learning_rate": 4.3273582192713815e-05, + "loss": 0.0081, + "step": 339240 + }, + { + "epoch": 1.71, + "learning_rate": 4.326601449969981e-05, + "loss": 0.0062, + "step": 339250 + }, + { + "epoch": 1.71, + "learning_rate": 4.32584468066858e-05, + "loss": 0.006, + "step": 339260 + }, + { + "epoch": 1.71, + "learning_rate": 4.3250879113671786e-05, + "loss": 0.0072, + "step": 339270 + }, + { + "epoch": 1.71, + "learning_rate": 4.3243311420657775e-05, + "loss": 0.0056, + "step": 339280 + }, + { + "epoch": 1.71, + "learning_rate": 4.323574372764377e-05, + "loss": 0.0035, + "step": 339290 + }, + { + "epoch": 1.71, + "learning_rate": 4.322817603462976e-05, + "loss": 0.0066, + "step": 339300 + }, + { + "epoch": 1.71, + "learning_rate": 4.3220608341615746e-05, + "loss": 0.0064, + "step": 339310 + }, + { + "epoch": 1.71, + "learning_rate": 4.321304064860174e-05, + "loss": 0.0061, + "step": 339320 + }, + { + "epoch": 1.71, + "learning_rate": 4.320547295558773e-05, + "loss": 0.0085, + "step": 339330 + }, + { + "epoch": 1.71, + "learning_rate": 4.319790526257372e-05, + "loss": 0.0052, + "step": 339340 + }, + { + "epoch": 1.71, + "learning_rate": 4.3190337569559706e-05, + "loss": 0.0055, + "step": 339350 + }, + { + "epoch": 1.71, + "learning_rate": 4.31827698765457e-05, + "loss": 0.0058, + "step": 339360 + }, + { + "epoch": 1.71, + "learning_rate": 4.317520218353169e-05, + "loss": 0.008, + "step": 339370 + }, + { + "epoch": 1.71, + "learning_rate": 4.316763449051768e-05, + "loss": 0.0047, + "step": 339380 + }, + { + "epoch": 1.71, + "learning_rate": 4.3160066797503665e-05, + "loss": 0.0064, + "step": 339390 + }, + { + "epoch": 1.71, + "learning_rate": 4.315249910448966e-05, + "loss": 0.0051, + "step": 339400 + }, + { + "epoch": 1.71, + "learning_rate": 4.314493141147565e-05, + "loss": 0.0086, + "step": 339410 + }, + { + "epoch": 1.71, + "learning_rate": 4.313736371846164e-05, + "loss": 0.0058, + "step": 339420 + }, + { + "epoch": 1.71, + "learning_rate": 4.3129796025447625e-05, + "loss": 0.0042, + "step": 339430 + }, + { + "epoch": 1.71, + "learning_rate": 4.312222833243362e-05, + "loss": 0.0052, + "step": 339440 + }, + { + "epoch": 1.71, + "learning_rate": 4.311466063941961e-05, + "loss": 0.0068, + "step": 339450 + }, + { + "epoch": 1.71, + "learning_rate": 4.3107092946405596e-05, + "loss": 0.0057, + "step": 339460 + }, + { + "epoch": 1.71, + "learning_rate": 4.3099525253391585e-05, + "loss": 0.0072, + "step": 339470 + }, + { + "epoch": 1.71, + "learning_rate": 4.309195756037758e-05, + "loss": 0.0063, + "step": 339480 + }, + { + "epoch": 1.71, + "learning_rate": 4.308438986736357e-05, + "loss": 0.0076, + "step": 339490 + }, + { + "epoch": 1.71, + "learning_rate": 4.3076822174349556e-05, + "loss": 0.0069, + "step": 339500 + }, + { + "epoch": 1.71, + "learning_rate": 4.3069254481335544e-05, + "loss": 0.0092, + "step": 339510 + }, + { + "epoch": 1.71, + "learning_rate": 4.3061686788321526e-05, + "loss": 0.0055, + "step": 339520 + }, + { + "epoch": 1.71, + "learning_rate": 4.305411909530752e-05, + "loss": 0.0074, + "step": 339530 + }, + { + "epoch": 1.71, + "learning_rate": 4.304655140229351e-05, + "loss": 0.0057, + "step": 339540 + }, + { + "epoch": 1.71, + "learning_rate": 4.30389837092795e-05, + "loss": 0.0046, + "step": 339550 + }, + { + "epoch": 1.71, + "learning_rate": 4.3031416016265485e-05, + "loss": 0.0076, + "step": 339560 + }, + { + "epoch": 1.71, + "learning_rate": 4.302384832325148e-05, + "loss": 0.0076, + "step": 339570 + }, + { + "epoch": 1.71, + "learning_rate": 4.301628063023747e-05, + "loss": 0.0079, + "step": 339580 + }, + { + "epoch": 1.71, + "learning_rate": 4.300871293722346e-05, + "loss": 0.0073, + "step": 339590 + }, + { + "epoch": 1.71, + "learning_rate": 4.3001145244209445e-05, + "loss": 0.0071, + "step": 339600 + }, + { + "epoch": 1.71, + "learning_rate": 4.299357755119544e-05, + "loss": 0.0081, + "step": 339610 + }, + { + "epoch": 1.71, + "learning_rate": 4.298600985818143e-05, + "loss": 0.0052, + "step": 339620 + }, + { + "epoch": 1.71, + "learning_rate": 4.2978442165167416e-05, + "loss": 0.0045, + "step": 339630 + }, + { + "epoch": 1.71, + "learning_rate": 4.2970874472153405e-05, + "loss": 0.0059, + "step": 339640 + }, + { + "epoch": 1.71, + "learning_rate": 4.29633067791394e-05, + "loss": 0.0093, + "step": 339650 + }, + { + "epoch": 1.71, + "learning_rate": 4.295573908612539e-05, + "loss": 0.0054, + "step": 339660 + }, + { + "epoch": 1.71, + "learning_rate": 4.2948171393111376e-05, + "loss": 0.0073, + "step": 339670 + }, + { + "epoch": 1.71, + "learning_rate": 4.2940603700097364e-05, + "loss": 0.0057, + "step": 339680 + }, + { + "epoch": 1.71, + "learning_rate": 4.293303600708336e-05, + "loss": 0.0059, + "step": 339690 + }, + { + "epoch": 1.71, + "learning_rate": 4.292546831406935e-05, + "loss": 0.0089, + "step": 339700 + }, + { + "epoch": 1.71, + "learning_rate": 4.2917900621055336e-05, + "loss": 0.0073, + "step": 339710 + }, + { + "epoch": 1.71, + "learning_rate": 4.2910332928041324e-05, + "loss": 0.0065, + "step": 339720 + }, + { + "epoch": 1.71, + "learning_rate": 4.290276523502732e-05, + "loss": 0.0063, + "step": 339730 + }, + { + "epoch": 1.71, + "learning_rate": 4.289519754201331e-05, + "loss": 0.0082, + "step": 339740 + }, + { + "epoch": 1.71, + "learning_rate": 4.2887629848999295e-05, + "loss": 0.0068, + "step": 339750 + }, + { + "epoch": 1.71, + "learning_rate": 4.2880062155985284e-05, + "loss": 0.0062, + "step": 339760 + }, + { + "epoch": 1.71, + "learning_rate": 4.287249446297128e-05, + "loss": 0.006, + "step": 339770 + }, + { + "epoch": 1.71, + "learning_rate": 4.286492676995727e-05, + "loss": 0.0077, + "step": 339780 + }, + { + "epoch": 1.71, + "learning_rate": 4.2857359076943255e-05, + "loss": 0.0062, + "step": 339790 + }, + { + "epoch": 1.71, + "learning_rate": 4.284979138392925e-05, + "loss": 0.0059, + "step": 339800 + }, + { + "epoch": 1.71, + "learning_rate": 4.284222369091524e-05, + "loss": 0.0071, + "step": 339810 + }, + { + "epoch": 1.71, + "learning_rate": 4.2834655997901227e-05, + "loss": 0.0053, + "step": 339820 + }, + { + "epoch": 1.71, + "learning_rate": 4.2827088304887215e-05, + "loss": 0.0069, + "step": 339830 + }, + { + "epoch": 1.71, + "learning_rate": 4.2819520611873196e-05, + "loss": 0.0071, + "step": 339840 + }, + { + "epoch": 1.71, + "learning_rate": 4.281195291885919e-05, + "loss": 0.0059, + "step": 339850 + }, + { + "epoch": 1.71, + "learning_rate": 4.280438522584518e-05, + "loss": 0.0069, + "step": 339860 + }, + { + "epoch": 1.71, + "learning_rate": 4.279681753283117e-05, + "loss": 0.0058, + "step": 339870 + }, + { + "epoch": 1.71, + "learning_rate": 4.2789249839817156e-05, + "loss": 0.0058, + "step": 339880 + }, + { + "epoch": 1.71, + "learning_rate": 4.278168214680315e-05, + "loss": 0.0055, + "step": 339890 + }, + { + "epoch": 1.71, + "learning_rate": 4.277411445378914e-05, + "loss": 0.0046, + "step": 339900 + }, + { + "epoch": 1.71, + "learning_rate": 4.276654676077513e-05, + "loss": 0.0054, + "step": 339910 + }, + { + "epoch": 1.71, + "learning_rate": 4.2758979067761115e-05, + "loss": 0.006, + "step": 339920 + }, + { + "epoch": 1.71, + "learning_rate": 4.275141137474711e-05, + "loss": 0.0065, + "step": 339930 + }, + { + "epoch": 1.72, + "learning_rate": 4.27438436817331e-05, + "loss": 0.0072, + "step": 339940 + }, + { + "epoch": 1.72, + "learning_rate": 4.273627598871909e-05, + "loss": 0.0046, + "step": 339950 + }, + { + "epoch": 1.72, + "learning_rate": 4.2728708295705075e-05, + "loss": 0.0049, + "step": 339960 + }, + { + "epoch": 1.72, + "learning_rate": 4.272114060269107e-05, + "loss": 0.0051, + "step": 339970 + }, + { + "epoch": 1.72, + "learning_rate": 4.271357290967706e-05, + "loss": 0.0068, + "step": 339980 + }, + { + "epoch": 1.72, + "learning_rate": 4.2706005216663047e-05, + "loss": 0.0073, + "step": 339990 + }, + { + "epoch": 1.72, + "learning_rate": 4.2698437523649035e-05, + "loss": 0.0059, + "step": 340000 + }, + { + "epoch": 1.72, + "eval_cer": 0.9144217360968921, + "eval_loss": 0.004758994095027447, + "eval_runtime": 116.784, + "eval_samples_per_second": 17.126, + "eval_steps_per_second": 4.281, + "step": 340000 + }, + { + "epoch": 1.72, + "learning_rate": 4.269086983063503e-05, + "loss": 0.0051, + "step": 340010 + }, + { + "epoch": 1.72, + "learning_rate": 4.268330213762102e-05, + "loss": 0.009, + "step": 340020 + }, + { + "epoch": 1.72, + "learning_rate": 4.2675734444607006e-05, + "loss": 0.0068, + "step": 340030 + }, + { + "epoch": 1.72, + "learning_rate": 4.2668166751592994e-05, + "loss": 0.0054, + "step": 340040 + }, + { + "epoch": 1.72, + "learning_rate": 4.266059905857899e-05, + "loss": 0.0063, + "step": 340050 + }, + { + "epoch": 1.72, + "learning_rate": 4.265303136556498e-05, + "loss": 0.0078, + "step": 340060 + }, + { + "epoch": 1.72, + "learning_rate": 4.2645463672550966e-05, + "loss": 0.006, + "step": 340070 + }, + { + "epoch": 1.72, + "learning_rate": 4.2637895979536954e-05, + "loss": 0.005, + "step": 340080 + }, + { + "epoch": 1.72, + "learning_rate": 4.263032828652295e-05, + "loss": 0.0083, + "step": 340090 + }, + { + "epoch": 1.72, + "learning_rate": 4.262276059350894e-05, + "loss": 0.005, + "step": 340100 + }, + { + "epoch": 1.72, + "learning_rate": 4.2615192900494926e-05, + "loss": 0.006, + "step": 340110 + }, + { + "epoch": 1.72, + "learning_rate": 4.2607625207480914e-05, + "loss": 0.0039, + "step": 340120 + }, + { + "epoch": 1.72, + "learning_rate": 4.260005751446691e-05, + "loss": 0.0057, + "step": 340130 + }, + { + "epoch": 1.72, + "learning_rate": 4.25924898214529e-05, + "loss": 0.0061, + "step": 340140 + }, + { + "epoch": 1.72, + "learning_rate": 4.258492212843888e-05, + "loss": 0.0055, + "step": 340150 + }, + { + "epoch": 1.72, + "learning_rate": 4.2577354435424867e-05, + "loss": 0.0045, + "step": 340160 + }, + { + "epoch": 1.72, + "learning_rate": 4.2569786742410855e-05, + "loss": 0.0068, + "step": 340170 + }, + { + "epoch": 1.72, + "learning_rate": 4.256221904939685e-05, + "loss": 0.0073, + "step": 340180 + }, + { + "epoch": 1.72, + "learning_rate": 4.255465135638284e-05, + "loss": 0.0052, + "step": 340190 + }, + { + "epoch": 1.72, + "learning_rate": 4.2547083663368826e-05, + "loss": 0.0063, + "step": 340200 + }, + { + "epoch": 1.72, + "learning_rate": 4.2539515970354814e-05, + "loss": 0.0065, + "step": 340210 + }, + { + "epoch": 1.72, + "learning_rate": 4.253194827734081e-05, + "loss": 0.0062, + "step": 340220 + }, + { + "epoch": 1.72, + "learning_rate": 4.25243805843268e-05, + "loss": 0.0036, + "step": 340230 + }, + { + "epoch": 1.72, + "learning_rate": 4.2516812891312786e-05, + "loss": 0.0061, + "step": 340240 + }, + { + "epoch": 1.72, + "learning_rate": 4.2509245198298774e-05, + "loss": 0.0046, + "step": 340250 + }, + { + "epoch": 1.72, + "learning_rate": 4.250167750528477e-05, + "loss": 0.006, + "step": 340260 + }, + { + "epoch": 1.72, + "learning_rate": 4.249410981227076e-05, + "loss": 0.0045, + "step": 340270 + }, + { + "epoch": 1.72, + "learning_rate": 4.2486542119256746e-05, + "loss": 0.008, + "step": 340280 + }, + { + "epoch": 1.72, + "learning_rate": 4.247897442624274e-05, + "loss": 0.0056, + "step": 340290 + }, + { + "epoch": 1.72, + "learning_rate": 4.247140673322873e-05, + "loss": 0.0051, + "step": 340300 + }, + { + "epoch": 1.72, + "learning_rate": 4.246383904021472e-05, + "loss": 0.0075, + "step": 340310 + }, + { + "epoch": 1.72, + "learning_rate": 4.2456271347200705e-05, + "loss": 0.009, + "step": 340320 + }, + { + "epoch": 1.72, + "learning_rate": 4.24487036541867e-05, + "loss": 0.0065, + "step": 340330 + }, + { + "epoch": 1.72, + "learning_rate": 4.244113596117269e-05, + "loss": 0.0075, + "step": 340340 + }, + { + "epoch": 1.72, + "learning_rate": 4.243356826815868e-05, + "loss": 0.0053, + "step": 340350 + }, + { + "epoch": 1.72, + "learning_rate": 4.2426000575144665e-05, + "loss": 0.006, + "step": 340360 + }, + { + "epoch": 1.72, + "learning_rate": 4.241843288213066e-05, + "loss": 0.0073, + "step": 340370 + }, + { + "epoch": 1.72, + "learning_rate": 4.241086518911665e-05, + "loss": 0.0066, + "step": 340380 + }, + { + "epoch": 1.72, + "learning_rate": 4.2403297496102636e-05, + "loss": 0.0062, + "step": 340390 + }, + { + "epoch": 1.72, + "learning_rate": 4.2395729803088625e-05, + "loss": 0.0073, + "step": 340400 + }, + { + "epoch": 1.72, + "learning_rate": 4.238816211007462e-05, + "loss": 0.008, + "step": 340410 + }, + { + "epoch": 1.72, + "learning_rate": 4.238059441706061e-05, + "loss": 0.0076, + "step": 340420 + }, + { + "epoch": 1.72, + "learning_rate": 4.2373026724046596e-05, + "loss": 0.007, + "step": 340430 + }, + { + "epoch": 1.72, + "learning_rate": 4.2365459031032584e-05, + "loss": 0.0072, + "step": 340440 + }, + { + "epoch": 1.72, + "learning_rate": 4.235789133801858e-05, + "loss": 0.006, + "step": 340450 + }, + { + "epoch": 1.72, + "learning_rate": 4.235032364500456e-05, + "loss": 0.0092, + "step": 340460 + }, + { + "epoch": 1.72, + "learning_rate": 4.234275595199055e-05, + "loss": 0.0055, + "step": 340470 + }, + { + "epoch": 1.72, + "learning_rate": 4.233518825897654e-05, + "loss": 0.0064, + "step": 340480 + }, + { + "epoch": 1.72, + "learning_rate": 4.2327620565962525e-05, + "loss": 0.0072, + "step": 340490 + }, + { + "epoch": 1.72, + "learning_rate": 4.232005287294852e-05, + "loss": 0.0061, + "step": 340500 + }, + { + "epoch": 1.72, + "learning_rate": 4.231248517993451e-05, + "loss": 0.0072, + "step": 340510 + }, + { + "epoch": 1.72, + "learning_rate": 4.23049174869205e-05, + "loss": 0.0052, + "step": 340520 + }, + { + "epoch": 1.72, + "learning_rate": 4.2297349793906485e-05, + "loss": 0.0049, + "step": 340530 + }, + { + "epoch": 1.72, + "learning_rate": 4.228978210089248e-05, + "loss": 0.0066, + "step": 340540 + }, + { + "epoch": 1.72, + "learning_rate": 4.228221440787847e-05, + "loss": 0.0053, + "step": 340550 + }, + { + "epoch": 1.72, + "learning_rate": 4.2274646714864456e-05, + "loss": 0.0096, + "step": 340560 + }, + { + "epoch": 1.72, + "learning_rate": 4.2267079021850445e-05, + "loss": 0.0053, + "step": 340570 + }, + { + "epoch": 1.72, + "learning_rate": 4.225951132883644e-05, + "loss": 0.0084, + "step": 340580 + }, + { + "epoch": 1.72, + "learning_rate": 4.225194363582243e-05, + "loss": 0.0061, + "step": 340590 + }, + { + "epoch": 1.72, + "learning_rate": 4.2244375942808416e-05, + "loss": 0.007, + "step": 340600 + }, + { + "epoch": 1.72, + "learning_rate": 4.2236808249794404e-05, + "loss": 0.0062, + "step": 340610 + }, + { + "epoch": 1.72, + "learning_rate": 4.22292405567804e-05, + "loss": 0.0078, + "step": 340620 + }, + { + "epoch": 1.72, + "learning_rate": 4.222167286376639e-05, + "loss": 0.0053, + "step": 340630 + }, + { + "epoch": 1.72, + "learning_rate": 4.2214105170752376e-05, + "loss": 0.0128, + "step": 340640 + }, + { + "epoch": 1.72, + "learning_rate": 4.2206537477738364e-05, + "loss": 0.005, + "step": 340650 + }, + { + "epoch": 1.72, + "learning_rate": 4.219896978472436e-05, + "loss": 0.0052, + "step": 340660 + }, + { + "epoch": 1.72, + "learning_rate": 4.219140209171035e-05, + "loss": 0.0058, + "step": 340670 + }, + { + "epoch": 1.72, + "learning_rate": 4.2183834398696335e-05, + "loss": 0.0069, + "step": 340680 + }, + { + "epoch": 1.72, + "learning_rate": 4.2176266705682324e-05, + "loss": 0.0061, + "step": 340690 + }, + { + "epoch": 1.72, + "learning_rate": 4.216869901266832e-05, + "loss": 0.0078, + "step": 340700 + }, + { + "epoch": 1.72, + "learning_rate": 4.216113131965431e-05, + "loss": 0.0069, + "step": 340710 + }, + { + "epoch": 1.72, + "learning_rate": 4.2153563626640295e-05, + "loss": 0.007, + "step": 340720 + }, + { + "epoch": 1.72, + "learning_rate": 4.214599593362628e-05, + "loss": 0.0065, + "step": 340730 + }, + { + "epoch": 1.72, + "learning_rate": 4.213842824061228e-05, + "loss": 0.0075, + "step": 340740 + }, + { + "epoch": 1.72, + "learning_rate": 4.2130860547598266e-05, + "loss": 0.0069, + "step": 340750 + }, + { + "epoch": 1.72, + "learning_rate": 4.2123292854584255e-05, + "loss": 0.0065, + "step": 340760 + }, + { + "epoch": 1.72, + "learning_rate": 4.211572516157025e-05, + "loss": 0.0065, + "step": 340770 + }, + { + "epoch": 1.72, + "learning_rate": 4.210815746855623e-05, + "loss": 0.0082, + "step": 340780 + }, + { + "epoch": 1.72, + "learning_rate": 4.210058977554222e-05, + "loss": 0.0045, + "step": 340790 + }, + { + "epoch": 1.72, + "learning_rate": 4.209302208252821e-05, + "loss": 0.0057, + "step": 340800 + }, + { + "epoch": 1.72, + "learning_rate": 4.2085454389514196e-05, + "loss": 0.0063, + "step": 340810 + }, + { + "epoch": 1.72, + "learning_rate": 4.207788669650019e-05, + "loss": 0.0062, + "step": 340820 + }, + { + "epoch": 1.72, + "learning_rate": 4.207031900348618e-05, + "loss": 0.0097, + "step": 340830 + }, + { + "epoch": 1.72, + "learning_rate": 4.206275131047217e-05, + "loss": 0.0082, + "step": 340840 + }, + { + "epoch": 1.72, + "learning_rate": 4.2055183617458155e-05, + "loss": 0.0061, + "step": 340850 + }, + { + "epoch": 1.72, + "learning_rate": 4.204761592444415e-05, + "loss": 0.0058, + "step": 340860 + }, + { + "epoch": 1.72, + "learning_rate": 4.204004823143014e-05, + "loss": 0.0086, + "step": 340870 + }, + { + "epoch": 1.72, + "learning_rate": 4.203248053841613e-05, + "loss": 0.0055, + "step": 340880 + }, + { + "epoch": 1.72, + "learning_rate": 4.2024912845402115e-05, + "loss": 0.0048, + "step": 340890 + }, + { + "epoch": 1.72, + "learning_rate": 4.201734515238811e-05, + "loss": 0.0063, + "step": 340900 + }, + { + "epoch": 1.72, + "learning_rate": 4.20097774593741e-05, + "loss": 0.0054, + "step": 340910 + }, + { + "epoch": 1.72, + "learning_rate": 4.2002209766360086e-05, + "loss": 0.0048, + "step": 340920 + }, + { + "epoch": 1.72, + "learning_rate": 4.1994642073346075e-05, + "loss": 0.0056, + "step": 340930 + }, + { + "epoch": 1.72, + "learning_rate": 4.198707438033207e-05, + "loss": 0.0067, + "step": 340940 + }, + { + "epoch": 1.72, + "learning_rate": 4.197950668731806e-05, + "loss": 0.0076, + "step": 340950 + }, + { + "epoch": 1.72, + "learning_rate": 4.1971938994304046e-05, + "loss": 0.0057, + "step": 340960 + }, + { + "epoch": 1.72, + "learning_rate": 4.1964371301290034e-05, + "loss": 0.006, + "step": 340970 + }, + { + "epoch": 1.72, + "learning_rate": 4.195680360827603e-05, + "loss": 0.0066, + "step": 340980 + }, + { + "epoch": 1.72, + "learning_rate": 4.194923591526202e-05, + "loss": 0.0058, + "step": 340990 + }, + { + "epoch": 1.72, + "learning_rate": 4.1941668222248006e-05, + "loss": 0.0053, + "step": 341000 + }, + { + "epoch": 1.72, + "eval_cer": 0.9144285288697699, + "eval_loss": 0.00470845028758049, + "eval_runtime": 116.8214, + "eval_samples_per_second": 17.12, + "eval_steps_per_second": 4.28, + "step": 341000 + }, + { + "epoch": 1.72, + "learning_rate": 4.1934100529233994e-05, + "loss": 0.0051, + "step": 341010 + }, + { + "epoch": 1.72, + "learning_rate": 4.192653283621999e-05, + "loss": 0.0075, + "step": 341020 + }, + { + "epoch": 1.72, + "learning_rate": 4.191896514320598e-05, + "loss": 0.0072, + "step": 341030 + }, + { + "epoch": 1.72, + "learning_rate": 4.1911397450191965e-05, + "loss": 0.007, + "step": 341040 + }, + { + "epoch": 1.72, + "learning_rate": 4.1903829757177954e-05, + "loss": 0.0043, + "step": 341050 + }, + { + "epoch": 1.72, + "learning_rate": 4.189626206416395e-05, + "loss": 0.0071, + "step": 341060 + }, + { + "epoch": 1.72, + "learning_rate": 4.188869437114994e-05, + "loss": 0.0068, + "step": 341070 + }, + { + "epoch": 1.72, + "learning_rate": 4.1881126678135925e-05, + "loss": 0.0062, + "step": 341080 + }, + { + "epoch": 1.72, + "learning_rate": 4.1873558985121906e-05, + "loss": 0.005, + "step": 341090 + }, + { + "epoch": 1.72, + "learning_rate": 4.1865991292107895e-05, + "loss": 0.0064, + "step": 341100 + }, + { + "epoch": 1.72, + "learning_rate": 4.185842359909389e-05, + "loss": 0.0053, + "step": 341110 + }, + { + "epoch": 1.72, + "learning_rate": 4.185085590607988e-05, + "loss": 0.008, + "step": 341120 + }, + { + "epoch": 1.72, + "learning_rate": 4.1843288213065866e-05, + "loss": 0.0063, + "step": 341130 + }, + { + "epoch": 1.72, + "learning_rate": 4.1835720520051854e-05, + "loss": 0.0068, + "step": 341140 + }, + { + "epoch": 1.72, + "learning_rate": 4.182815282703785e-05, + "loss": 0.0061, + "step": 341150 + }, + { + "epoch": 1.72, + "learning_rate": 4.182058513402384e-05, + "loss": 0.0113, + "step": 341160 + }, + { + "epoch": 1.72, + "learning_rate": 4.1813017441009826e-05, + "loss": 0.0062, + "step": 341170 + }, + { + "epoch": 1.72, + "learning_rate": 4.1805449747995814e-05, + "loss": 0.005, + "step": 341180 + }, + { + "epoch": 1.72, + "learning_rate": 4.179788205498181e-05, + "loss": 0.0057, + "step": 341190 + }, + { + "epoch": 1.72, + "learning_rate": 4.17903143619678e-05, + "loss": 0.007, + "step": 341200 + }, + { + "epoch": 1.72, + "learning_rate": 4.1782746668953785e-05, + "loss": 0.0044, + "step": 341210 + }, + { + "epoch": 1.72, + "learning_rate": 4.1775178975939774e-05, + "loss": 0.006, + "step": 341220 + }, + { + "epoch": 1.72, + "learning_rate": 4.176761128292577e-05, + "loss": 0.0066, + "step": 341230 + }, + { + "epoch": 1.72, + "learning_rate": 4.176004358991176e-05, + "loss": 0.0058, + "step": 341240 + }, + { + "epoch": 1.72, + "learning_rate": 4.1752475896897745e-05, + "loss": 0.006, + "step": 341250 + }, + { + "epoch": 1.72, + "learning_rate": 4.174490820388374e-05, + "loss": 0.008, + "step": 341260 + }, + { + "epoch": 1.72, + "learning_rate": 4.173734051086973e-05, + "loss": 0.0061, + "step": 341270 + }, + { + "epoch": 1.72, + "learning_rate": 4.1729772817855717e-05, + "loss": 0.0052, + "step": 341280 + }, + { + "epoch": 1.72, + "learning_rate": 4.1722205124841705e-05, + "loss": 0.005, + "step": 341290 + }, + { + "epoch": 1.72, + "learning_rate": 4.17146374318277e-05, + "loss": 0.008, + "step": 341300 + }, + { + "epoch": 1.72, + "learning_rate": 4.170706973881369e-05, + "loss": 0.0053, + "step": 341310 + }, + { + "epoch": 1.72, + "learning_rate": 4.1699502045799676e-05, + "loss": 0.0055, + "step": 341320 + }, + { + "epoch": 1.72, + "learning_rate": 4.1691934352785664e-05, + "loss": 0.0079, + "step": 341330 + }, + { + "epoch": 1.72, + "learning_rate": 4.168436665977166e-05, + "loss": 0.0067, + "step": 341340 + }, + { + "epoch": 1.72, + "learning_rate": 4.167679896675765e-05, + "loss": 0.0054, + "step": 341350 + }, + { + "epoch": 1.72, + "learning_rate": 4.1669231273743636e-05, + "loss": 0.0045, + "step": 341360 + }, + { + "epoch": 1.72, + "learning_rate": 4.1661663580729624e-05, + "loss": 0.0064, + "step": 341370 + }, + { + "epoch": 1.72, + "learning_rate": 4.165409588771562e-05, + "loss": 0.0085, + "step": 341380 + }, + { + "epoch": 1.72, + "learning_rate": 4.164652819470161e-05, + "loss": 0.0081, + "step": 341390 + }, + { + "epoch": 1.72, + "learning_rate": 4.1638960501687595e-05, + "loss": 0.0069, + "step": 341400 + }, + { + "epoch": 1.72, + "learning_rate": 4.163139280867358e-05, + "loss": 0.0059, + "step": 341410 + }, + { + "epoch": 1.72, + "learning_rate": 4.1623825115659565e-05, + "loss": 0.0055, + "step": 341420 + }, + { + "epoch": 1.72, + "learning_rate": 4.161625742264556e-05, + "loss": 0.0084, + "step": 341430 + }, + { + "epoch": 1.72, + "learning_rate": 4.160868972963155e-05, + "loss": 0.0103, + "step": 341440 + }, + { + "epoch": 1.72, + "learning_rate": 4.1601122036617537e-05, + "loss": 0.008, + "step": 341450 + }, + { + "epoch": 1.72, + "learning_rate": 4.1593554343603525e-05, + "loss": 0.0066, + "step": 341460 + }, + { + "epoch": 1.72, + "learning_rate": 4.158598665058952e-05, + "loss": 0.0068, + "step": 341470 + }, + { + "epoch": 1.72, + "learning_rate": 4.157841895757551e-05, + "loss": 0.0056, + "step": 341480 + }, + { + "epoch": 1.72, + "learning_rate": 4.1570851264561496e-05, + "loss": 0.0064, + "step": 341490 + }, + { + "epoch": 1.72, + "learning_rate": 4.1563283571547484e-05, + "loss": 0.0059, + "step": 341500 + }, + { + "epoch": 1.72, + "learning_rate": 4.155571587853348e-05, + "loss": 0.0075, + "step": 341510 + }, + { + "epoch": 1.72, + "learning_rate": 4.154814818551947e-05, + "loss": 0.0071, + "step": 341520 + }, + { + "epoch": 1.72, + "learning_rate": 4.1540580492505456e-05, + "loss": 0.0058, + "step": 341530 + }, + { + "epoch": 1.72, + "learning_rate": 4.1533012799491444e-05, + "loss": 0.0074, + "step": 341540 + }, + { + "epoch": 1.72, + "learning_rate": 4.152544510647744e-05, + "loss": 0.0079, + "step": 341550 + }, + { + "epoch": 1.72, + "learning_rate": 4.151787741346343e-05, + "loss": 0.0065, + "step": 341560 + }, + { + "epoch": 1.72, + "learning_rate": 4.1510309720449416e-05, + "loss": 0.0062, + "step": 341570 + }, + { + "epoch": 1.72, + "learning_rate": 4.1502742027435404e-05, + "loss": 0.0051, + "step": 341580 + }, + { + "epoch": 1.72, + "learning_rate": 4.14951743344214e-05, + "loss": 0.0048, + "step": 341590 + }, + { + "epoch": 1.72, + "learning_rate": 4.148760664140739e-05, + "loss": 0.0072, + "step": 341600 + }, + { + "epoch": 1.72, + "learning_rate": 4.1480038948393375e-05, + "loss": 0.0066, + "step": 341610 + }, + { + "epoch": 1.72, + "learning_rate": 4.1472471255379363e-05, + "loss": 0.0046, + "step": 341620 + }, + { + "epoch": 1.72, + "learning_rate": 4.146490356236536e-05, + "loss": 0.0052, + "step": 341630 + }, + { + "epoch": 1.72, + "learning_rate": 4.1457335869351347e-05, + "loss": 0.0059, + "step": 341640 + }, + { + "epoch": 1.72, + "learning_rate": 4.1449768176337335e-05, + "loss": 0.0054, + "step": 341650 + }, + { + "epoch": 1.72, + "learning_rate": 4.144220048332332e-05, + "loss": 0.0076, + "step": 341660 + }, + { + "epoch": 1.72, + "learning_rate": 4.143463279030932e-05, + "loss": 0.0065, + "step": 341670 + }, + { + "epoch": 1.72, + "learning_rate": 4.1427065097295306e-05, + "loss": 0.0062, + "step": 341680 + }, + { + "epoch": 1.72, + "learning_rate": 4.1419497404281294e-05, + "loss": 0.0076, + "step": 341690 + }, + { + "epoch": 1.72, + "learning_rate": 4.141192971126728e-05, + "loss": 0.0071, + "step": 341700 + }, + { + "epoch": 1.72, + "learning_rate": 4.140436201825328e-05, + "loss": 0.0058, + "step": 341710 + }, + { + "epoch": 1.72, + "learning_rate": 4.139679432523926e-05, + "loss": 0.0105, + "step": 341720 + }, + { + "epoch": 1.72, + "learning_rate": 4.138922663222525e-05, + "loss": 0.0065, + "step": 341730 + }, + { + "epoch": 1.72, + "learning_rate": 4.1381658939211236e-05, + "loss": 0.0053, + "step": 341740 + }, + { + "epoch": 1.72, + "learning_rate": 4.137409124619723e-05, + "loss": 0.0054, + "step": 341750 + }, + { + "epoch": 1.72, + "learning_rate": 4.136652355318322e-05, + "loss": 0.0069, + "step": 341760 + }, + { + "epoch": 1.72, + "learning_rate": 4.135895586016921e-05, + "loss": 0.0062, + "step": 341770 + }, + { + "epoch": 1.72, + "learning_rate": 4.1351388167155195e-05, + "loss": 0.0079, + "step": 341780 + }, + { + "epoch": 1.72, + "learning_rate": 4.134382047414119e-05, + "loss": 0.0088, + "step": 341790 + }, + { + "epoch": 1.72, + "learning_rate": 4.133625278112718e-05, + "loss": 0.0043, + "step": 341800 + }, + { + "epoch": 1.72, + "learning_rate": 4.132868508811317e-05, + "loss": 0.0067, + "step": 341810 + }, + { + "epoch": 1.72, + "learning_rate": 4.1321117395099155e-05, + "loss": 0.0071, + "step": 341820 + }, + { + "epoch": 1.72, + "learning_rate": 4.131354970208515e-05, + "loss": 0.0077, + "step": 341830 + }, + { + "epoch": 1.72, + "learning_rate": 4.130598200907114e-05, + "loss": 0.0054, + "step": 341840 + }, + { + "epoch": 1.72, + "learning_rate": 4.1298414316057126e-05, + "loss": 0.0046, + "step": 341850 + }, + { + "epoch": 1.72, + "learning_rate": 4.1290846623043115e-05, + "loss": 0.006, + "step": 341860 + }, + { + "epoch": 1.72, + "learning_rate": 4.128327893002911e-05, + "loss": 0.006, + "step": 341870 + }, + { + "epoch": 1.72, + "learning_rate": 4.12757112370151e-05, + "loss": 0.0065, + "step": 341880 + }, + { + "epoch": 1.72, + "learning_rate": 4.1268143544001086e-05, + "loss": 0.005, + "step": 341890 + }, + { + "epoch": 1.72, + "learning_rate": 4.1260575850987074e-05, + "loss": 0.0054, + "step": 341900 + }, + { + "epoch": 1.72, + "learning_rate": 4.125300815797307e-05, + "loss": 0.0073, + "step": 341910 + }, + { + "epoch": 1.73, + "learning_rate": 4.124544046495906e-05, + "loss": 0.0047, + "step": 341920 + }, + { + "epoch": 1.73, + "learning_rate": 4.1237872771945046e-05, + "loss": 0.0055, + "step": 341930 + }, + { + "epoch": 1.73, + "learning_rate": 4.1230305078931034e-05, + "loss": 0.0078, + "step": 341940 + }, + { + "epoch": 1.73, + "learning_rate": 4.122273738591703e-05, + "loss": 0.0069, + "step": 341950 + }, + { + "epoch": 1.73, + "learning_rate": 4.121516969290302e-05, + "loss": 0.0068, + "step": 341960 + }, + { + "epoch": 1.73, + "learning_rate": 4.1207601999889005e-05, + "loss": 0.0088, + "step": 341970 + }, + { + "epoch": 1.73, + "learning_rate": 4.1200034306874993e-05, + "loss": 0.0068, + "step": 341980 + }, + { + "epoch": 1.73, + "learning_rate": 4.119246661386099e-05, + "loss": 0.0071, + "step": 341990 + }, + { + "epoch": 1.73, + "learning_rate": 4.118489892084698e-05, + "loss": 0.0068, + "step": 342000 + }, + { + "epoch": 1.73, + "eval_cer": 0.9144217360968921, + "eval_loss": 0.004726854152977467, + "eval_runtime": 116.8239, + "eval_samples_per_second": 17.12, + "eval_steps_per_second": 4.28, + "step": 342000 + }, + { + "epoch": 1.73, + "learning_rate": 4.1177331227832965e-05, + "loss": 0.0063, + "step": 342010 + }, + { + "epoch": 1.73, + "learning_rate": 4.116976353481895e-05, + "loss": 0.0071, + "step": 342020 + }, + { + "epoch": 1.73, + "learning_rate": 4.116219584180495e-05, + "loss": 0.0046, + "step": 342030 + }, + { + "epoch": 1.73, + "learning_rate": 4.115462814879093e-05, + "loss": 0.0056, + "step": 342040 + }, + { + "epoch": 1.73, + "learning_rate": 4.114706045577692e-05, + "loss": 0.0053, + "step": 342050 + }, + { + "epoch": 1.73, + "learning_rate": 4.1139492762762906e-05, + "loss": 0.0069, + "step": 342060 + }, + { + "epoch": 1.73, + "learning_rate": 4.1131925069748894e-05, + "loss": 0.0048, + "step": 342070 + }, + { + "epoch": 1.73, + "learning_rate": 4.112435737673489e-05, + "loss": 0.0054, + "step": 342080 + }, + { + "epoch": 1.73, + "learning_rate": 4.111678968372088e-05, + "loss": 0.0062, + "step": 342090 + }, + { + "epoch": 1.73, + "learning_rate": 4.1109221990706866e-05, + "loss": 0.0048, + "step": 342100 + }, + { + "epoch": 1.73, + "learning_rate": 4.1101654297692854e-05, + "loss": 0.0073, + "step": 342110 + }, + { + "epoch": 1.73, + "learning_rate": 4.109408660467885e-05, + "loss": 0.0064, + "step": 342120 + }, + { + "epoch": 1.73, + "learning_rate": 4.108651891166484e-05, + "loss": 0.0045, + "step": 342130 + }, + { + "epoch": 1.73, + "learning_rate": 4.1078951218650825e-05, + "loss": 0.0069, + "step": 342140 + }, + { + "epoch": 1.73, + "learning_rate": 4.1071383525636814e-05, + "loss": 0.0068, + "step": 342150 + }, + { + "epoch": 1.73, + "learning_rate": 4.106381583262281e-05, + "loss": 0.0057, + "step": 342160 + }, + { + "epoch": 1.73, + "learning_rate": 4.10562481396088e-05, + "loss": 0.0061, + "step": 342170 + }, + { + "epoch": 1.73, + "learning_rate": 4.1048680446594785e-05, + "loss": 0.0061, + "step": 342180 + }, + { + "epoch": 1.73, + "learning_rate": 4.104111275358077e-05, + "loss": 0.0098, + "step": 342190 + }, + { + "epoch": 1.73, + "learning_rate": 4.103354506056677e-05, + "loss": 0.0062, + "step": 342200 + }, + { + "epoch": 1.73, + "learning_rate": 4.1025977367552756e-05, + "loss": 0.0056, + "step": 342210 + }, + { + "epoch": 1.73, + "learning_rate": 4.1018409674538745e-05, + "loss": 0.0046, + "step": 342220 + }, + { + "epoch": 1.73, + "learning_rate": 4.101084198152474e-05, + "loss": 0.0079, + "step": 342230 + }, + { + "epoch": 1.73, + "learning_rate": 4.100327428851073e-05, + "loss": 0.0059, + "step": 342240 + }, + { + "epoch": 1.73, + "learning_rate": 4.0995706595496716e-05, + "loss": 0.0053, + "step": 342250 + }, + { + "epoch": 1.73, + "learning_rate": 4.0988138902482704e-05, + "loss": 0.0065, + "step": 342260 + }, + { + "epoch": 1.73, + "learning_rate": 4.09805712094687e-05, + "loss": 0.0084, + "step": 342270 + }, + { + "epoch": 1.73, + "learning_rate": 4.097300351645469e-05, + "loss": 0.0067, + "step": 342280 + }, + { + "epoch": 1.73, + "learning_rate": 4.0965435823440676e-05, + "loss": 0.0063, + "step": 342290 + }, + { + "epoch": 1.73, + "learning_rate": 4.0957868130426664e-05, + "loss": 0.0072, + "step": 342300 + }, + { + "epoch": 1.73, + "learning_rate": 4.095030043741266e-05, + "loss": 0.0047, + "step": 342310 + }, + { + "epoch": 1.73, + "learning_rate": 4.094273274439865e-05, + "loss": 0.0089, + "step": 342320 + }, + { + "epoch": 1.73, + "learning_rate": 4.0935165051384635e-05, + "loss": 0.0066, + "step": 342330 + }, + { + "epoch": 1.73, + "learning_rate": 4.0927597358370624e-05, + "loss": 0.0065, + "step": 342340 + }, + { + "epoch": 1.73, + "learning_rate": 4.0920029665356605e-05, + "loss": 0.0095, + "step": 342350 + }, + { + "epoch": 1.73, + "learning_rate": 4.09124619723426e-05, + "loss": 0.0055, + "step": 342360 + }, + { + "epoch": 1.73, + "learning_rate": 4.090489427932859e-05, + "loss": 0.0069, + "step": 342370 + }, + { + "epoch": 1.73, + "learning_rate": 4.0897326586314576e-05, + "loss": 0.0068, + "step": 342380 + }, + { + "epoch": 1.73, + "learning_rate": 4.0889758893300565e-05, + "loss": 0.0051, + "step": 342390 + }, + { + "epoch": 1.73, + "learning_rate": 4.088219120028656e-05, + "loss": 0.0047, + "step": 342400 + }, + { + "epoch": 1.73, + "learning_rate": 4.087462350727255e-05, + "loss": 0.0069, + "step": 342410 + }, + { + "epoch": 1.73, + "learning_rate": 4.0867055814258536e-05, + "loss": 0.0069, + "step": 342420 + }, + { + "epoch": 1.73, + "learning_rate": 4.0859488121244524e-05, + "loss": 0.0048, + "step": 342430 + }, + { + "epoch": 1.73, + "learning_rate": 4.085192042823052e-05, + "loss": 0.006, + "step": 342440 + }, + { + "epoch": 1.73, + "learning_rate": 4.084435273521651e-05, + "loss": 0.007, + "step": 342450 + }, + { + "epoch": 1.73, + "learning_rate": 4.0836785042202496e-05, + "loss": 0.0052, + "step": 342460 + }, + { + "epoch": 1.73, + "learning_rate": 4.0829217349188484e-05, + "loss": 0.0079, + "step": 342470 + }, + { + "epoch": 1.73, + "learning_rate": 4.082164965617448e-05, + "loss": 0.0064, + "step": 342480 + }, + { + "epoch": 1.73, + "learning_rate": 4.081408196316047e-05, + "loss": 0.0064, + "step": 342490 + }, + { + "epoch": 1.73, + "learning_rate": 4.0806514270146455e-05, + "loss": 0.007, + "step": 342500 + }, + { + "epoch": 1.73, + "learning_rate": 4.0798946577132444e-05, + "loss": 0.0072, + "step": 342510 + }, + { + "epoch": 1.73, + "learning_rate": 4.079137888411844e-05, + "loss": 0.0057, + "step": 342520 + }, + { + "epoch": 1.73, + "learning_rate": 4.078381119110443e-05, + "loss": 0.007, + "step": 342530 + }, + { + "epoch": 1.73, + "learning_rate": 4.0776243498090415e-05, + "loss": 0.0066, + "step": 342540 + }, + { + "epoch": 1.73, + "learning_rate": 4.07686758050764e-05, + "loss": 0.0059, + "step": 342550 + }, + { + "epoch": 1.73, + "learning_rate": 4.07611081120624e-05, + "loss": 0.0103, + "step": 342560 + }, + { + "epoch": 1.73, + "learning_rate": 4.0753540419048386e-05, + "loss": 0.0053, + "step": 342570 + }, + { + "epoch": 1.73, + "learning_rate": 4.0745972726034375e-05, + "loss": 0.0115, + "step": 342580 + }, + { + "epoch": 1.73, + "learning_rate": 4.073840503302036e-05, + "loss": 0.0059, + "step": 342590 + }, + { + "epoch": 1.73, + "learning_rate": 4.073083734000636e-05, + "loss": 0.0067, + "step": 342600 + }, + { + "epoch": 1.73, + "learning_rate": 4.0723269646992346e-05, + "loss": 0.0077, + "step": 342610 + }, + { + "epoch": 1.73, + "learning_rate": 4.0715701953978334e-05, + "loss": 0.0071, + "step": 342620 + }, + { + "epoch": 1.73, + "learning_rate": 4.070813426096432e-05, + "loss": 0.0063, + "step": 342630 + }, + { + "epoch": 1.73, + "learning_rate": 4.070056656795032e-05, + "loss": 0.0078, + "step": 342640 + }, + { + "epoch": 1.73, + "learning_rate": 4.0692998874936306e-05, + "loss": 0.0079, + "step": 342650 + }, + { + "epoch": 1.73, + "learning_rate": 4.068543118192229e-05, + "loss": 0.0065, + "step": 342660 + }, + { + "epoch": 1.73, + "learning_rate": 4.0677863488908275e-05, + "loss": 0.0073, + "step": 342670 + }, + { + "epoch": 1.73, + "learning_rate": 4.067029579589427e-05, + "loss": 0.0058, + "step": 342680 + }, + { + "epoch": 1.73, + "learning_rate": 4.066272810288026e-05, + "loss": 0.007, + "step": 342690 + }, + { + "epoch": 1.73, + "learning_rate": 4.065516040986625e-05, + "loss": 0.0076, + "step": 342700 + }, + { + "epoch": 1.73, + "learning_rate": 4.0647592716852235e-05, + "loss": 0.0068, + "step": 342710 + }, + { + "epoch": 1.73, + "learning_rate": 4.064002502383823e-05, + "loss": 0.009, + "step": 342720 + }, + { + "epoch": 1.73, + "learning_rate": 4.063245733082422e-05, + "loss": 0.007, + "step": 342730 + }, + { + "epoch": 1.73, + "learning_rate": 4.0624889637810207e-05, + "loss": 0.0054, + "step": 342740 + }, + { + "epoch": 1.73, + "learning_rate": 4.0617321944796195e-05, + "loss": 0.0063, + "step": 342750 + }, + { + "epoch": 1.73, + "learning_rate": 4.060975425178219e-05, + "loss": 0.0059, + "step": 342760 + }, + { + "epoch": 1.73, + "learning_rate": 4.060218655876818e-05, + "loss": 0.0069, + "step": 342770 + }, + { + "epoch": 1.73, + "learning_rate": 4.0594618865754166e-05, + "loss": 0.0049, + "step": 342780 + }, + { + "epoch": 1.73, + "learning_rate": 4.0587051172740154e-05, + "loss": 0.0064, + "step": 342790 + }, + { + "epoch": 1.73, + "learning_rate": 4.057948347972615e-05, + "loss": 0.0067, + "step": 342800 + }, + { + "epoch": 1.73, + "learning_rate": 4.057191578671214e-05, + "loss": 0.0055, + "step": 342810 + }, + { + "epoch": 1.73, + "learning_rate": 4.0564348093698126e-05, + "loss": 0.0057, + "step": 342820 + }, + { + "epoch": 1.73, + "learning_rate": 4.0556780400684114e-05, + "loss": 0.0058, + "step": 342830 + }, + { + "epoch": 1.73, + "learning_rate": 4.054921270767011e-05, + "loss": 0.0053, + "step": 342840 + }, + { + "epoch": 1.73, + "learning_rate": 4.05416450146561e-05, + "loss": 0.0053, + "step": 342850 + }, + { + "epoch": 1.73, + "learning_rate": 4.0534077321642085e-05, + "loss": 0.0059, + "step": 342860 + }, + { + "epoch": 1.73, + "learning_rate": 4.0526509628628074e-05, + "loss": 0.0048, + "step": 342870 + }, + { + "epoch": 1.73, + "learning_rate": 4.051894193561407e-05, + "loss": 0.0057, + "step": 342880 + }, + { + "epoch": 1.73, + "learning_rate": 4.051137424260006e-05, + "loss": 0.0048, + "step": 342890 + }, + { + "epoch": 1.73, + "learning_rate": 4.0503806549586045e-05, + "loss": 0.0066, + "step": 342900 + }, + { + "epoch": 1.73, + "learning_rate": 4.049623885657203e-05, + "loss": 0.0056, + "step": 342910 + }, + { + "epoch": 1.73, + "learning_rate": 4.048867116355803e-05, + "loss": 0.0063, + "step": 342920 + }, + { + "epoch": 1.73, + "learning_rate": 4.0481103470544017e-05, + "loss": 0.0047, + "step": 342930 + }, + { + "epoch": 1.73, + "learning_rate": 4.0473535777530005e-05, + "loss": 0.0053, + "step": 342940 + }, + { + "epoch": 1.73, + "learning_rate": 4.046596808451599e-05, + "loss": 0.0052, + "step": 342950 + }, + { + "epoch": 1.73, + "learning_rate": 4.045840039150199e-05, + "loss": 0.0072, + "step": 342960 + }, + { + "epoch": 1.73, + "learning_rate": 4.0450832698487976e-05, + "loss": 0.0061, + "step": 342970 + }, + { + "epoch": 1.73, + "learning_rate": 4.044326500547396e-05, + "loss": 0.0084, + "step": 342980 + }, + { + "epoch": 1.73, + "learning_rate": 4.0435697312459946e-05, + "loss": 0.0058, + "step": 342990 + }, + { + "epoch": 1.73, + "learning_rate": 4.0428129619445934e-05, + "loss": 0.005, + "step": 343000 + }, + { + "epoch": 1.73, + "eval_cer": 0.9144333808503969, + "eval_loss": 0.00461353175342083, + "eval_runtime": 116.7176, + "eval_samples_per_second": 17.135, + "eval_steps_per_second": 4.284, + "step": 343000 + }, + { + "epoch": 1.73, + "learning_rate": 4.042056192643193e-05, + "loss": 0.0097, + "step": 343010 + }, + { + "epoch": 1.73, + "learning_rate": 4.041299423341792e-05, + "loss": 0.0053, + "step": 343020 + }, + { + "epoch": 1.73, + "learning_rate": 4.0405426540403906e-05, + "loss": 0.0051, + "step": 343030 + }, + { + "epoch": 1.73, + "learning_rate": 4.0397858847389894e-05, + "loss": 0.0072, + "step": 343040 + }, + { + "epoch": 1.73, + "learning_rate": 4.039029115437589e-05, + "loss": 0.0068, + "step": 343050 + }, + { + "epoch": 1.73, + "learning_rate": 4.038272346136188e-05, + "loss": 0.0061, + "step": 343060 + }, + { + "epoch": 1.73, + "learning_rate": 4.0375155768347865e-05, + "loss": 0.0049, + "step": 343070 + }, + { + "epoch": 1.73, + "learning_rate": 4.0367588075333853e-05, + "loss": 0.0053, + "step": 343080 + }, + { + "epoch": 1.73, + "learning_rate": 4.036002038231985e-05, + "loss": 0.0069, + "step": 343090 + }, + { + "epoch": 1.73, + "learning_rate": 4.0352452689305837e-05, + "loss": 0.0059, + "step": 343100 + }, + { + "epoch": 1.73, + "learning_rate": 4.0344884996291825e-05, + "loss": 0.0052, + "step": 343110 + }, + { + "epoch": 1.73, + "learning_rate": 4.033731730327781e-05, + "loss": 0.0053, + "step": 343120 + }, + { + "epoch": 1.73, + "learning_rate": 4.032974961026381e-05, + "loss": 0.0062, + "step": 343130 + }, + { + "epoch": 1.73, + "learning_rate": 4.0322181917249796e-05, + "loss": 0.0082, + "step": 343140 + }, + { + "epoch": 1.73, + "learning_rate": 4.0314614224235784e-05, + "loss": 0.0063, + "step": 343150 + }, + { + "epoch": 1.73, + "learning_rate": 4.030704653122177e-05, + "loss": 0.0066, + "step": 343160 + }, + { + "epoch": 1.73, + "learning_rate": 4.029947883820777e-05, + "loss": 0.0068, + "step": 343170 + }, + { + "epoch": 1.73, + "learning_rate": 4.0291911145193756e-05, + "loss": 0.0046, + "step": 343180 + }, + { + "epoch": 1.73, + "learning_rate": 4.0284343452179744e-05, + "loss": 0.0071, + "step": 343190 + }, + { + "epoch": 1.73, + "learning_rate": 4.027677575916574e-05, + "loss": 0.0074, + "step": 343200 + }, + { + "epoch": 1.73, + "learning_rate": 4.026920806615173e-05, + "loss": 0.0063, + "step": 343210 + }, + { + "epoch": 1.73, + "learning_rate": 4.0261640373137716e-05, + "loss": 0.0068, + "step": 343220 + }, + { + "epoch": 1.73, + "learning_rate": 4.0254072680123704e-05, + "loss": 0.0082, + "step": 343230 + }, + { + "epoch": 1.73, + "learning_rate": 4.02465049871097e-05, + "loss": 0.0053, + "step": 343240 + }, + { + "epoch": 1.73, + "learning_rate": 4.023893729409569e-05, + "loss": 0.0062, + "step": 343250 + }, + { + "epoch": 1.73, + "learning_rate": 4.0231369601081675e-05, + "loss": 0.0057, + "step": 343260 + }, + { + "epoch": 1.73, + "learning_rate": 4.0223801908067663e-05, + "loss": 0.0064, + "step": 343270 + }, + { + "epoch": 1.73, + "learning_rate": 4.021623421505366e-05, + "loss": 0.0058, + "step": 343280 + }, + { + "epoch": 1.73, + "learning_rate": 4.020866652203964e-05, + "loss": 0.0077, + "step": 343290 + }, + { + "epoch": 1.73, + "learning_rate": 4.020109882902563e-05, + "loss": 0.0051, + "step": 343300 + }, + { + "epoch": 1.73, + "learning_rate": 4.0193531136011616e-05, + "loss": 0.006, + "step": 343310 + }, + { + "epoch": 1.73, + "learning_rate": 4.0185963442997605e-05, + "loss": 0.0057, + "step": 343320 + }, + { + "epoch": 1.73, + "learning_rate": 4.01783957499836e-05, + "loss": 0.0051, + "step": 343330 + }, + { + "epoch": 1.73, + "learning_rate": 4.017082805696959e-05, + "loss": 0.0068, + "step": 343340 + }, + { + "epoch": 1.73, + "learning_rate": 4.0163260363955576e-05, + "loss": 0.0071, + "step": 343350 + }, + { + "epoch": 1.73, + "learning_rate": 4.0155692670941564e-05, + "loss": 0.0065, + "step": 343360 + }, + { + "epoch": 1.73, + "learning_rate": 4.014812497792756e-05, + "loss": 0.0055, + "step": 343370 + }, + { + "epoch": 1.73, + "learning_rate": 4.014055728491355e-05, + "loss": 0.0046, + "step": 343380 + }, + { + "epoch": 1.73, + "learning_rate": 4.0132989591899536e-05, + "loss": 0.0059, + "step": 343390 + }, + { + "epoch": 1.73, + "learning_rate": 4.0125421898885524e-05, + "loss": 0.0051, + "step": 343400 + }, + { + "epoch": 1.73, + "learning_rate": 4.011785420587152e-05, + "loss": 0.0074, + "step": 343410 + }, + { + "epoch": 1.73, + "learning_rate": 4.011028651285751e-05, + "loss": 0.0082, + "step": 343420 + }, + { + "epoch": 1.73, + "learning_rate": 4.0102718819843495e-05, + "loss": 0.0094, + "step": 343430 + }, + { + "epoch": 1.73, + "learning_rate": 4.0095151126829483e-05, + "loss": 0.0072, + "step": 343440 + }, + { + "epoch": 1.73, + "learning_rate": 4.008758343381548e-05, + "loss": 0.0063, + "step": 343450 + }, + { + "epoch": 1.73, + "learning_rate": 4.008001574080147e-05, + "loss": 0.0069, + "step": 343460 + }, + { + "epoch": 1.73, + "learning_rate": 4.0072448047787455e-05, + "loss": 0.0055, + "step": 343470 + }, + { + "epoch": 1.73, + "learning_rate": 4.006488035477344e-05, + "loss": 0.0058, + "step": 343480 + }, + { + "epoch": 1.73, + "learning_rate": 4.005731266175944e-05, + "loss": 0.0049, + "step": 343490 + }, + { + "epoch": 1.73, + "learning_rate": 4.0049744968745426e-05, + "loss": 0.0045, + "step": 343500 + }, + { + "epoch": 1.73, + "learning_rate": 4.0042177275731415e-05, + "loss": 0.0066, + "step": 343510 + }, + { + "epoch": 1.73, + "learning_rate": 4.00346095827174e-05, + "loss": 0.0058, + "step": 343520 + }, + { + "epoch": 1.73, + "learning_rate": 4.00270418897034e-05, + "loss": 0.007, + "step": 343530 + }, + { + "epoch": 1.73, + "learning_rate": 4.0019474196689386e-05, + "loss": 0.0057, + "step": 343540 + }, + { + "epoch": 1.73, + "learning_rate": 4.0011906503675374e-05, + "loss": 0.0053, + "step": 343550 + }, + { + "epoch": 1.73, + "learning_rate": 4.000433881066136e-05, + "loss": 0.0064, + "step": 343560 + }, + { + "epoch": 1.73, + "learning_rate": 3.999677111764736e-05, + "loss": 0.0071, + "step": 343570 + }, + { + "epoch": 1.73, + "learning_rate": 3.9989203424633346e-05, + "loss": 0.0059, + "step": 343580 + }, + { + "epoch": 1.73, + "learning_rate": 3.9981635731619334e-05, + "loss": 0.0073, + "step": 343590 + }, + { + "epoch": 1.73, + "learning_rate": 3.997406803860532e-05, + "loss": 0.0049, + "step": 343600 + }, + { + "epoch": 1.73, + "learning_rate": 3.9966500345591304e-05, + "loss": 0.009, + "step": 343610 + }, + { + "epoch": 1.73, + "learning_rate": 3.99589326525773e-05, + "loss": 0.0062, + "step": 343620 + }, + { + "epoch": 1.73, + "learning_rate": 3.995136495956329e-05, + "loss": 0.0051, + "step": 343630 + }, + { + "epoch": 1.73, + "learning_rate": 3.9943797266549275e-05, + "loss": 0.0065, + "step": 343640 + }, + { + "epoch": 1.73, + "learning_rate": 3.993622957353527e-05, + "loss": 0.0075, + "step": 343650 + }, + { + "epoch": 1.73, + "learning_rate": 3.992866188052126e-05, + "loss": 0.0078, + "step": 343660 + }, + { + "epoch": 1.73, + "learning_rate": 3.9921094187507246e-05, + "loss": 0.0067, + "step": 343670 + }, + { + "epoch": 1.73, + "learning_rate": 3.9913526494493235e-05, + "loss": 0.0072, + "step": 343680 + }, + { + "epoch": 1.73, + "learning_rate": 3.990595880147923e-05, + "loss": 0.0067, + "step": 343690 + }, + { + "epoch": 1.73, + "learning_rate": 3.989839110846522e-05, + "loss": 0.0054, + "step": 343700 + }, + { + "epoch": 1.73, + "learning_rate": 3.9890823415451206e-05, + "loss": 0.004, + "step": 343710 + }, + { + "epoch": 1.73, + "learning_rate": 3.9883255722437194e-05, + "loss": 0.0059, + "step": 343720 + }, + { + "epoch": 1.73, + "learning_rate": 3.987568802942319e-05, + "loss": 0.0056, + "step": 343730 + }, + { + "epoch": 1.73, + "learning_rate": 3.986812033640918e-05, + "loss": 0.009, + "step": 343740 + }, + { + "epoch": 1.73, + "learning_rate": 3.9860552643395166e-05, + "loss": 0.0057, + "step": 343750 + }, + { + "epoch": 1.73, + "learning_rate": 3.9852984950381154e-05, + "loss": 0.0057, + "step": 343760 + }, + { + "epoch": 1.73, + "learning_rate": 3.984541725736715e-05, + "loss": 0.0081, + "step": 343770 + }, + { + "epoch": 1.73, + "learning_rate": 3.983784956435314e-05, + "loss": 0.0077, + "step": 343780 + }, + { + "epoch": 1.73, + "learning_rate": 3.9830281871339125e-05, + "loss": 0.0064, + "step": 343790 + }, + { + "epoch": 1.73, + "learning_rate": 3.9822714178325114e-05, + "loss": 0.0055, + "step": 343800 + }, + { + "epoch": 1.73, + "learning_rate": 3.981514648531111e-05, + "loss": 0.0061, + "step": 343810 + }, + { + "epoch": 1.73, + "learning_rate": 3.98075787922971e-05, + "loss": 0.0097, + "step": 343820 + }, + { + "epoch": 1.73, + "learning_rate": 3.9800011099283085e-05, + "loss": 0.0053, + "step": 343830 + }, + { + "epoch": 1.73, + "learning_rate": 3.979244340626907e-05, + "loss": 0.0065, + "step": 343840 + }, + { + "epoch": 1.73, + "learning_rate": 3.978487571325507e-05, + "loss": 0.0078, + "step": 343850 + }, + { + "epoch": 1.73, + "learning_rate": 3.9777308020241056e-05, + "loss": 0.0046, + "step": 343860 + }, + { + "epoch": 1.73, + "learning_rate": 3.9769740327227045e-05, + "loss": 0.0046, + "step": 343870 + }, + { + "epoch": 1.73, + "learning_rate": 3.976217263421303e-05, + "loss": 0.0062, + "step": 343880 + }, + { + "epoch": 1.73, + "learning_rate": 3.975460494119903e-05, + "loss": 0.0072, + "step": 343890 + }, + { + "epoch": 1.74, + "learning_rate": 3.9747037248185016e-05, + "loss": 0.0063, + "step": 343900 + }, + { + "epoch": 1.74, + "learning_rate": 3.9739469555171004e-05, + "loss": 0.0057, + "step": 343910 + }, + { + "epoch": 1.74, + "learning_rate": 3.9731901862156986e-05, + "loss": 0.0048, + "step": 343920 + }, + { + "epoch": 1.74, + "learning_rate": 3.9724334169142974e-05, + "loss": 0.0049, + "step": 343930 + }, + { + "epoch": 1.74, + "learning_rate": 3.971676647612897e-05, + "loss": 0.0052, + "step": 343940 + }, + { + "epoch": 1.74, + "learning_rate": 3.970919878311496e-05, + "loss": 0.006, + "step": 343950 + }, + { + "epoch": 1.74, + "learning_rate": 3.9701631090100945e-05, + "loss": 0.0057, + "step": 343960 + }, + { + "epoch": 1.74, + "learning_rate": 3.9694063397086934e-05, + "loss": 0.0078, + "step": 343970 + }, + { + "epoch": 1.74, + "learning_rate": 3.968649570407293e-05, + "loss": 0.0077, + "step": 343980 + }, + { + "epoch": 1.74, + "learning_rate": 3.967892801105892e-05, + "loss": 0.0074, + "step": 343990 + }, + { + "epoch": 1.74, + "learning_rate": 3.9671360318044905e-05, + "loss": 0.004, + "step": 344000 + }, + { + "epoch": 1.74, + "eval_cer": 0.9144217360968921, + "eval_loss": 0.004634759854525328, + "eval_runtime": 116.8176, + "eval_samples_per_second": 17.121, + "eval_steps_per_second": 4.28, + "step": 344000 + }, + { + "epoch": 1.74, + "learning_rate": 3.966379262503089e-05, + "loss": 0.0071, + "step": 344010 + }, + { + "epoch": 1.74, + "learning_rate": 3.965622493201689e-05, + "loss": 0.0069, + "step": 344020 + }, + { + "epoch": 1.74, + "learning_rate": 3.9648657239002876e-05, + "loss": 0.0049, + "step": 344030 + }, + { + "epoch": 1.74, + "learning_rate": 3.9641089545988865e-05, + "loss": 0.0071, + "step": 344040 + }, + { + "epoch": 1.74, + "learning_rate": 3.963352185297485e-05, + "loss": 0.0043, + "step": 344050 + }, + { + "epoch": 1.74, + "learning_rate": 3.962595415996085e-05, + "loss": 0.0085, + "step": 344060 + }, + { + "epoch": 1.74, + "learning_rate": 3.9618386466946836e-05, + "loss": 0.0061, + "step": 344070 + }, + { + "epoch": 1.74, + "learning_rate": 3.9610818773932824e-05, + "loss": 0.0047, + "step": 344080 + }, + { + "epoch": 1.74, + "learning_rate": 3.960325108091881e-05, + "loss": 0.0069, + "step": 344090 + }, + { + "epoch": 1.74, + "learning_rate": 3.959568338790481e-05, + "loss": 0.006, + "step": 344100 + }, + { + "epoch": 1.74, + "learning_rate": 3.9588115694890796e-05, + "loss": 0.008, + "step": 344110 + }, + { + "epoch": 1.74, + "learning_rate": 3.9580548001876784e-05, + "loss": 0.0061, + "step": 344120 + }, + { + "epoch": 1.74, + "learning_rate": 3.957298030886277e-05, + "loss": 0.0058, + "step": 344130 + }, + { + "epoch": 1.74, + "learning_rate": 3.956541261584877e-05, + "loss": 0.0058, + "step": 344140 + }, + { + "epoch": 1.74, + "learning_rate": 3.9557844922834755e-05, + "loss": 0.0065, + "step": 344150 + }, + { + "epoch": 1.74, + "learning_rate": 3.9550277229820744e-05, + "loss": 0.0053, + "step": 344160 + }, + { + "epoch": 1.74, + "learning_rate": 3.954270953680674e-05, + "loss": 0.005, + "step": 344170 + }, + { + "epoch": 1.74, + "learning_rate": 3.953514184379273e-05, + "loss": 0.0058, + "step": 344180 + }, + { + "epoch": 1.74, + "learning_rate": 3.9527574150778715e-05, + "loss": 0.0086, + "step": 344190 + }, + { + "epoch": 1.74, + "learning_rate": 3.95200064577647e-05, + "loss": 0.0051, + "step": 344200 + }, + { + "epoch": 1.74, + "learning_rate": 3.95124387647507e-05, + "loss": 0.0068, + "step": 344210 + }, + { + "epoch": 1.74, + "learning_rate": 3.9504871071736687e-05, + "loss": 0.008, + "step": 344220 + }, + { + "epoch": 1.74, + "learning_rate": 3.949730337872267e-05, + "loss": 0.0076, + "step": 344230 + }, + { + "epoch": 1.74, + "learning_rate": 3.9489735685708656e-05, + "loss": 0.0068, + "step": 344240 + }, + { + "epoch": 1.74, + "learning_rate": 3.9482167992694644e-05, + "loss": 0.0052, + "step": 344250 + }, + { + "epoch": 1.74, + "learning_rate": 3.947460029968064e-05, + "loss": 0.0058, + "step": 344260 + }, + { + "epoch": 1.74, + "learning_rate": 3.946703260666663e-05, + "loss": 0.0042, + "step": 344270 + }, + { + "epoch": 1.74, + "learning_rate": 3.9459464913652616e-05, + "loss": 0.0044, + "step": 344280 + }, + { + "epoch": 1.74, + "learning_rate": 3.9451897220638604e-05, + "loss": 0.0074, + "step": 344290 + }, + { + "epoch": 1.74, + "learning_rate": 3.94443295276246e-05, + "loss": 0.0056, + "step": 344300 + }, + { + "epoch": 1.74, + "learning_rate": 3.943676183461059e-05, + "loss": 0.0066, + "step": 344310 + }, + { + "epoch": 1.74, + "learning_rate": 3.9429194141596575e-05, + "loss": 0.0057, + "step": 344320 + }, + { + "epoch": 1.74, + "learning_rate": 3.9421626448582564e-05, + "loss": 0.0079, + "step": 344330 + }, + { + "epoch": 1.74, + "learning_rate": 3.941405875556856e-05, + "loss": 0.0056, + "step": 344340 + }, + { + "epoch": 1.74, + "learning_rate": 3.940649106255455e-05, + "loss": 0.0071, + "step": 344350 + }, + { + "epoch": 1.74, + "learning_rate": 3.9398923369540535e-05, + "loss": 0.0073, + "step": 344360 + }, + { + "epoch": 1.74, + "learning_rate": 3.939135567652652e-05, + "loss": 0.0046, + "step": 344370 + }, + { + "epoch": 1.74, + "learning_rate": 3.938378798351252e-05, + "loss": 0.0057, + "step": 344380 + }, + { + "epoch": 1.74, + "learning_rate": 3.9376220290498507e-05, + "loss": 0.0047, + "step": 344390 + }, + { + "epoch": 1.74, + "learning_rate": 3.9368652597484495e-05, + "loss": 0.0077, + "step": 344400 + }, + { + "epoch": 1.74, + "learning_rate": 3.936108490447048e-05, + "loss": 0.0065, + "step": 344410 + }, + { + "epoch": 1.74, + "learning_rate": 3.935351721145648e-05, + "loss": 0.0087, + "step": 344420 + }, + { + "epoch": 1.74, + "learning_rate": 3.9345949518442466e-05, + "loss": 0.0074, + "step": 344430 + }, + { + "epoch": 1.74, + "learning_rate": 3.9338381825428454e-05, + "loss": 0.0076, + "step": 344440 + }, + { + "epoch": 1.74, + "learning_rate": 3.933081413241444e-05, + "loss": 0.004, + "step": 344450 + }, + { + "epoch": 1.74, + "learning_rate": 3.932324643940044e-05, + "loss": 0.007, + "step": 344460 + }, + { + "epoch": 1.74, + "learning_rate": 3.9315678746386426e-05, + "loss": 0.0054, + "step": 344470 + }, + { + "epoch": 1.74, + "learning_rate": 3.9308111053372414e-05, + "loss": 0.0067, + "step": 344480 + }, + { + "epoch": 1.74, + "learning_rate": 3.93005433603584e-05, + "loss": 0.0064, + "step": 344490 + }, + { + "epoch": 1.74, + "learning_rate": 3.92929756673444e-05, + "loss": 0.0089, + "step": 344500 + }, + { + "epoch": 1.74, + "learning_rate": 3.9285407974330386e-05, + "loss": 0.0056, + "step": 344510 + }, + { + "epoch": 1.74, + "learning_rate": 3.9277840281316374e-05, + "loss": 0.0054, + "step": 344520 + }, + { + "epoch": 1.74, + "learning_rate": 3.927027258830236e-05, + "loss": 0.0081, + "step": 344530 + }, + { + "epoch": 1.74, + "learning_rate": 3.926270489528836e-05, + "loss": 0.0077, + "step": 344540 + }, + { + "epoch": 1.74, + "learning_rate": 3.925513720227434e-05, + "loss": 0.0066, + "step": 344550 + }, + { + "epoch": 1.74, + "learning_rate": 3.924756950926033e-05, + "loss": 0.0067, + "step": 344560 + }, + { + "epoch": 1.74, + "learning_rate": 3.9240001816246315e-05, + "loss": 0.0054, + "step": 344570 + }, + { + "epoch": 1.74, + "learning_rate": 3.92324341232323e-05, + "loss": 0.0057, + "step": 344580 + }, + { + "epoch": 1.74, + "learning_rate": 3.92248664302183e-05, + "loss": 0.0048, + "step": 344590 + }, + { + "epoch": 1.74, + "learning_rate": 3.9217298737204286e-05, + "loss": 0.0055, + "step": 344600 + }, + { + "epoch": 1.74, + "learning_rate": 3.9209731044190274e-05, + "loss": 0.0067, + "step": 344610 + }, + { + "epoch": 1.74, + "learning_rate": 3.920216335117627e-05, + "loss": 0.0039, + "step": 344620 + }, + { + "epoch": 1.74, + "learning_rate": 3.919459565816226e-05, + "loss": 0.0081, + "step": 344630 + }, + { + "epoch": 1.74, + "learning_rate": 3.9187027965148246e-05, + "loss": 0.0068, + "step": 344640 + }, + { + "epoch": 1.74, + "learning_rate": 3.9179460272134234e-05, + "loss": 0.0084, + "step": 344650 + }, + { + "epoch": 1.74, + "learning_rate": 3.917189257912023e-05, + "loss": 0.0059, + "step": 344660 + }, + { + "epoch": 1.74, + "learning_rate": 3.916432488610622e-05, + "loss": 0.0053, + "step": 344670 + }, + { + "epoch": 1.74, + "learning_rate": 3.9156757193092206e-05, + "loss": 0.0054, + "step": 344680 + }, + { + "epoch": 1.74, + "learning_rate": 3.9149189500078194e-05, + "loss": 0.0067, + "step": 344690 + }, + { + "epoch": 1.74, + "learning_rate": 3.914162180706419e-05, + "loss": 0.0059, + "step": 344700 + }, + { + "epoch": 1.74, + "learning_rate": 3.913405411405018e-05, + "loss": 0.0134, + "step": 344710 + }, + { + "epoch": 1.74, + "learning_rate": 3.9126486421036165e-05, + "loss": 0.0066, + "step": 344720 + }, + { + "epoch": 1.74, + "learning_rate": 3.9118918728022153e-05, + "loss": 0.0062, + "step": 344730 + }, + { + "epoch": 1.74, + "learning_rate": 3.911135103500815e-05, + "loss": 0.0071, + "step": 344740 + }, + { + "epoch": 1.74, + "learning_rate": 3.910378334199414e-05, + "loss": 0.006, + "step": 344750 + }, + { + "epoch": 1.74, + "learning_rate": 3.9096215648980125e-05, + "loss": 0.0063, + "step": 344760 + }, + { + "epoch": 1.74, + "learning_rate": 3.908864795596611e-05, + "loss": 0.0044, + "step": 344770 + }, + { + "epoch": 1.74, + "learning_rate": 3.908108026295211e-05, + "loss": 0.0082, + "step": 344780 + }, + { + "epoch": 1.74, + "learning_rate": 3.9073512569938096e-05, + "loss": 0.0064, + "step": 344790 + }, + { + "epoch": 1.74, + "learning_rate": 3.9065944876924085e-05, + "loss": 0.0052, + "step": 344800 + }, + { + "epoch": 1.74, + "learning_rate": 3.905837718391007e-05, + "loss": 0.0063, + "step": 344810 + }, + { + "epoch": 1.74, + "learning_rate": 3.905080949089607e-05, + "loss": 0.007, + "step": 344820 + }, + { + "epoch": 1.74, + "learning_rate": 3.9043241797882056e-05, + "loss": 0.0061, + "step": 344830 + }, + { + "epoch": 1.74, + "learning_rate": 3.9035674104868044e-05, + "loss": 0.0064, + "step": 344840 + }, + { + "epoch": 1.74, + "learning_rate": 3.902810641185403e-05, + "loss": 0.0058, + "step": 344850 + }, + { + "epoch": 1.74, + "learning_rate": 3.9020538718840014e-05, + "loss": 0.0058, + "step": 344860 + }, + { + "epoch": 1.74, + "learning_rate": 3.901297102582601e-05, + "loss": 0.0072, + "step": 344870 + }, + { + "epoch": 1.74, + "learning_rate": 3.9005403332812e-05, + "loss": 0.0099, + "step": 344880 + }, + { + "epoch": 1.74, + "learning_rate": 3.8997835639797985e-05, + "loss": 0.0063, + "step": 344890 + }, + { + "epoch": 1.74, + "learning_rate": 3.8990267946783973e-05, + "loss": 0.0065, + "step": 344900 + }, + { + "epoch": 1.74, + "learning_rate": 3.898270025376997e-05, + "loss": 0.0067, + "step": 344910 + }, + { + "epoch": 1.74, + "learning_rate": 3.897513256075596e-05, + "loss": 0.0049, + "step": 344920 + }, + { + "epoch": 1.74, + "learning_rate": 3.8967564867741945e-05, + "loss": 0.0058, + "step": 344930 + }, + { + "epoch": 1.74, + "learning_rate": 3.895999717472793e-05, + "loss": 0.0062, + "step": 344940 + }, + { + "epoch": 1.74, + "learning_rate": 3.895242948171393e-05, + "loss": 0.0068, + "step": 344950 + }, + { + "epoch": 1.74, + "learning_rate": 3.8944861788699916e-05, + "loss": 0.0059, + "step": 344960 + }, + { + "epoch": 1.74, + "learning_rate": 3.8937294095685905e-05, + "loss": 0.0075, + "step": 344970 + }, + { + "epoch": 1.74, + "learning_rate": 3.892972640267189e-05, + "loss": 0.0096, + "step": 344980 + }, + { + "epoch": 1.74, + "learning_rate": 3.892215870965789e-05, + "loss": 0.0054, + "step": 344990 + }, + { + "epoch": 1.74, + "learning_rate": 3.8914591016643876e-05, + "loss": 0.0079, + "step": 345000 + }, + { + "epoch": 1.74, + "eval_cer": 0.9144159137201398, + "eval_loss": 0.004668357782065868, + "eval_runtime": 116.7577, + "eval_samples_per_second": 17.129, + "eval_steps_per_second": 4.282, + "step": 345000 + }, + { + "epoch": 1.74, + "learning_rate": 3.8907023323629864e-05, + "loss": 0.0054, + "step": 345010 + }, + { + "epoch": 1.74, + "learning_rate": 3.889945563061585e-05, + "loss": 0.0093, + "step": 345020 + }, + { + "epoch": 1.74, + "learning_rate": 3.889188793760185e-05, + "loss": 0.0057, + "step": 345030 + }, + { + "epoch": 1.74, + "learning_rate": 3.8884320244587836e-05, + "loss": 0.0052, + "step": 345040 + }, + { + "epoch": 1.74, + "learning_rate": 3.8876752551573824e-05, + "loss": 0.0057, + "step": 345050 + }, + { + "epoch": 1.74, + "learning_rate": 3.886918485855981e-05, + "loss": 0.0091, + "step": 345060 + }, + { + "epoch": 1.74, + "learning_rate": 3.886161716554581e-05, + "loss": 0.0057, + "step": 345070 + }, + { + "epoch": 1.74, + "learning_rate": 3.8854049472531795e-05, + "loss": 0.0076, + "step": 345080 + }, + { + "epoch": 1.74, + "learning_rate": 3.8846481779517784e-05, + "loss": 0.0075, + "step": 345090 + }, + { + "epoch": 1.74, + "learning_rate": 3.883891408650377e-05, + "loss": 0.005, + "step": 345100 + }, + { + "epoch": 1.74, + "learning_rate": 3.883134639348977e-05, + "loss": 0.0061, + "step": 345110 + }, + { + "epoch": 1.74, + "learning_rate": 3.8823778700475755e-05, + "loss": 0.0042, + "step": 345120 + }, + { + "epoch": 1.74, + "learning_rate": 3.881621100746174e-05, + "loss": 0.0061, + "step": 345130 + }, + { + "epoch": 1.74, + "learning_rate": 3.880864331444774e-05, + "loss": 0.0062, + "step": 345140 + }, + { + "epoch": 1.74, + "learning_rate": 3.8801075621433726e-05, + "loss": 0.0064, + "step": 345150 + }, + { + "epoch": 1.74, + "learning_rate": 3.8793507928419715e-05, + "loss": 0.0068, + "step": 345160 + }, + { + "epoch": 1.74, + "learning_rate": 3.87859402354057e-05, + "loss": 0.0053, + "step": 345170 + }, + { + "epoch": 1.74, + "learning_rate": 3.8778372542391684e-05, + "loss": 0.0078, + "step": 345180 + }, + { + "epoch": 1.74, + "learning_rate": 3.877080484937768e-05, + "loss": 0.0056, + "step": 345190 + }, + { + "epoch": 1.74, + "learning_rate": 3.876323715636367e-05, + "loss": 0.0088, + "step": 345200 + }, + { + "epoch": 1.74, + "learning_rate": 3.8755669463349656e-05, + "loss": 0.0048, + "step": 345210 + }, + { + "epoch": 1.74, + "learning_rate": 3.8748101770335644e-05, + "loss": 0.0066, + "step": 345220 + }, + { + "epoch": 1.74, + "learning_rate": 3.874053407732164e-05, + "loss": 0.0075, + "step": 345230 + }, + { + "epoch": 1.74, + "learning_rate": 3.873296638430763e-05, + "loss": 0.0082, + "step": 345240 + }, + { + "epoch": 1.74, + "learning_rate": 3.8725398691293615e-05, + "loss": 0.0077, + "step": 345250 + }, + { + "epoch": 1.74, + "learning_rate": 3.8717830998279604e-05, + "loss": 0.0069, + "step": 345260 + }, + { + "epoch": 1.74, + "learning_rate": 3.87102633052656e-05, + "loss": 0.0043, + "step": 345270 + }, + { + "epoch": 1.74, + "learning_rate": 3.870269561225159e-05, + "loss": 0.0068, + "step": 345280 + }, + { + "epoch": 1.74, + "learning_rate": 3.8695127919237575e-05, + "loss": 0.0066, + "step": 345290 + }, + { + "epoch": 1.74, + "learning_rate": 3.868756022622356e-05, + "loss": 0.0074, + "step": 345300 + }, + { + "epoch": 1.74, + "learning_rate": 3.867999253320956e-05, + "loss": 0.0054, + "step": 345310 + }, + { + "epoch": 1.74, + "learning_rate": 3.8672424840195546e-05, + "loss": 0.0057, + "step": 345320 + }, + { + "epoch": 1.74, + "learning_rate": 3.8664857147181535e-05, + "loss": 0.005, + "step": 345330 + }, + { + "epoch": 1.74, + "learning_rate": 3.865728945416752e-05, + "loss": 0.006, + "step": 345340 + }, + { + "epoch": 1.74, + "learning_rate": 3.864972176115352e-05, + "loss": 0.0061, + "step": 345350 + }, + { + "epoch": 1.74, + "learning_rate": 3.8642154068139506e-05, + "loss": 0.0063, + "step": 345360 + }, + { + "epoch": 1.74, + "learning_rate": 3.8634586375125494e-05, + "loss": 0.0065, + "step": 345370 + }, + { + "epoch": 1.74, + "learning_rate": 3.862701868211148e-05, + "loss": 0.0054, + "step": 345380 + }, + { + "epoch": 1.74, + "learning_rate": 3.861945098909748e-05, + "loss": 0.0048, + "step": 345390 + }, + { + "epoch": 1.74, + "learning_rate": 3.8611883296083466e-05, + "loss": 0.0046, + "step": 345400 + }, + { + "epoch": 1.74, + "learning_rate": 3.8604315603069454e-05, + "loss": 0.0056, + "step": 345410 + }, + { + "epoch": 1.74, + "learning_rate": 3.859674791005544e-05, + "loss": 0.0069, + "step": 345420 + }, + { + "epoch": 1.74, + "learning_rate": 3.858918021704144e-05, + "loss": 0.0073, + "step": 345430 + }, + { + "epoch": 1.74, + "learning_rate": 3.8581612524027425e-05, + "loss": 0.0071, + "step": 345440 + }, + { + "epoch": 1.74, + "learning_rate": 3.8574044831013414e-05, + "loss": 0.005, + "step": 345450 + }, + { + "epoch": 1.74, + "learning_rate": 3.85664771379994e-05, + "loss": 0.0052, + "step": 345460 + }, + { + "epoch": 1.74, + "learning_rate": 3.85589094449854e-05, + "loss": 0.0077, + "step": 345470 + }, + { + "epoch": 1.74, + "learning_rate": 3.8551341751971385e-05, + "loss": 0.0066, + "step": 345480 + }, + { + "epoch": 1.74, + "learning_rate": 3.8543774058957366e-05, + "loss": 0.0061, + "step": 345490 + }, + { + "epoch": 1.74, + "learning_rate": 3.8536206365943355e-05, + "loss": 0.0095, + "step": 345500 + }, + { + "epoch": 1.74, + "learning_rate": 3.852863867292934e-05, + "loss": 0.0059, + "step": 345510 + }, + { + "epoch": 1.74, + "learning_rate": 3.852107097991534e-05, + "loss": 0.007, + "step": 345520 + }, + { + "epoch": 1.74, + "learning_rate": 3.8513503286901326e-05, + "loss": 0.0054, + "step": 345530 + }, + { + "epoch": 1.74, + "learning_rate": 3.8505935593887314e-05, + "loss": 0.0059, + "step": 345540 + }, + { + "epoch": 1.74, + "learning_rate": 3.84983679008733e-05, + "loss": 0.006, + "step": 345550 + }, + { + "epoch": 1.74, + "learning_rate": 3.84908002078593e-05, + "loss": 0.0055, + "step": 345560 + }, + { + "epoch": 1.74, + "learning_rate": 3.8483232514845286e-05, + "loss": 0.0058, + "step": 345570 + }, + { + "epoch": 1.74, + "learning_rate": 3.8475664821831274e-05, + "loss": 0.006, + "step": 345580 + }, + { + "epoch": 1.74, + "learning_rate": 3.846809712881727e-05, + "loss": 0.0055, + "step": 345590 + }, + { + "epoch": 1.74, + "learning_rate": 3.846052943580326e-05, + "loss": 0.006, + "step": 345600 + }, + { + "epoch": 1.74, + "learning_rate": 3.8452961742789245e-05, + "loss": 0.0085, + "step": 345610 + }, + { + "epoch": 1.74, + "learning_rate": 3.8445394049775234e-05, + "loss": 0.007, + "step": 345620 + }, + { + "epoch": 1.74, + "learning_rate": 3.843782635676123e-05, + "loss": 0.0061, + "step": 345630 + }, + { + "epoch": 1.74, + "learning_rate": 3.843025866374722e-05, + "loss": 0.0053, + "step": 345640 + }, + { + "epoch": 1.74, + "learning_rate": 3.8422690970733205e-05, + "loss": 0.0087, + "step": 345650 + }, + { + "epoch": 1.74, + "learning_rate": 3.841512327771919e-05, + "loss": 0.0074, + "step": 345660 + }, + { + "epoch": 1.74, + "learning_rate": 3.840755558470519e-05, + "loss": 0.007, + "step": 345670 + }, + { + "epoch": 1.74, + "learning_rate": 3.8399987891691177e-05, + "loss": 0.0061, + "step": 345680 + }, + { + "epoch": 1.74, + "learning_rate": 3.8392420198677165e-05, + "loss": 0.0064, + "step": 345690 + }, + { + "epoch": 1.74, + "learning_rate": 3.838485250566315e-05, + "loss": 0.0063, + "step": 345700 + }, + { + "epoch": 1.74, + "learning_rate": 3.837728481264915e-05, + "loss": 0.0058, + "step": 345710 + }, + { + "epoch": 1.74, + "learning_rate": 3.8369717119635136e-05, + "loss": 0.0058, + "step": 345720 + }, + { + "epoch": 1.74, + "learning_rate": 3.8362149426621124e-05, + "loss": 0.0081, + "step": 345730 + }, + { + "epoch": 1.74, + "learning_rate": 3.835458173360711e-05, + "loss": 0.006, + "step": 345740 + }, + { + "epoch": 1.74, + "learning_rate": 3.834701404059311e-05, + "loss": 0.0068, + "step": 345750 + }, + { + "epoch": 1.74, + "learning_rate": 3.8339446347579096e-05, + "loss": 0.0095, + "step": 345760 + }, + { + "epoch": 1.74, + "learning_rate": 3.8331878654565084e-05, + "loss": 0.0067, + "step": 345770 + }, + { + "epoch": 1.74, + "learning_rate": 3.832431096155107e-05, + "loss": 0.0074, + "step": 345780 + }, + { + "epoch": 1.74, + "learning_rate": 3.831674326853707e-05, + "loss": 0.0081, + "step": 345790 + }, + { + "epoch": 1.74, + "learning_rate": 3.8309175575523055e-05, + "loss": 0.0062, + "step": 345800 + }, + { + "epoch": 1.74, + "learning_rate": 3.830160788250904e-05, + "loss": 0.0085, + "step": 345810 + }, + { + "epoch": 1.74, + "learning_rate": 3.8294040189495025e-05, + "loss": 0.008, + "step": 345820 + }, + { + "epoch": 1.74, + "learning_rate": 3.828647249648101e-05, + "loss": 0.0078, + "step": 345830 + }, + { + "epoch": 1.74, + "learning_rate": 3.827890480346701e-05, + "loss": 0.0052, + "step": 345840 + }, + { + "epoch": 1.74, + "learning_rate": 3.8271337110452997e-05, + "loss": 0.0059, + "step": 345850 + }, + { + "epoch": 1.74, + "learning_rate": 3.8263769417438985e-05, + "loss": 0.0075, + "step": 345860 + }, + { + "epoch": 1.74, + "learning_rate": 3.825620172442497e-05, + "loss": 0.0065, + "step": 345870 + }, + { + "epoch": 1.75, + "learning_rate": 3.824863403141097e-05, + "loss": 0.006, + "step": 345880 + }, + { + "epoch": 1.75, + "learning_rate": 3.8241066338396956e-05, + "loss": 0.0058, + "step": 345890 + }, + { + "epoch": 1.75, + "learning_rate": 3.8233498645382944e-05, + "loss": 0.0072, + "step": 345900 + }, + { + "epoch": 1.75, + "learning_rate": 3.822593095236893e-05, + "loss": 0.0054, + "step": 345910 + }, + { + "epoch": 1.75, + "learning_rate": 3.821836325935493e-05, + "loss": 0.0044, + "step": 345920 + }, + { + "epoch": 1.75, + "learning_rate": 3.8210795566340916e-05, + "loss": 0.0052, + "step": 345930 + }, + { + "epoch": 1.75, + "learning_rate": 3.8203227873326904e-05, + "loss": 0.0063, + "step": 345940 + }, + { + "epoch": 1.75, + "learning_rate": 3.819566018031289e-05, + "loss": 0.0081, + "step": 345950 + }, + { + "epoch": 1.75, + "learning_rate": 3.818809248729889e-05, + "loss": 0.0048, + "step": 345960 + }, + { + "epoch": 1.75, + "learning_rate": 3.8180524794284876e-05, + "loss": 0.0071, + "step": 345970 + }, + { + "epoch": 1.75, + "learning_rate": 3.8172957101270864e-05, + "loss": 0.0067, + "step": 345980 + }, + { + "epoch": 1.75, + "learning_rate": 3.816538940825685e-05, + "loss": 0.0069, + "step": 345990 + }, + { + "epoch": 1.75, + "learning_rate": 3.815782171524285e-05, + "loss": 0.0062, + "step": 346000 + }, + { + "epoch": 1.75, + "eval_cer": 0.9144227064930175, + "eval_loss": 0.004535060841590166, + "eval_runtime": 116.7184, + "eval_samples_per_second": 17.135, + "eval_steps_per_second": 4.284, + "step": 346000 + }, + { + "epoch": 1.75, + "learning_rate": 3.8150254022228835e-05, + "loss": 0.0045, + "step": 346010 + }, + { + "epoch": 1.75, + "learning_rate": 3.8142686329214823e-05, + "loss": 0.0068, + "step": 346020 + }, + { + "epoch": 1.75, + "learning_rate": 3.813511863620081e-05, + "loss": 0.0056, + "step": 346030 + }, + { + "epoch": 1.75, + "learning_rate": 3.812755094318681e-05, + "loss": 0.0063, + "step": 346040 + }, + { + "epoch": 1.75, + "learning_rate": 3.8119983250172795e-05, + "loss": 0.0082, + "step": 346050 + }, + { + "epoch": 1.75, + "learning_rate": 3.811241555715878e-05, + "loss": 0.0056, + "step": 346060 + }, + { + "epoch": 1.75, + "learning_rate": 3.810484786414477e-05, + "loss": 0.006, + "step": 346070 + }, + { + "epoch": 1.75, + "learning_rate": 3.8097280171130766e-05, + "loss": 0.0068, + "step": 346080 + }, + { + "epoch": 1.75, + "learning_rate": 3.8089712478116754e-05, + "loss": 0.0063, + "step": 346090 + }, + { + "epoch": 1.75, + "learning_rate": 3.808214478510274e-05, + "loss": 0.0052, + "step": 346100 + }, + { + "epoch": 1.75, + "learning_rate": 3.807457709208874e-05, + "loss": 0.0067, + "step": 346110 + }, + { + "epoch": 1.75, + "learning_rate": 3.806700939907472e-05, + "loss": 0.0057, + "step": 346120 + }, + { + "epoch": 1.75, + "learning_rate": 3.805944170606071e-05, + "loss": 0.006, + "step": 346130 + }, + { + "epoch": 1.75, + "learning_rate": 3.8051874013046696e-05, + "loss": 0.0069, + "step": 346140 + }, + { + "epoch": 1.75, + "learning_rate": 3.8044306320032684e-05, + "loss": 0.0065, + "step": 346150 + }, + { + "epoch": 1.75, + "learning_rate": 3.803673862701868e-05, + "loss": 0.0046, + "step": 346160 + }, + { + "epoch": 1.75, + "learning_rate": 3.802917093400467e-05, + "loss": 0.0074, + "step": 346170 + }, + { + "epoch": 1.75, + "learning_rate": 3.8021603240990655e-05, + "loss": 0.0064, + "step": 346180 + }, + { + "epoch": 1.75, + "learning_rate": 3.8014035547976643e-05, + "loss": 0.0057, + "step": 346190 + }, + { + "epoch": 1.75, + "learning_rate": 3.800646785496264e-05, + "loss": 0.0058, + "step": 346200 + }, + { + "epoch": 1.75, + "learning_rate": 3.799890016194863e-05, + "loss": 0.0045, + "step": 346210 + }, + { + "epoch": 1.75, + "learning_rate": 3.7991332468934615e-05, + "loss": 0.0068, + "step": 346220 + }, + { + "epoch": 1.75, + "learning_rate": 3.79837647759206e-05, + "loss": 0.0056, + "step": 346230 + }, + { + "epoch": 1.75, + "learning_rate": 3.79761970829066e-05, + "loss": 0.0063, + "step": 346240 + }, + { + "epoch": 1.75, + "learning_rate": 3.7968629389892586e-05, + "loss": 0.006, + "step": 346250 + }, + { + "epoch": 1.75, + "learning_rate": 3.7961061696878575e-05, + "loss": 0.0075, + "step": 346260 + }, + { + "epoch": 1.75, + "learning_rate": 3.795349400386456e-05, + "loss": 0.006, + "step": 346270 + }, + { + "epoch": 1.75, + "learning_rate": 3.794592631085056e-05, + "loss": 0.0064, + "step": 346280 + }, + { + "epoch": 1.75, + "learning_rate": 3.7938358617836546e-05, + "loss": 0.0062, + "step": 346290 + }, + { + "epoch": 1.75, + "learning_rate": 3.7930790924822534e-05, + "loss": 0.0079, + "step": 346300 + }, + { + "epoch": 1.75, + "learning_rate": 3.792322323180852e-05, + "loss": 0.0078, + "step": 346310 + }, + { + "epoch": 1.75, + "learning_rate": 3.791565553879452e-05, + "loss": 0.0055, + "step": 346320 + }, + { + "epoch": 1.75, + "learning_rate": 3.7908087845780506e-05, + "loss": 0.0073, + "step": 346330 + }, + { + "epoch": 1.75, + "learning_rate": 3.7900520152766494e-05, + "loss": 0.0086, + "step": 346340 + }, + { + "epoch": 1.75, + "learning_rate": 3.789295245975248e-05, + "loss": 0.005, + "step": 346350 + }, + { + "epoch": 1.75, + "learning_rate": 3.788538476673848e-05, + "loss": 0.0055, + "step": 346360 + }, + { + "epoch": 1.75, + "learning_rate": 3.7877817073724465e-05, + "loss": 0.0074, + "step": 346370 + }, + { + "epoch": 1.75, + "learning_rate": 3.7870249380710453e-05, + "loss": 0.005, + "step": 346380 + }, + { + "epoch": 1.75, + "learning_rate": 3.786268168769644e-05, + "loss": 0.0048, + "step": 346390 + }, + { + "epoch": 1.75, + "learning_rate": 3.785511399468244e-05, + "loss": 0.0066, + "step": 346400 + }, + { + "epoch": 1.75, + "learning_rate": 3.7847546301668425e-05, + "loss": 0.0066, + "step": 346410 + }, + { + "epoch": 1.75, + "learning_rate": 3.783997860865441e-05, + "loss": 0.0054, + "step": 346420 + }, + { + "epoch": 1.75, + "learning_rate": 3.7832410915640395e-05, + "loss": 0.0075, + "step": 346430 + }, + { + "epoch": 1.75, + "learning_rate": 3.782484322262638e-05, + "loss": 0.0052, + "step": 346440 + }, + { + "epoch": 1.75, + "learning_rate": 3.781727552961238e-05, + "loss": 0.0071, + "step": 346450 + }, + { + "epoch": 1.75, + "learning_rate": 3.7809707836598366e-05, + "loss": 0.0061, + "step": 346460 + }, + { + "epoch": 1.75, + "learning_rate": 3.7802140143584354e-05, + "loss": 0.0063, + "step": 346470 + }, + { + "epoch": 1.75, + "learning_rate": 3.779457245057034e-05, + "loss": 0.0049, + "step": 346480 + }, + { + "epoch": 1.75, + "learning_rate": 3.778700475755634e-05, + "loss": 0.0053, + "step": 346490 + }, + { + "epoch": 1.75, + "learning_rate": 3.7779437064542326e-05, + "loss": 0.0065, + "step": 346500 + }, + { + "epoch": 1.75, + "learning_rate": 3.7771869371528314e-05, + "loss": 0.006, + "step": 346510 + }, + { + "epoch": 1.75, + "learning_rate": 3.77643016785143e-05, + "loss": 0.0049, + "step": 346520 + }, + { + "epoch": 1.75, + "learning_rate": 3.77567339855003e-05, + "loss": 0.0072, + "step": 346530 + }, + { + "epoch": 1.75, + "learning_rate": 3.7749166292486285e-05, + "loss": 0.0076, + "step": 346540 + }, + { + "epoch": 1.75, + "learning_rate": 3.7741598599472274e-05, + "loss": 0.0044, + "step": 346550 + }, + { + "epoch": 1.75, + "learning_rate": 3.773403090645827e-05, + "loss": 0.0061, + "step": 346560 + }, + { + "epoch": 1.75, + "learning_rate": 3.772646321344426e-05, + "loss": 0.0045, + "step": 346570 + }, + { + "epoch": 1.75, + "learning_rate": 3.7718895520430245e-05, + "loss": 0.0057, + "step": 346580 + }, + { + "epoch": 1.75, + "learning_rate": 3.771132782741623e-05, + "loss": 0.0055, + "step": 346590 + }, + { + "epoch": 1.75, + "learning_rate": 3.770376013440223e-05, + "loss": 0.0078, + "step": 346600 + }, + { + "epoch": 1.75, + "learning_rate": 3.7696192441388216e-05, + "loss": 0.0065, + "step": 346610 + }, + { + "epoch": 1.75, + "learning_rate": 3.7688624748374205e-05, + "loss": 0.0057, + "step": 346620 + }, + { + "epoch": 1.75, + "learning_rate": 3.768105705536019e-05, + "loss": 0.0061, + "step": 346630 + }, + { + "epoch": 1.75, + "learning_rate": 3.767348936234619e-05, + "loss": 0.0075, + "step": 346640 + }, + { + "epoch": 1.75, + "learning_rate": 3.7665921669332176e-05, + "loss": 0.0052, + "step": 346650 + }, + { + "epoch": 1.75, + "learning_rate": 3.7658353976318164e-05, + "loss": 0.006, + "step": 346660 + }, + { + "epoch": 1.75, + "learning_rate": 3.765078628330415e-05, + "loss": 0.0056, + "step": 346670 + }, + { + "epoch": 1.75, + "learning_rate": 3.764321859029015e-05, + "loss": 0.007, + "step": 346680 + }, + { + "epoch": 1.75, + "learning_rate": 3.7635650897276136e-05, + "loss": 0.0046, + "step": 346690 + }, + { + "epoch": 1.75, + "learning_rate": 3.7628083204262124e-05, + "loss": 0.0056, + "step": 346700 + }, + { + "epoch": 1.75, + "learning_rate": 3.762051551124811e-05, + "loss": 0.0077, + "step": 346710 + }, + { + "epoch": 1.75, + "learning_rate": 3.761294781823411e-05, + "loss": 0.0058, + "step": 346720 + }, + { + "epoch": 1.75, + "learning_rate": 3.7605380125220095e-05, + "loss": 0.0078, + "step": 346730 + }, + { + "epoch": 1.75, + "learning_rate": 3.7597812432206084e-05, + "loss": 0.009, + "step": 346740 + }, + { + "epoch": 1.75, + "learning_rate": 3.7590244739192065e-05, + "loss": 0.009, + "step": 346750 + }, + { + "epoch": 1.75, + "learning_rate": 3.758267704617805e-05, + "loss": 0.0087, + "step": 346760 + }, + { + "epoch": 1.75, + "learning_rate": 3.757510935316405e-05, + "loss": 0.0054, + "step": 346770 + }, + { + "epoch": 1.75, + "learning_rate": 3.7567541660150036e-05, + "loss": 0.0058, + "step": 346780 + }, + { + "epoch": 1.75, + "learning_rate": 3.7559973967136025e-05, + "loss": 0.0065, + "step": 346790 + }, + { + "epoch": 1.75, + "learning_rate": 3.755240627412201e-05, + "loss": 0.007, + "step": 346800 + }, + { + "epoch": 1.75, + "learning_rate": 3.754483858110801e-05, + "loss": 0.0063, + "step": 346810 + }, + { + "epoch": 1.75, + "learning_rate": 3.7537270888093996e-05, + "loss": 0.0052, + "step": 346820 + }, + { + "epoch": 1.75, + "learning_rate": 3.7529703195079984e-05, + "loss": 0.0088, + "step": 346830 + }, + { + "epoch": 1.75, + "learning_rate": 3.752213550206597e-05, + "loss": 0.0053, + "step": 346840 + }, + { + "epoch": 1.75, + "learning_rate": 3.751456780905197e-05, + "loss": 0.0047, + "step": 346850 + }, + { + "epoch": 1.75, + "learning_rate": 3.7507000116037956e-05, + "loss": 0.0074, + "step": 346860 + }, + { + "epoch": 1.75, + "learning_rate": 3.7499432423023944e-05, + "loss": 0.0058, + "step": 346870 + }, + { + "epoch": 1.75, + "learning_rate": 3.749186473000993e-05, + "loss": 0.0057, + "step": 346880 + }, + { + "epoch": 1.75, + "learning_rate": 3.748429703699593e-05, + "loss": 0.0068, + "step": 346890 + }, + { + "epoch": 1.75, + "learning_rate": 3.7476729343981915e-05, + "loss": 0.0081, + "step": 346900 + }, + { + "epoch": 1.75, + "learning_rate": 3.7469161650967904e-05, + "loss": 0.006, + "step": 346910 + }, + { + "epoch": 1.75, + "learning_rate": 3.746159395795389e-05, + "loss": 0.0073, + "step": 346920 + }, + { + "epoch": 1.75, + "learning_rate": 3.745402626493989e-05, + "loss": 0.0053, + "step": 346930 + }, + { + "epoch": 1.75, + "learning_rate": 3.7446458571925875e-05, + "loss": 0.0062, + "step": 346940 + }, + { + "epoch": 1.75, + "learning_rate": 3.743889087891186e-05, + "loss": 0.0063, + "step": 346950 + }, + { + "epoch": 1.75, + "learning_rate": 3.743132318589785e-05, + "loss": 0.0113, + "step": 346960 + }, + { + "epoch": 1.75, + "learning_rate": 3.7423755492883846e-05, + "loss": 0.0055, + "step": 346970 + }, + { + "epoch": 1.75, + "learning_rate": 3.741618779986983e-05, + "loss": 0.0074, + "step": 346980 + }, + { + "epoch": 1.75, + "learning_rate": 3.740862010685582e-05, + "loss": 0.0075, + "step": 346990 + }, + { + "epoch": 1.75, + "learning_rate": 3.740105241384181e-05, + "loss": 0.0079, + "step": 347000 + }, + { + "epoch": 1.75, + "eval_cer": 0.9144304696620207, + "eval_loss": 0.004600143525749445, + "eval_runtime": 116.8017, + "eval_samples_per_second": 17.123, + "eval_steps_per_second": 4.281, + "step": 347000 + }, + { + "epoch": 1.75, + "learning_rate": 3.73934847208278e-05, + "loss": 0.0062, + "step": 347010 + }, + { + "epoch": 1.75, + "learning_rate": 3.738591702781379e-05, + "loss": 0.0065, + "step": 347020 + }, + { + "epoch": 1.75, + "learning_rate": 3.737834933479978e-05, + "loss": 0.0069, + "step": 347030 + }, + { + "epoch": 1.75, + "learning_rate": 3.737078164178577e-05, + "loss": 0.0059, + "step": 347040 + }, + { + "epoch": 1.75, + "learning_rate": 3.736321394877176e-05, + "loss": 0.0075, + "step": 347050 + }, + { + "epoch": 1.75, + "learning_rate": 3.735564625575775e-05, + "loss": 0.0058, + "step": 347060 + }, + { + "epoch": 1.75, + "learning_rate": 3.734807856274374e-05, + "loss": 0.005, + "step": 347070 + }, + { + "epoch": 1.75, + "learning_rate": 3.734051086972973e-05, + "loss": 0.0054, + "step": 347080 + }, + { + "epoch": 1.75, + "learning_rate": 3.733294317671572e-05, + "loss": 0.0065, + "step": 347090 + }, + { + "epoch": 1.75, + "learning_rate": 3.732537548370171e-05, + "loss": 0.006, + "step": 347100 + }, + { + "epoch": 1.75, + "learning_rate": 3.73178077906877e-05, + "loss": 0.0053, + "step": 347110 + }, + { + "epoch": 1.75, + "learning_rate": 3.731024009767369e-05, + "loss": 0.0061, + "step": 347120 + }, + { + "epoch": 1.75, + "learning_rate": 3.730267240465968e-05, + "loss": 0.0052, + "step": 347130 + }, + { + "epoch": 1.75, + "learning_rate": 3.7295104711645667e-05, + "loss": 0.0065, + "step": 347140 + }, + { + "epoch": 1.75, + "learning_rate": 3.7287537018631655e-05, + "loss": 0.0074, + "step": 347150 + }, + { + "epoch": 1.75, + "learning_rate": 3.727996932561764e-05, + "loss": 0.0094, + "step": 347160 + }, + { + "epoch": 1.75, + "learning_rate": 3.727240163260364e-05, + "loss": 0.0055, + "step": 347170 + }, + { + "epoch": 1.75, + "learning_rate": 3.7264833939589626e-05, + "loss": 0.0071, + "step": 347180 + }, + { + "epoch": 1.75, + "learning_rate": 3.7257266246575614e-05, + "loss": 0.0047, + "step": 347190 + }, + { + "epoch": 1.75, + "learning_rate": 3.72496985535616e-05, + "loss": 0.0053, + "step": 347200 + }, + { + "epoch": 1.75, + "learning_rate": 3.72421308605476e-05, + "loss": 0.0105, + "step": 347210 + }, + { + "epoch": 1.75, + "learning_rate": 3.7234563167533586e-05, + "loss": 0.0057, + "step": 347220 + }, + { + "epoch": 1.75, + "learning_rate": 3.7226995474519574e-05, + "loss": 0.0101, + "step": 347230 + }, + { + "epoch": 1.75, + "learning_rate": 3.721942778150556e-05, + "loss": 0.0075, + "step": 347240 + }, + { + "epoch": 1.75, + "learning_rate": 3.721186008849156e-05, + "loss": 0.0086, + "step": 347250 + }, + { + "epoch": 1.75, + "learning_rate": 3.7204292395477545e-05, + "loss": 0.0041, + "step": 347260 + }, + { + "epoch": 1.75, + "learning_rate": 3.7196724702463534e-05, + "loss": 0.0052, + "step": 347270 + }, + { + "epoch": 1.75, + "learning_rate": 3.718915700944952e-05, + "loss": 0.0081, + "step": 347280 + }, + { + "epoch": 1.75, + "learning_rate": 3.718158931643552e-05, + "loss": 0.0068, + "step": 347290 + }, + { + "epoch": 1.75, + "learning_rate": 3.71740216234215e-05, + "loss": 0.0076, + "step": 347300 + }, + { + "epoch": 1.75, + "learning_rate": 3.716645393040749e-05, + "loss": 0.007, + "step": 347310 + }, + { + "epoch": 1.75, + "learning_rate": 3.715888623739348e-05, + "loss": 0.0053, + "step": 347320 + }, + { + "epoch": 1.75, + "learning_rate": 3.715131854437947e-05, + "loss": 0.0055, + "step": 347330 + }, + { + "epoch": 1.75, + "learning_rate": 3.714375085136546e-05, + "loss": 0.0054, + "step": 347340 + }, + { + "epoch": 1.75, + "learning_rate": 3.713618315835145e-05, + "loss": 0.0044, + "step": 347350 + }, + { + "epoch": 1.75, + "learning_rate": 3.712861546533744e-05, + "loss": 0.0051, + "step": 347360 + }, + { + "epoch": 1.75, + "learning_rate": 3.712104777232343e-05, + "loss": 0.0054, + "step": 347370 + }, + { + "epoch": 1.75, + "learning_rate": 3.711348007930942e-05, + "loss": 0.012, + "step": 347380 + }, + { + "epoch": 1.75, + "learning_rate": 3.710591238629541e-05, + "loss": 0.0051, + "step": 347390 + }, + { + "epoch": 1.75, + "learning_rate": 3.70983446932814e-05, + "loss": 0.0054, + "step": 347400 + }, + { + "epoch": 1.75, + "learning_rate": 3.709077700026739e-05, + "loss": 0.005, + "step": 347410 + }, + { + "epoch": 1.75, + "learning_rate": 3.708320930725338e-05, + "loss": 0.0052, + "step": 347420 + }, + { + "epoch": 1.75, + "learning_rate": 3.707564161423937e-05, + "loss": 0.0039, + "step": 347430 + }, + { + "epoch": 1.75, + "learning_rate": 3.706807392122536e-05, + "loss": 0.0063, + "step": 347440 + }, + { + "epoch": 1.75, + "learning_rate": 3.706050622821135e-05, + "loss": 0.0048, + "step": 347450 + }, + { + "epoch": 1.75, + "learning_rate": 3.705293853519734e-05, + "loss": 0.0059, + "step": 347460 + }, + { + "epoch": 1.75, + "learning_rate": 3.7045370842183325e-05, + "loss": 0.0068, + "step": 347470 + }, + { + "epoch": 1.75, + "learning_rate": 3.7037803149169313e-05, + "loss": 0.0062, + "step": 347480 + }, + { + "epoch": 1.75, + "learning_rate": 3.70302354561553e-05, + "loss": 0.0056, + "step": 347490 + }, + { + "epoch": 1.75, + "learning_rate": 3.70226677631413e-05, + "loss": 0.0055, + "step": 347500 + }, + { + "epoch": 1.75, + "learning_rate": 3.7015100070127285e-05, + "loss": 0.0087, + "step": 347510 + }, + { + "epoch": 1.75, + "learning_rate": 3.700753237711327e-05, + "loss": 0.0067, + "step": 347520 + }, + { + "epoch": 1.75, + "learning_rate": 3.699996468409927e-05, + "loss": 0.0058, + "step": 347530 + }, + { + "epoch": 1.75, + "learning_rate": 3.6992396991085256e-05, + "loss": 0.0068, + "step": 347540 + }, + { + "epoch": 1.75, + "learning_rate": 3.6984829298071244e-05, + "loss": 0.0073, + "step": 347550 + }, + { + "epoch": 1.75, + "learning_rate": 3.697726160505723e-05, + "loss": 0.0046, + "step": 347560 + }, + { + "epoch": 1.75, + "learning_rate": 3.696969391204323e-05, + "loss": 0.0054, + "step": 347570 + }, + { + "epoch": 1.75, + "learning_rate": 3.6962126219029216e-05, + "loss": 0.0063, + "step": 347580 + }, + { + "epoch": 1.75, + "learning_rate": 3.6954558526015204e-05, + "loss": 0.0057, + "step": 347590 + }, + { + "epoch": 1.75, + "learning_rate": 3.694699083300119e-05, + "loss": 0.0049, + "step": 347600 + }, + { + "epoch": 1.75, + "learning_rate": 3.693942313998718e-05, + "loss": 0.0051, + "step": 347610 + }, + { + "epoch": 1.75, + "learning_rate": 3.693185544697317e-05, + "loss": 0.0057, + "step": 347620 + }, + { + "epoch": 1.75, + "learning_rate": 3.692428775395916e-05, + "loss": 0.0054, + "step": 347630 + }, + { + "epoch": 1.75, + "learning_rate": 3.691672006094515e-05, + "loss": 0.0059, + "step": 347640 + }, + { + "epoch": 1.75, + "learning_rate": 3.690915236793114e-05, + "loss": 0.0066, + "step": 347650 + }, + { + "epoch": 1.75, + "learning_rate": 3.690158467491713e-05, + "loss": 0.0049, + "step": 347660 + }, + { + "epoch": 1.75, + "learning_rate": 3.689401698190312e-05, + "loss": 0.0087, + "step": 347670 + }, + { + "epoch": 1.75, + "learning_rate": 3.688644928888911e-05, + "loss": 0.0101, + "step": 347680 + }, + { + "epoch": 1.75, + "learning_rate": 3.68788815958751e-05, + "loss": 0.0065, + "step": 347690 + }, + { + "epoch": 1.75, + "learning_rate": 3.687131390286109e-05, + "loss": 0.0083, + "step": 347700 + }, + { + "epoch": 1.75, + "learning_rate": 3.6863746209847076e-05, + "loss": 0.0049, + "step": 347710 + }, + { + "epoch": 1.75, + "learning_rate": 3.685617851683307e-05, + "loss": 0.0056, + "step": 347720 + }, + { + "epoch": 1.75, + "learning_rate": 3.684861082381906e-05, + "loss": 0.0087, + "step": 347730 + }, + { + "epoch": 1.75, + "learning_rate": 3.684104313080505e-05, + "loss": 0.0044, + "step": 347740 + }, + { + "epoch": 1.75, + "learning_rate": 3.6833475437791036e-05, + "loss": 0.006, + "step": 347750 + }, + { + "epoch": 1.75, + "learning_rate": 3.682590774477703e-05, + "loss": 0.0091, + "step": 347760 + }, + { + "epoch": 1.75, + "learning_rate": 3.681834005176301e-05, + "loss": 0.0048, + "step": 347770 + }, + { + "epoch": 1.75, + "learning_rate": 3.681077235874901e-05, + "loss": 0.0067, + "step": 347780 + }, + { + "epoch": 1.75, + "learning_rate": 3.6803204665734996e-05, + "loss": 0.0066, + "step": 347790 + }, + { + "epoch": 1.75, + "learning_rate": 3.6795636972720984e-05, + "loss": 0.0047, + "step": 347800 + }, + { + "epoch": 1.75, + "learning_rate": 3.678806927970697e-05, + "loss": 0.0043, + "step": 347810 + }, + { + "epoch": 1.75, + "learning_rate": 3.678050158669297e-05, + "loss": 0.006, + "step": 347820 + }, + { + "epoch": 1.75, + "learning_rate": 3.6772933893678955e-05, + "loss": 0.0074, + "step": 347830 + }, + { + "epoch": 1.75, + "learning_rate": 3.6765366200664943e-05, + "loss": 0.0063, + "step": 347840 + }, + { + "epoch": 1.75, + "learning_rate": 3.675779850765093e-05, + "loss": 0.0069, + "step": 347850 + }, + { + "epoch": 1.75, + "learning_rate": 3.675023081463693e-05, + "loss": 0.0062, + "step": 347860 + }, + { + "epoch": 1.76, + "learning_rate": 3.6742663121622915e-05, + "loss": 0.0044, + "step": 347870 + }, + { + "epoch": 1.76, + "learning_rate": 3.67350954286089e-05, + "loss": 0.0063, + "step": 347880 + }, + { + "epoch": 1.76, + "learning_rate": 3.672752773559489e-05, + "loss": 0.0053, + "step": 347890 + }, + { + "epoch": 1.76, + "learning_rate": 3.6719960042580886e-05, + "loss": 0.0053, + "step": 347900 + }, + { + "epoch": 1.76, + "learning_rate": 3.6712392349566875e-05, + "loss": 0.007, + "step": 347910 + }, + { + "epoch": 1.76, + "learning_rate": 3.670482465655286e-05, + "loss": 0.0066, + "step": 347920 + }, + { + "epoch": 1.76, + "learning_rate": 3.669725696353885e-05, + "loss": 0.0059, + "step": 347930 + }, + { + "epoch": 1.76, + "learning_rate": 3.668968927052484e-05, + "loss": 0.0073, + "step": 347940 + }, + { + "epoch": 1.76, + "learning_rate": 3.668212157751083e-05, + "loss": 0.0048, + "step": 347950 + }, + { + "epoch": 1.76, + "learning_rate": 3.667455388449682e-05, + "loss": 0.0055, + "step": 347960 + }, + { + "epoch": 1.76, + "learning_rate": 3.666698619148281e-05, + "loss": 0.0062, + "step": 347970 + }, + { + "epoch": 1.76, + "learning_rate": 3.66594184984688e-05, + "loss": 0.0037, + "step": 347980 + }, + { + "epoch": 1.76, + "learning_rate": 3.665185080545479e-05, + "loss": 0.0064, + "step": 347990 + }, + { + "epoch": 1.76, + "learning_rate": 3.664428311244078e-05, + "loss": 0.0056, + "step": 348000 + }, + { + "epoch": 1.76, + "eval_cer": 0.9144324104542716, + "eval_loss": 0.004651382099837065, + "eval_runtime": 116.6456, + "eval_samples_per_second": 17.146, + "eval_steps_per_second": 4.286, + "step": 348000 + }, + { + "epoch": 1.76, + "learning_rate": 3.663671541942677e-05, + "loss": 0.0051, + "step": 348010 + }, + { + "epoch": 1.76, + "learning_rate": 3.662914772641276e-05, + "loss": 0.0062, + "step": 348020 + }, + { + "epoch": 1.76, + "learning_rate": 3.662158003339875e-05, + "loss": 0.0045, + "step": 348030 + }, + { + "epoch": 1.76, + "learning_rate": 3.661401234038474e-05, + "loss": 0.0053, + "step": 348040 + }, + { + "epoch": 1.76, + "learning_rate": 3.660644464737073e-05, + "loss": 0.0071, + "step": 348050 + }, + { + "epoch": 1.76, + "learning_rate": 3.659887695435672e-05, + "loss": 0.0084, + "step": 348060 + }, + { + "epoch": 1.76, + "learning_rate": 3.6591309261342706e-05, + "loss": 0.0073, + "step": 348070 + }, + { + "epoch": 1.76, + "learning_rate": 3.6583741568328695e-05, + "loss": 0.0064, + "step": 348080 + }, + { + "epoch": 1.76, + "learning_rate": 3.657617387531468e-05, + "loss": 0.0076, + "step": 348090 + }, + { + "epoch": 1.76, + "learning_rate": 3.656860618230068e-05, + "loss": 0.006, + "step": 348100 + }, + { + "epoch": 1.76, + "learning_rate": 3.6561038489286666e-05, + "loss": 0.0061, + "step": 348110 + }, + { + "epoch": 1.76, + "learning_rate": 3.6553470796272654e-05, + "loss": 0.0059, + "step": 348120 + }, + { + "epoch": 1.76, + "learning_rate": 3.654590310325864e-05, + "loss": 0.0067, + "step": 348130 + }, + { + "epoch": 1.76, + "learning_rate": 3.653833541024464e-05, + "loss": 0.0065, + "step": 348140 + }, + { + "epoch": 1.76, + "learning_rate": 3.6530767717230626e-05, + "loss": 0.0071, + "step": 348150 + }, + { + "epoch": 1.76, + "learning_rate": 3.6523200024216614e-05, + "loss": 0.0065, + "step": 348160 + }, + { + "epoch": 1.76, + "learning_rate": 3.65156323312026e-05, + "loss": 0.0049, + "step": 348170 + }, + { + "epoch": 1.76, + "learning_rate": 3.65080646381886e-05, + "loss": 0.0052, + "step": 348180 + }, + { + "epoch": 1.76, + "learning_rate": 3.6500496945174585e-05, + "loss": 0.005, + "step": 348190 + }, + { + "epoch": 1.76, + "learning_rate": 3.6492929252160574e-05, + "loss": 0.0067, + "step": 348200 + }, + { + "epoch": 1.76, + "learning_rate": 3.648536155914656e-05, + "loss": 0.0047, + "step": 348210 + }, + { + "epoch": 1.76, + "learning_rate": 3.647779386613256e-05, + "loss": 0.0057, + "step": 348220 + }, + { + "epoch": 1.76, + "learning_rate": 3.6470226173118545e-05, + "loss": 0.0072, + "step": 348230 + }, + { + "epoch": 1.76, + "learning_rate": 3.646265848010453e-05, + "loss": 0.0074, + "step": 348240 + }, + { + "epoch": 1.76, + "learning_rate": 3.645509078709052e-05, + "loss": 0.0062, + "step": 348250 + }, + { + "epoch": 1.76, + "learning_rate": 3.644752309407651e-05, + "loss": 0.0088, + "step": 348260 + }, + { + "epoch": 1.76, + "learning_rate": 3.64399554010625e-05, + "loss": 0.005, + "step": 348270 + }, + { + "epoch": 1.76, + "learning_rate": 3.643238770804849e-05, + "loss": 0.0068, + "step": 348280 + }, + { + "epoch": 1.76, + "learning_rate": 3.642482001503448e-05, + "loss": 0.008, + "step": 348290 + }, + { + "epoch": 1.76, + "learning_rate": 3.641725232202047e-05, + "loss": 0.0054, + "step": 348300 + }, + { + "epoch": 1.76, + "learning_rate": 3.640968462900646e-05, + "loss": 0.0052, + "step": 348310 + }, + { + "epoch": 1.76, + "learning_rate": 3.640211693599245e-05, + "loss": 0.0045, + "step": 348320 + }, + { + "epoch": 1.76, + "learning_rate": 3.639454924297844e-05, + "loss": 0.0062, + "step": 348330 + }, + { + "epoch": 1.76, + "learning_rate": 3.638698154996443e-05, + "loss": 0.0066, + "step": 348340 + }, + { + "epoch": 1.76, + "learning_rate": 3.637941385695042e-05, + "loss": 0.0072, + "step": 348350 + }, + { + "epoch": 1.76, + "learning_rate": 3.637184616393641e-05, + "loss": 0.0066, + "step": 348360 + }, + { + "epoch": 1.76, + "learning_rate": 3.63642784709224e-05, + "loss": 0.0064, + "step": 348370 + }, + { + "epoch": 1.76, + "learning_rate": 3.635671077790839e-05, + "loss": 0.0044, + "step": 348380 + }, + { + "epoch": 1.76, + "learning_rate": 3.634914308489438e-05, + "loss": 0.0041, + "step": 348390 + }, + { + "epoch": 1.76, + "learning_rate": 3.6341575391880365e-05, + "loss": 0.0069, + "step": 348400 + }, + { + "epoch": 1.76, + "learning_rate": 3.633400769886635e-05, + "loss": 0.0063, + "step": 348410 + }, + { + "epoch": 1.76, + "learning_rate": 3.632644000585234e-05, + "loss": 0.0091, + "step": 348420 + }, + { + "epoch": 1.76, + "learning_rate": 3.6318872312838336e-05, + "loss": 0.0045, + "step": 348430 + }, + { + "epoch": 1.76, + "learning_rate": 3.6311304619824325e-05, + "loss": 0.0057, + "step": 348440 + }, + { + "epoch": 1.76, + "learning_rate": 3.630373692681031e-05, + "loss": 0.0059, + "step": 348450 + }, + { + "epoch": 1.76, + "learning_rate": 3.62961692337963e-05, + "loss": 0.0113, + "step": 348460 + }, + { + "epoch": 1.76, + "learning_rate": 3.6288601540782296e-05, + "loss": 0.008, + "step": 348470 + }, + { + "epoch": 1.76, + "learning_rate": 3.6281033847768284e-05, + "loss": 0.0051, + "step": 348480 + }, + { + "epoch": 1.76, + "learning_rate": 3.627346615475427e-05, + "loss": 0.0062, + "step": 348490 + }, + { + "epoch": 1.76, + "learning_rate": 3.626589846174027e-05, + "loss": 0.0041, + "step": 348500 + }, + { + "epoch": 1.76, + "learning_rate": 3.6258330768726256e-05, + "loss": 0.0054, + "step": 348510 + }, + { + "epoch": 1.76, + "learning_rate": 3.6250763075712244e-05, + "loss": 0.0074, + "step": 348520 + }, + { + "epoch": 1.76, + "learning_rate": 3.624319538269823e-05, + "loss": 0.0054, + "step": 348530 + }, + { + "epoch": 1.76, + "learning_rate": 3.623562768968423e-05, + "loss": 0.0067, + "step": 348540 + }, + { + "epoch": 1.76, + "learning_rate": 3.6228059996670215e-05, + "loss": 0.0054, + "step": 348550 + }, + { + "epoch": 1.76, + "learning_rate": 3.62204923036562e-05, + "loss": 0.006, + "step": 348560 + }, + { + "epoch": 1.76, + "learning_rate": 3.621292461064219e-05, + "loss": 0.0057, + "step": 348570 + }, + { + "epoch": 1.76, + "learning_rate": 3.620535691762818e-05, + "loss": 0.0062, + "step": 348580 + }, + { + "epoch": 1.76, + "learning_rate": 3.619778922461417e-05, + "loss": 0.0042, + "step": 348590 + }, + { + "epoch": 1.76, + "learning_rate": 3.6190221531600157e-05, + "loss": 0.0101, + "step": 348600 + }, + { + "epoch": 1.76, + "learning_rate": 3.618265383858615e-05, + "loss": 0.0049, + "step": 348610 + }, + { + "epoch": 1.76, + "learning_rate": 3.617508614557214e-05, + "loss": 0.0036, + "step": 348620 + }, + { + "epoch": 1.76, + "learning_rate": 3.616751845255813e-05, + "loss": 0.0084, + "step": 348630 + }, + { + "epoch": 1.76, + "learning_rate": 3.6159950759544116e-05, + "loss": 0.0058, + "step": 348640 + }, + { + "epoch": 1.76, + "learning_rate": 3.615238306653011e-05, + "loss": 0.0055, + "step": 348650 + }, + { + "epoch": 1.76, + "learning_rate": 3.61448153735161e-05, + "loss": 0.0067, + "step": 348660 + }, + { + "epoch": 1.76, + "learning_rate": 3.613724768050209e-05, + "loss": 0.0059, + "step": 348670 + }, + { + "epoch": 1.76, + "learning_rate": 3.6129679987488076e-05, + "loss": 0.0082, + "step": 348680 + }, + { + "epoch": 1.76, + "learning_rate": 3.612211229447407e-05, + "loss": 0.0046, + "step": 348690 + }, + { + "epoch": 1.76, + "learning_rate": 3.611454460146006e-05, + "loss": 0.0054, + "step": 348700 + }, + { + "epoch": 1.76, + "learning_rate": 3.610697690844605e-05, + "loss": 0.0062, + "step": 348710 + }, + { + "epoch": 1.76, + "learning_rate": 3.6099409215432035e-05, + "loss": 0.0056, + "step": 348720 + }, + { + "epoch": 1.76, + "learning_rate": 3.6091841522418024e-05, + "loss": 0.0083, + "step": 348730 + }, + { + "epoch": 1.76, + "learning_rate": 3.608427382940401e-05, + "loss": 0.0051, + "step": 348740 + }, + { + "epoch": 1.76, + "learning_rate": 3.607670613639001e-05, + "loss": 0.0064, + "step": 348750 + }, + { + "epoch": 1.76, + "learning_rate": 3.6069138443375995e-05, + "loss": 0.0074, + "step": 348760 + }, + { + "epoch": 1.76, + "learning_rate": 3.606157075036198e-05, + "loss": 0.0064, + "step": 348770 + }, + { + "epoch": 1.76, + "learning_rate": 3.605400305734797e-05, + "loss": 0.0091, + "step": 348780 + }, + { + "epoch": 1.76, + "learning_rate": 3.6046435364333967e-05, + "loss": 0.0059, + "step": 348790 + }, + { + "epoch": 1.76, + "learning_rate": 3.6038867671319955e-05, + "loss": 0.0053, + "step": 348800 + }, + { + "epoch": 1.76, + "learning_rate": 3.603129997830594e-05, + "loss": 0.0054, + "step": 348810 + }, + { + "epoch": 1.76, + "learning_rate": 3.602373228529193e-05, + "loss": 0.005, + "step": 348820 + }, + { + "epoch": 1.76, + "learning_rate": 3.6016164592277926e-05, + "loss": 0.0072, + "step": 348830 + }, + { + "epoch": 1.76, + "learning_rate": 3.6008596899263914e-05, + "loss": 0.005, + "step": 348840 + }, + { + "epoch": 1.76, + "learning_rate": 3.60010292062499e-05, + "loss": 0.0062, + "step": 348850 + }, + { + "epoch": 1.76, + "learning_rate": 3.599346151323589e-05, + "loss": 0.0082, + "step": 348860 + }, + { + "epoch": 1.76, + "learning_rate": 3.598589382022188e-05, + "loss": 0.0085, + "step": 348870 + }, + { + "epoch": 1.76, + "learning_rate": 3.597832612720787e-05, + "loss": 0.0054, + "step": 348880 + }, + { + "epoch": 1.76, + "learning_rate": 3.597075843419386e-05, + "loss": 0.0048, + "step": 348890 + }, + { + "epoch": 1.76, + "learning_rate": 3.596319074117985e-05, + "loss": 0.0046, + "step": 348900 + }, + { + "epoch": 1.76, + "learning_rate": 3.595562304816584e-05, + "loss": 0.0062, + "step": 348910 + }, + { + "epoch": 1.76, + "learning_rate": 3.594805535515183e-05, + "loss": 0.0054, + "step": 348920 + }, + { + "epoch": 1.76, + "learning_rate": 3.594048766213782e-05, + "loss": 0.0078, + "step": 348930 + }, + { + "epoch": 1.76, + "learning_rate": 3.593291996912381e-05, + "loss": 0.0057, + "step": 348940 + }, + { + "epoch": 1.76, + "learning_rate": 3.59253522761098e-05, + "loss": 0.0057, + "step": 348950 + }, + { + "epoch": 1.76, + "learning_rate": 3.591778458309579e-05, + "loss": 0.0079, + "step": 348960 + }, + { + "epoch": 1.76, + "learning_rate": 3.591021689008178e-05, + "loss": 0.0054, + "step": 348970 + }, + { + "epoch": 1.76, + "learning_rate": 3.590264919706777e-05, + "loss": 0.0056, + "step": 348980 + }, + { + "epoch": 1.76, + "learning_rate": 3.589508150405376e-05, + "loss": 0.0069, + "step": 348990 + }, + { + "epoch": 1.76, + "learning_rate": 3.5887513811039746e-05, + "loss": 0.0054, + "step": 349000 + }, + { + "epoch": 1.76, + "eval_cer": 0.9144188249085159, + "eval_loss": 0.004665224812924862, + "eval_runtime": 116.662, + "eval_samples_per_second": 17.144, + "eval_steps_per_second": 4.286, + "step": 349000 + }, + { + "epoch": 1.76, + "learning_rate": 3.587994611802574e-05, + "loss": 0.0094, + "step": 349010 + }, + { + "epoch": 1.76, + "learning_rate": 3.587237842501173e-05, + "loss": 0.0063, + "step": 349020 + }, + { + "epoch": 1.76, + "learning_rate": 3.586481073199772e-05, + "loss": 0.006, + "step": 349030 + }, + { + "epoch": 1.76, + "learning_rate": 3.5857243038983706e-05, + "loss": 0.0056, + "step": 349040 + }, + { + "epoch": 1.76, + "learning_rate": 3.5849675345969694e-05, + "loss": 0.0042, + "step": 349050 + }, + { + "epoch": 1.76, + "learning_rate": 3.584210765295568e-05, + "loss": 0.0072, + "step": 349060 + }, + { + "epoch": 1.76, + "learning_rate": 3.583453995994168e-05, + "loss": 0.0063, + "step": 349070 + }, + { + "epoch": 1.76, + "learning_rate": 3.5826972266927666e-05, + "loss": 0.0065, + "step": 349080 + }, + { + "epoch": 1.76, + "learning_rate": 3.5819404573913654e-05, + "loss": 0.0065, + "step": 349090 + }, + { + "epoch": 1.76, + "learning_rate": 3.581183688089964e-05, + "loss": 0.0072, + "step": 349100 + }, + { + "epoch": 1.76, + "learning_rate": 3.580426918788564e-05, + "loss": 0.0069, + "step": 349110 + }, + { + "epoch": 1.76, + "learning_rate": 3.5796701494871625e-05, + "loss": 0.0074, + "step": 349120 + }, + { + "epoch": 1.76, + "learning_rate": 3.5789133801857613e-05, + "loss": 0.011, + "step": 349130 + }, + { + "epoch": 1.76, + "learning_rate": 3.57815661088436e-05, + "loss": 0.0094, + "step": 349140 + }, + { + "epoch": 1.76, + "learning_rate": 3.57739984158296e-05, + "loss": 0.0077, + "step": 349150 + }, + { + "epoch": 1.76, + "learning_rate": 3.5766430722815585e-05, + "loss": 0.0053, + "step": 349160 + }, + { + "epoch": 1.76, + "learning_rate": 3.575886302980157e-05, + "loss": 0.0089, + "step": 349170 + }, + { + "epoch": 1.76, + "learning_rate": 3.575129533678756e-05, + "loss": 0.005, + "step": 349180 + }, + { + "epoch": 1.76, + "learning_rate": 3.574372764377355e-05, + "loss": 0.0079, + "step": 349190 + }, + { + "epoch": 1.76, + "learning_rate": 3.573615995075954e-05, + "loss": 0.0064, + "step": 349200 + }, + { + "epoch": 1.76, + "learning_rate": 3.572859225774553e-05, + "loss": 0.0062, + "step": 349210 + }, + { + "epoch": 1.76, + "learning_rate": 3.572102456473152e-05, + "loss": 0.0062, + "step": 349220 + }, + { + "epoch": 1.76, + "learning_rate": 3.571345687171751e-05, + "loss": 0.0078, + "step": 349230 + }, + { + "epoch": 1.76, + "learning_rate": 3.57058891787035e-05, + "loss": 0.006, + "step": 349240 + }, + { + "epoch": 1.76, + "learning_rate": 3.569832148568949e-05, + "loss": 0.0065, + "step": 349250 + }, + { + "epoch": 1.76, + "learning_rate": 3.569075379267548e-05, + "loss": 0.006, + "step": 349260 + }, + { + "epoch": 1.76, + "learning_rate": 3.568318609966147e-05, + "loss": 0.0066, + "step": 349270 + }, + { + "epoch": 1.76, + "learning_rate": 3.567561840664746e-05, + "loss": 0.0059, + "step": 349280 + }, + { + "epoch": 1.76, + "learning_rate": 3.566805071363345e-05, + "loss": 0.0164, + "step": 349290 + }, + { + "epoch": 1.76, + "learning_rate": 3.566048302061944e-05, + "loss": 0.0047, + "step": 349300 + }, + { + "epoch": 1.76, + "learning_rate": 3.565291532760543e-05, + "loss": 0.0071, + "step": 349310 + }, + { + "epoch": 1.76, + "learning_rate": 3.564534763459142e-05, + "loss": 0.0049, + "step": 349320 + }, + { + "epoch": 1.76, + "learning_rate": 3.563777994157741e-05, + "loss": 0.0056, + "step": 349330 + }, + { + "epoch": 1.76, + "learning_rate": 3.563021224856339e-05, + "loss": 0.0062, + "step": 349340 + }, + { + "epoch": 1.76, + "learning_rate": 3.562264455554938e-05, + "loss": 0.0037, + "step": 349350 + }, + { + "epoch": 1.76, + "learning_rate": 3.5615076862535376e-05, + "loss": 0.0049, + "step": 349360 + }, + { + "epoch": 1.76, + "learning_rate": 3.5607509169521365e-05, + "loss": 0.0062, + "step": 349370 + }, + { + "epoch": 1.76, + "learning_rate": 3.559994147650735e-05, + "loss": 0.0054, + "step": 349380 + }, + { + "epoch": 1.76, + "learning_rate": 3.559237378349334e-05, + "loss": 0.0051, + "step": 349390 + }, + { + "epoch": 1.76, + "learning_rate": 3.5584806090479336e-05, + "loss": 0.0072, + "step": 349400 + }, + { + "epoch": 1.76, + "learning_rate": 3.5577238397465324e-05, + "loss": 0.0067, + "step": 349410 + }, + { + "epoch": 1.76, + "learning_rate": 3.556967070445131e-05, + "loss": 0.0044, + "step": 349420 + }, + { + "epoch": 1.76, + "learning_rate": 3.55621030114373e-05, + "loss": 0.0078, + "step": 349430 + }, + { + "epoch": 1.76, + "learning_rate": 3.5554535318423296e-05, + "loss": 0.0062, + "step": 349440 + }, + { + "epoch": 1.76, + "learning_rate": 3.5546967625409284e-05, + "loss": 0.0049, + "step": 349450 + }, + { + "epoch": 1.76, + "learning_rate": 3.553939993239527e-05, + "loss": 0.0062, + "step": 349460 + }, + { + "epoch": 1.76, + "learning_rate": 3.553183223938127e-05, + "loss": 0.0075, + "step": 349470 + }, + { + "epoch": 1.76, + "learning_rate": 3.5524264546367255e-05, + "loss": 0.0068, + "step": 349480 + }, + { + "epoch": 1.76, + "learning_rate": 3.5516696853353244e-05, + "loss": 0.0057, + "step": 349490 + }, + { + "epoch": 1.76, + "learning_rate": 3.550912916033923e-05, + "loss": 0.0046, + "step": 349500 + }, + { + "epoch": 1.76, + "learning_rate": 3.550156146732522e-05, + "loss": 0.0088, + "step": 349510 + }, + { + "epoch": 1.76, + "learning_rate": 3.549399377431121e-05, + "loss": 0.0046, + "step": 349520 + }, + { + "epoch": 1.76, + "learning_rate": 3.5486426081297196e-05, + "loss": 0.006, + "step": 349530 + }, + { + "epoch": 1.76, + "learning_rate": 3.547885838828319e-05, + "loss": 0.0052, + "step": 349540 + }, + { + "epoch": 1.76, + "learning_rate": 3.547129069526918e-05, + "loss": 0.0061, + "step": 349550 + }, + { + "epoch": 1.76, + "learning_rate": 3.546372300225517e-05, + "loss": 0.0055, + "step": 349560 + }, + { + "epoch": 1.76, + "learning_rate": 3.5456155309241156e-05, + "loss": 0.0058, + "step": 349570 + }, + { + "epoch": 1.76, + "learning_rate": 3.544858761622715e-05, + "loss": 0.0061, + "step": 349580 + }, + { + "epoch": 1.76, + "learning_rate": 3.544101992321314e-05, + "loss": 0.0054, + "step": 349590 + }, + { + "epoch": 1.76, + "learning_rate": 3.543345223019913e-05, + "loss": 0.0048, + "step": 349600 + }, + { + "epoch": 1.76, + "learning_rate": 3.5425884537185116e-05, + "loss": 0.0068, + "step": 349610 + }, + { + "epoch": 1.76, + "learning_rate": 3.541831684417111e-05, + "loss": 0.0054, + "step": 349620 + }, + { + "epoch": 1.76, + "learning_rate": 3.54107491511571e-05, + "loss": 0.0058, + "step": 349630 + }, + { + "epoch": 1.76, + "learning_rate": 3.540318145814309e-05, + "loss": 0.0053, + "step": 349640 + }, + { + "epoch": 1.76, + "learning_rate": 3.5395613765129075e-05, + "loss": 0.0084, + "step": 349650 + }, + { + "epoch": 1.76, + "learning_rate": 3.5388046072115064e-05, + "loss": 0.0062, + "step": 349660 + }, + { + "epoch": 1.76, + "learning_rate": 3.538047837910105e-05, + "loss": 0.0054, + "step": 349670 + }, + { + "epoch": 1.76, + "learning_rate": 3.537291068608705e-05, + "loss": 0.0074, + "step": 349680 + }, + { + "epoch": 1.76, + "learning_rate": 3.5365342993073035e-05, + "loss": 0.0071, + "step": 349690 + }, + { + "epoch": 1.76, + "learning_rate": 3.535777530005902e-05, + "loss": 0.0049, + "step": 349700 + }, + { + "epoch": 1.76, + "learning_rate": 3.535020760704501e-05, + "loss": 0.0072, + "step": 349710 + }, + { + "epoch": 1.76, + "learning_rate": 3.5342639914031006e-05, + "loss": 0.0076, + "step": 349720 + }, + { + "epoch": 1.76, + "learning_rate": 3.5335072221016995e-05, + "loss": 0.0053, + "step": 349730 + }, + { + "epoch": 1.76, + "learning_rate": 3.532750452800298e-05, + "loss": 0.0065, + "step": 349740 + }, + { + "epoch": 1.76, + "learning_rate": 3.531993683498897e-05, + "loss": 0.006, + "step": 349750 + }, + { + "epoch": 1.76, + "learning_rate": 3.5312369141974966e-05, + "loss": 0.0056, + "step": 349760 + }, + { + "epoch": 1.76, + "learning_rate": 3.5304801448960954e-05, + "loss": 0.0109, + "step": 349770 + }, + { + "epoch": 1.76, + "learning_rate": 3.529723375594694e-05, + "loss": 0.0068, + "step": 349780 + }, + { + "epoch": 1.76, + "learning_rate": 3.528966606293293e-05, + "loss": 0.0063, + "step": 349790 + }, + { + "epoch": 1.76, + "learning_rate": 3.5282098369918926e-05, + "loss": 0.0061, + "step": 349800 + }, + { + "epoch": 1.76, + "learning_rate": 3.527453067690491e-05, + "loss": 0.0064, + "step": 349810 + }, + { + "epoch": 1.76, + "learning_rate": 3.52669629838909e-05, + "loss": 0.0091, + "step": 349820 + }, + { + "epoch": 1.76, + "learning_rate": 3.525939529087689e-05, + "loss": 0.0051, + "step": 349830 + }, + { + "epoch": 1.76, + "learning_rate": 3.525182759786288e-05, + "loss": 0.0073, + "step": 349840 + }, + { + "epoch": 1.77, + "learning_rate": 3.524425990484887e-05, + "loss": 0.0059, + "step": 349850 + }, + { + "epoch": 1.77, + "learning_rate": 3.523669221183486e-05, + "loss": 0.0061, + "step": 349860 + }, + { + "epoch": 1.77, + "learning_rate": 3.522912451882085e-05, + "loss": 0.0062, + "step": 349870 + }, + { + "epoch": 1.77, + "learning_rate": 3.522155682580684e-05, + "loss": 0.0074, + "step": 349880 + }, + { + "epoch": 1.77, + "learning_rate": 3.5213989132792826e-05, + "loss": 0.0059, + "step": 349890 + }, + { + "epoch": 1.77, + "learning_rate": 3.520642143977882e-05, + "loss": 0.0059, + "step": 349900 + }, + { + "epoch": 1.77, + "learning_rate": 3.519885374676481e-05, + "loss": 0.0063, + "step": 349910 + }, + { + "epoch": 1.77, + "learning_rate": 3.51912860537508e-05, + "loss": 0.0047, + "step": 349920 + }, + { + "epoch": 1.77, + "learning_rate": 3.5183718360736786e-05, + "loss": 0.0072, + "step": 349930 + }, + { + "epoch": 1.77, + "learning_rate": 3.517615066772278e-05, + "loss": 0.0068, + "step": 349940 + }, + { + "epoch": 1.77, + "learning_rate": 3.516858297470877e-05, + "loss": 0.0076, + "step": 349950 + }, + { + "epoch": 1.77, + "learning_rate": 3.516101528169476e-05, + "loss": 0.0082, + "step": 349960 + }, + { + "epoch": 1.77, + "learning_rate": 3.5153447588680746e-05, + "loss": 0.0096, + "step": 349970 + }, + { + "epoch": 1.77, + "learning_rate": 3.5145879895666734e-05, + "loss": 0.0061, + "step": 349980 + }, + { + "epoch": 1.77, + "learning_rate": 3.513831220265272e-05, + "loss": 0.0044, + "step": 349990 + }, + { + "epoch": 1.77, + "learning_rate": 3.513074450963872e-05, + "loss": 0.0051, + "step": 350000 + }, + { + "epoch": 1.77, + "eval_cer": 0.9144498775845288, + "eval_loss": 0.004672383423894644, + "eval_runtime": 116.7279, + "eval_samples_per_second": 17.134, + "eval_steps_per_second": 4.283, + "step": 350000 + }, + { + "epoch": 1.77, + "learning_rate": 3.5123176816624705e-05, + "loss": 0.0076, + "step": 350010 + }, + { + "epoch": 1.77, + "learning_rate": 3.5115609123610694e-05, + "loss": 0.0069, + "step": 350020 + }, + { + "epoch": 1.77, + "learning_rate": 3.510804143059668e-05, + "loss": 0.0082, + "step": 350030 + }, + { + "epoch": 1.77, + "learning_rate": 3.510047373758268e-05, + "loss": 0.0051, + "step": 350040 + }, + { + "epoch": 1.77, + "learning_rate": 3.5092906044568665e-05, + "loss": 0.0067, + "step": 350050 + }, + { + "epoch": 1.77, + "learning_rate": 3.508533835155465e-05, + "loss": 0.0053, + "step": 350060 + }, + { + "epoch": 1.77, + "learning_rate": 3.507777065854064e-05, + "loss": 0.0052, + "step": 350070 + }, + { + "epoch": 1.77, + "learning_rate": 3.5070202965526637e-05, + "loss": 0.0058, + "step": 350080 + }, + { + "epoch": 1.77, + "learning_rate": 3.5062635272512625e-05, + "loss": 0.0075, + "step": 350090 + }, + { + "epoch": 1.77, + "learning_rate": 3.505506757949861e-05, + "loss": 0.0058, + "step": 350100 + }, + { + "epoch": 1.77, + "learning_rate": 3.50474998864846e-05, + "loss": 0.0072, + "step": 350110 + }, + { + "epoch": 1.77, + "learning_rate": 3.5039932193470596e-05, + "loss": 0.0071, + "step": 350120 + }, + { + "epoch": 1.77, + "learning_rate": 3.503236450045658e-05, + "loss": 0.0058, + "step": 350130 + }, + { + "epoch": 1.77, + "learning_rate": 3.5024796807442566e-05, + "loss": 0.0053, + "step": 350140 + }, + { + "epoch": 1.77, + "learning_rate": 3.501722911442856e-05, + "loss": 0.0057, + "step": 350150 + }, + { + "epoch": 1.77, + "learning_rate": 3.500966142141455e-05, + "loss": 0.006, + "step": 350160 + }, + { + "epoch": 1.77, + "learning_rate": 3.500209372840054e-05, + "loss": 0.005, + "step": 350170 + }, + { + "epoch": 1.77, + "learning_rate": 3.499452603538653e-05, + "loss": 0.0094, + "step": 350180 + }, + { + "epoch": 1.77, + "learning_rate": 3.498695834237252e-05, + "loss": 0.0097, + "step": 350190 + }, + { + "epoch": 1.77, + "learning_rate": 3.497939064935851e-05, + "loss": 0.0058, + "step": 350200 + }, + { + "epoch": 1.77, + "learning_rate": 3.49718229563445e-05, + "loss": 0.0055, + "step": 350210 + }, + { + "epoch": 1.77, + "learning_rate": 3.496425526333049e-05, + "loss": 0.0064, + "step": 350220 + }, + { + "epoch": 1.77, + "learning_rate": 3.495668757031648e-05, + "loss": 0.0089, + "step": 350230 + }, + { + "epoch": 1.77, + "learning_rate": 3.494911987730247e-05, + "loss": 0.0043, + "step": 350240 + }, + { + "epoch": 1.77, + "learning_rate": 3.4941552184288457e-05, + "loss": 0.0054, + "step": 350250 + }, + { + "epoch": 1.77, + "learning_rate": 3.493398449127445e-05, + "loss": 0.0076, + "step": 350260 + }, + { + "epoch": 1.77, + "learning_rate": 3.492641679826044e-05, + "loss": 0.0048, + "step": 350270 + }, + { + "epoch": 1.77, + "learning_rate": 3.491884910524642e-05, + "loss": 0.007, + "step": 350280 + }, + { + "epoch": 1.77, + "learning_rate": 3.4911281412232416e-05, + "loss": 0.0082, + "step": 350290 + }, + { + "epoch": 1.77, + "learning_rate": 3.4903713719218404e-05, + "loss": 0.0069, + "step": 350300 + }, + { + "epoch": 1.77, + "learning_rate": 3.489614602620439e-05, + "loss": 0.0076, + "step": 350310 + }, + { + "epoch": 1.77, + "learning_rate": 3.488857833319038e-05, + "loss": 0.0048, + "step": 350320 + }, + { + "epoch": 1.77, + "learning_rate": 3.4881010640176376e-05, + "loss": 0.0054, + "step": 350330 + }, + { + "epoch": 1.77, + "learning_rate": 3.4873442947162364e-05, + "loss": 0.0047, + "step": 350340 + }, + { + "epoch": 1.77, + "learning_rate": 3.486587525414835e-05, + "loss": 0.0046, + "step": 350350 + }, + { + "epoch": 1.77, + "learning_rate": 3.485830756113434e-05, + "loss": 0.0062, + "step": 350360 + }, + { + "epoch": 1.77, + "learning_rate": 3.4850739868120336e-05, + "loss": 0.0062, + "step": 350370 + }, + { + "epoch": 1.77, + "learning_rate": 3.4843172175106324e-05, + "loss": 0.0056, + "step": 350380 + }, + { + "epoch": 1.77, + "learning_rate": 3.483560448209231e-05, + "loss": 0.0066, + "step": 350390 + }, + { + "epoch": 1.77, + "learning_rate": 3.48280367890783e-05, + "loss": 0.0049, + "step": 350400 + }, + { + "epoch": 1.77, + "learning_rate": 3.4820469096064295e-05, + "loss": 0.0058, + "step": 350410 + }, + { + "epoch": 1.77, + "learning_rate": 3.4812901403050283e-05, + "loss": 0.0108, + "step": 350420 + }, + { + "epoch": 1.77, + "learning_rate": 3.480533371003627e-05, + "loss": 0.0065, + "step": 350430 + }, + { + "epoch": 1.77, + "learning_rate": 3.479776601702226e-05, + "loss": 0.0055, + "step": 350440 + }, + { + "epoch": 1.77, + "learning_rate": 3.479019832400825e-05, + "loss": 0.0056, + "step": 350450 + }, + { + "epoch": 1.77, + "learning_rate": 3.4782630630994236e-05, + "loss": 0.0059, + "step": 350460 + }, + { + "epoch": 1.77, + "learning_rate": 3.477506293798023e-05, + "loss": 0.008, + "step": 350470 + }, + { + "epoch": 1.77, + "learning_rate": 3.476749524496622e-05, + "loss": 0.0048, + "step": 350480 + }, + { + "epoch": 1.77, + "learning_rate": 3.475992755195221e-05, + "loss": 0.0091, + "step": 350490 + }, + { + "epoch": 1.77, + "learning_rate": 3.4752359858938196e-05, + "loss": 0.0069, + "step": 350500 + }, + { + "epoch": 1.77, + "learning_rate": 3.474479216592419e-05, + "loss": 0.006, + "step": 350510 + }, + { + "epoch": 1.77, + "learning_rate": 3.473722447291018e-05, + "loss": 0.0078, + "step": 350520 + }, + { + "epoch": 1.77, + "learning_rate": 3.472965677989617e-05, + "loss": 0.0053, + "step": 350530 + }, + { + "epoch": 1.77, + "learning_rate": 3.4722089086882156e-05, + "loss": 0.0045, + "step": 350540 + }, + { + "epoch": 1.77, + "learning_rate": 3.471452139386815e-05, + "loss": 0.0074, + "step": 350550 + }, + { + "epoch": 1.77, + "learning_rate": 3.470695370085414e-05, + "loss": 0.0072, + "step": 350560 + }, + { + "epoch": 1.77, + "learning_rate": 3.469938600784013e-05, + "loss": 0.0062, + "step": 350570 + }, + { + "epoch": 1.77, + "learning_rate": 3.4691818314826115e-05, + "loss": 0.0072, + "step": 350580 + }, + { + "epoch": 1.77, + "learning_rate": 3.468425062181211e-05, + "loss": 0.0048, + "step": 350590 + }, + { + "epoch": 1.77, + "learning_rate": 3.467668292879809e-05, + "loss": 0.0071, + "step": 350600 + }, + { + "epoch": 1.77, + "learning_rate": 3.466911523578409e-05, + "loss": 0.0056, + "step": 350610 + }, + { + "epoch": 1.77, + "learning_rate": 3.4661547542770075e-05, + "loss": 0.0064, + "step": 350620 + }, + { + "epoch": 1.77, + "learning_rate": 3.465397984975606e-05, + "loss": 0.0064, + "step": 350630 + }, + { + "epoch": 1.77, + "learning_rate": 3.464641215674205e-05, + "loss": 0.007, + "step": 350640 + }, + { + "epoch": 1.77, + "learning_rate": 3.4638844463728046e-05, + "loss": 0.0062, + "step": 350650 + }, + { + "epoch": 1.77, + "learning_rate": 3.4631276770714035e-05, + "loss": 0.0057, + "step": 350660 + }, + { + "epoch": 1.77, + "learning_rate": 3.462370907770002e-05, + "loss": 0.0068, + "step": 350670 + }, + { + "epoch": 1.77, + "learning_rate": 3.461614138468601e-05, + "loss": 0.0061, + "step": 350680 + }, + { + "epoch": 1.77, + "learning_rate": 3.4608573691672006e-05, + "loss": 0.005, + "step": 350690 + }, + { + "epoch": 1.77, + "learning_rate": 3.4601005998657994e-05, + "loss": 0.0064, + "step": 350700 + }, + { + "epoch": 1.77, + "learning_rate": 3.459343830564398e-05, + "loss": 0.0048, + "step": 350710 + }, + { + "epoch": 1.77, + "learning_rate": 3.458587061262997e-05, + "loss": 0.0088, + "step": 350720 + }, + { + "epoch": 1.77, + "learning_rate": 3.4578302919615966e-05, + "loss": 0.0046, + "step": 350730 + }, + { + "epoch": 1.77, + "learning_rate": 3.4570735226601954e-05, + "loss": 0.0058, + "step": 350740 + }, + { + "epoch": 1.77, + "learning_rate": 3.456316753358794e-05, + "loss": 0.0047, + "step": 350750 + }, + { + "epoch": 1.77, + "learning_rate": 3.455559984057393e-05, + "loss": 0.0071, + "step": 350760 + }, + { + "epoch": 1.77, + "learning_rate": 3.454803214755992e-05, + "loss": 0.0062, + "step": 350770 + }, + { + "epoch": 1.77, + "learning_rate": 3.454046445454591e-05, + "loss": 0.0065, + "step": 350780 + }, + { + "epoch": 1.77, + "learning_rate": 3.45328967615319e-05, + "loss": 0.0097, + "step": 350790 + }, + { + "epoch": 1.77, + "learning_rate": 3.452532906851789e-05, + "loss": 0.0058, + "step": 350800 + }, + { + "epoch": 1.77, + "learning_rate": 3.451776137550388e-05, + "loss": 0.0065, + "step": 350810 + }, + { + "epoch": 1.77, + "learning_rate": 3.4510193682489866e-05, + "loss": 0.0065, + "step": 350820 + }, + { + "epoch": 1.77, + "learning_rate": 3.450262598947586e-05, + "loss": 0.0097, + "step": 350830 + }, + { + "epoch": 1.77, + "learning_rate": 3.449505829646185e-05, + "loss": 0.0063, + "step": 350840 + }, + { + "epoch": 1.77, + "learning_rate": 3.448749060344784e-05, + "loss": 0.0077, + "step": 350850 + }, + { + "epoch": 1.77, + "learning_rate": 3.4479922910433826e-05, + "loss": 0.0066, + "step": 350860 + }, + { + "epoch": 1.77, + "learning_rate": 3.447235521741982e-05, + "loss": 0.0061, + "step": 350870 + }, + { + "epoch": 1.77, + "learning_rate": 3.446478752440581e-05, + "loss": 0.006, + "step": 350880 + }, + { + "epoch": 1.77, + "learning_rate": 3.44572198313918e-05, + "loss": 0.0057, + "step": 350890 + }, + { + "epoch": 1.77, + "learning_rate": 3.4449652138377786e-05, + "loss": 0.0061, + "step": 350900 + }, + { + "epoch": 1.77, + "learning_rate": 3.4442084445363774e-05, + "loss": 0.0068, + "step": 350910 + }, + { + "epoch": 1.77, + "learning_rate": 3.443451675234976e-05, + "loss": 0.0059, + "step": 350920 + }, + { + "epoch": 1.77, + "learning_rate": 3.442694905933576e-05, + "loss": 0.0079, + "step": 350930 + }, + { + "epoch": 1.77, + "learning_rate": 3.4419381366321745e-05, + "loss": 0.0072, + "step": 350940 + }, + { + "epoch": 1.77, + "learning_rate": 3.4411813673307734e-05, + "loss": 0.0075, + "step": 350950 + }, + { + "epoch": 1.77, + "learning_rate": 3.440424598029372e-05, + "loss": 0.0074, + "step": 350960 + }, + { + "epoch": 1.77, + "learning_rate": 3.439667828727972e-05, + "loss": 0.0089, + "step": 350970 + }, + { + "epoch": 1.77, + "learning_rate": 3.4389110594265705e-05, + "loss": 0.006, + "step": 350980 + }, + { + "epoch": 1.77, + "learning_rate": 3.438154290125169e-05, + "loss": 0.0046, + "step": 350990 + }, + { + "epoch": 1.77, + "learning_rate": 3.437397520823768e-05, + "loss": 0.0077, + "step": 351000 + }, + { + "epoch": 1.77, + "eval_cer": 0.9144362920387732, + "eval_loss": 0.004640540108084679, + "eval_runtime": 116.6521, + "eval_samples_per_second": 17.145, + "eval_steps_per_second": 4.286, + "step": 351000 + }, + { + "epoch": 1.77, + "learning_rate": 3.4366407515223676e-05, + "loss": 0.0048, + "step": 351010 + }, + { + "epoch": 1.77, + "learning_rate": 3.4358839822209665e-05, + "loss": 0.0067, + "step": 351020 + }, + { + "epoch": 1.77, + "learning_rate": 3.435127212919565e-05, + "loss": 0.0061, + "step": 351030 + }, + { + "epoch": 1.77, + "learning_rate": 3.434370443618164e-05, + "loss": 0.0076, + "step": 351040 + }, + { + "epoch": 1.77, + "learning_rate": 3.4336136743167636e-05, + "loss": 0.0064, + "step": 351050 + }, + { + "epoch": 1.77, + "learning_rate": 3.4328569050153624e-05, + "loss": 0.0058, + "step": 351060 + }, + { + "epoch": 1.77, + "learning_rate": 3.4321001357139606e-05, + "loss": 0.0062, + "step": 351070 + }, + { + "epoch": 1.77, + "learning_rate": 3.43134336641256e-05, + "loss": 0.005, + "step": 351080 + }, + { + "epoch": 1.77, + "learning_rate": 3.430586597111159e-05, + "loss": 0.006, + "step": 351090 + }, + { + "epoch": 1.77, + "learning_rate": 3.429829827809758e-05, + "loss": 0.0062, + "step": 351100 + }, + { + "epoch": 1.77, + "learning_rate": 3.4290730585083565e-05, + "loss": 0.0078, + "step": 351110 + }, + { + "epoch": 1.77, + "learning_rate": 3.428316289206956e-05, + "loss": 0.0064, + "step": 351120 + }, + { + "epoch": 1.77, + "learning_rate": 3.427559519905555e-05, + "loss": 0.0045, + "step": 351130 + }, + { + "epoch": 1.77, + "learning_rate": 3.426802750604154e-05, + "loss": 0.0068, + "step": 351140 + }, + { + "epoch": 1.77, + "learning_rate": 3.426045981302753e-05, + "loss": 0.0054, + "step": 351150 + }, + { + "epoch": 1.77, + "learning_rate": 3.425289212001352e-05, + "loss": 0.006, + "step": 351160 + }, + { + "epoch": 1.77, + "learning_rate": 3.424532442699951e-05, + "loss": 0.0046, + "step": 351170 + }, + { + "epoch": 1.77, + "learning_rate": 3.4237756733985496e-05, + "loss": 0.0049, + "step": 351180 + }, + { + "epoch": 1.77, + "learning_rate": 3.423018904097149e-05, + "loss": 0.006, + "step": 351190 + }, + { + "epoch": 1.77, + "learning_rate": 3.422262134795748e-05, + "loss": 0.0057, + "step": 351200 + }, + { + "epoch": 1.77, + "learning_rate": 3.421505365494347e-05, + "loss": 0.0058, + "step": 351210 + }, + { + "epoch": 1.77, + "learning_rate": 3.4207485961929456e-05, + "loss": 0.0075, + "step": 351220 + }, + { + "epoch": 1.77, + "learning_rate": 3.4199918268915444e-05, + "loss": 0.0091, + "step": 351230 + }, + { + "epoch": 1.77, + "learning_rate": 3.419235057590143e-05, + "loss": 0.0062, + "step": 351240 + }, + { + "epoch": 1.77, + "learning_rate": 3.418478288288742e-05, + "loss": 0.0051, + "step": 351250 + }, + { + "epoch": 1.77, + "learning_rate": 3.4177215189873416e-05, + "loss": 0.0049, + "step": 351260 + }, + { + "epoch": 1.77, + "learning_rate": 3.4169647496859404e-05, + "loss": 0.0065, + "step": 351270 + }, + { + "epoch": 1.77, + "learning_rate": 3.416207980384539e-05, + "loss": 0.006, + "step": 351280 + }, + { + "epoch": 1.77, + "learning_rate": 3.415451211083138e-05, + "loss": 0.0072, + "step": 351290 + }, + { + "epoch": 1.77, + "learning_rate": 3.4146944417817375e-05, + "loss": 0.0039, + "step": 351300 + }, + { + "epoch": 1.77, + "learning_rate": 3.4139376724803364e-05, + "loss": 0.0055, + "step": 351310 + }, + { + "epoch": 1.77, + "learning_rate": 3.413180903178935e-05, + "loss": 0.0059, + "step": 351320 + }, + { + "epoch": 1.77, + "learning_rate": 3.412424133877534e-05, + "loss": 0.006, + "step": 351330 + }, + { + "epoch": 1.77, + "learning_rate": 3.4116673645761335e-05, + "loss": 0.0073, + "step": 351340 + }, + { + "epoch": 1.77, + "learning_rate": 3.410910595274732e-05, + "loss": 0.0059, + "step": 351350 + }, + { + "epoch": 1.77, + "learning_rate": 3.410153825973331e-05, + "loss": 0.0052, + "step": 351360 + }, + { + "epoch": 1.77, + "learning_rate": 3.40939705667193e-05, + "loss": 0.0047, + "step": 351370 + }, + { + "epoch": 1.77, + "learning_rate": 3.408640287370529e-05, + "loss": 0.0061, + "step": 351380 + }, + { + "epoch": 1.77, + "learning_rate": 3.4078835180691276e-05, + "loss": 0.0064, + "step": 351390 + }, + { + "epoch": 1.77, + "learning_rate": 3.407126748767727e-05, + "loss": 0.0049, + "step": 351400 + }, + { + "epoch": 1.77, + "learning_rate": 3.406369979466326e-05, + "loss": 0.0059, + "step": 351410 + }, + { + "epoch": 1.77, + "learning_rate": 3.405613210164925e-05, + "loss": 0.0064, + "step": 351420 + }, + { + "epoch": 1.77, + "learning_rate": 3.4048564408635236e-05, + "loss": 0.0067, + "step": 351430 + }, + { + "epoch": 1.77, + "learning_rate": 3.404099671562123e-05, + "loss": 0.0066, + "step": 351440 + }, + { + "epoch": 1.77, + "learning_rate": 3.403342902260722e-05, + "loss": 0.0073, + "step": 351450 + }, + { + "epoch": 1.77, + "learning_rate": 3.402586132959321e-05, + "loss": 0.006, + "step": 351460 + }, + { + "epoch": 1.77, + "learning_rate": 3.4018293636579195e-05, + "loss": 0.0056, + "step": 351470 + }, + { + "epoch": 1.77, + "learning_rate": 3.401072594356519e-05, + "loss": 0.0053, + "step": 351480 + }, + { + "epoch": 1.77, + "learning_rate": 3.400315825055118e-05, + "loss": 0.0055, + "step": 351490 + }, + { + "epoch": 1.77, + "learning_rate": 3.399559055753717e-05, + "loss": 0.0057, + "step": 351500 + }, + { + "epoch": 1.77, + "learning_rate": 3.3988022864523155e-05, + "loss": 0.0054, + "step": 351510 + }, + { + "epoch": 1.77, + "learning_rate": 3.398045517150915e-05, + "loss": 0.0051, + "step": 351520 + }, + { + "epoch": 1.77, + "learning_rate": 3.397288747849514e-05, + "loss": 0.0158, + "step": 351530 + }, + { + "epoch": 1.77, + "learning_rate": 3.3965319785481127e-05, + "loss": 0.0091, + "step": 351540 + }, + { + "epoch": 1.77, + "learning_rate": 3.3957752092467115e-05, + "loss": 0.0065, + "step": 351550 + }, + { + "epoch": 1.77, + "learning_rate": 3.39501843994531e-05, + "loss": 0.0068, + "step": 351560 + }, + { + "epoch": 1.77, + "learning_rate": 3.394261670643909e-05, + "loss": 0.0058, + "step": 351570 + }, + { + "epoch": 1.77, + "learning_rate": 3.3935049013425086e-05, + "loss": 0.0058, + "step": 351580 + }, + { + "epoch": 1.77, + "learning_rate": 3.3927481320411074e-05, + "loss": 0.0045, + "step": 351590 + }, + { + "epoch": 1.77, + "learning_rate": 3.391991362739706e-05, + "loss": 0.0081, + "step": 351600 + }, + { + "epoch": 1.77, + "learning_rate": 3.391234593438305e-05, + "loss": 0.0047, + "step": 351610 + }, + { + "epoch": 1.77, + "learning_rate": 3.3904778241369046e-05, + "loss": 0.0045, + "step": 351620 + }, + { + "epoch": 1.77, + "learning_rate": 3.3897210548355034e-05, + "loss": 0.005, + "step": 351630 + }, + { + "epoch": 1.77, + "learning_rate": 3.388964285534102e-05, + "loss": 0.0061, + "step": 351640 + }, + { + "epoch": 1.77, + "learning_rate": 3.388207516232701e-05, + "loss": 0.0047, + "step": 351650 + }, + { + "epoch": 1.77, + "learning_rate": 3.3874507469313005e-05, + "loss": 0.0056, + "step": 351660 + }, + { + "epoch": 1.77, + "learning_rate": 3.3866939776298994e-05, + "loss": 0.0053, + "step": 351670 + }, + { + "epoch": 1.77, + "learning_rate": 3.385937208328498e-05, + "loss": 0.0084, + "step": 351680 + }, + { + "epoch": 1.77, + "learning_rate": 3.385180439027097e-05, + "loss": 0.0062, + "step": 351690 + }, + { + "epoch": 1.77, + "learning_rate": 3.384423669725696e-05, + "loss": 0.0038, + "step": 351700 + }, + { + "epoch": 1.77, + "learning_rate": 3.3836669004242947e-05, + "loss": 0.0053, + "step": 351710 + }, + { + "epoch": 1.77, + "learning_rate": 3.382910131122894e-05, + "loss": 0.0067, + "step": 351720 + }, + { + "epoch": 1.77, + "learning_rate": 3.382153361821493e-05, + "loss": 0.0062, + "step": 351730 + }, + { + "epoch": 1.77, + "learning_rate": 3.381396592520092e-05, + "loss": 0.0066, + "step": 351740 + }, + { + "epoch": 1.77, + "learning_rate": 3.3806398232186906e-05, + "loss": 0.0072, + "step": 351750 + }, + { + "epoch": 1.77, + "learning_rate": 3.37988305391729e-05, + "loss": 0.0048, + "step": 351760 + }, + { + "epoch": 1.77, + "learning_rate": 3.379126284615889e-05, + "loss": 0.0057, + "step": 351770 + }, + { + "epoch": 1.77, + "learning_rate": 3.378369515314488e-05, + "loss": 0.0052, + "step": 351780 + }, + { + "epoch": 1.77, + "learning_rate": 3.3776127460130866e-05, + "loss": 0.0088, + "step": 351790 + }, + { + "epoch": 1.77, + "learning_rate": 3.376855976711686e-05, + "loss": 0.0054, + "step": 351800 + }, + { + "epoch": 1.77, + "learning_rate": 3.376099207410285e-05, + "loss": 0.0057, + "step": 351810 + }, + { + "epoch": 1.77, + "learning_rate": 3.375342438108884e-05, + "loss": 0.0049, + "step": 351820 + }, + { + "epoch": 1.78, + "learning_rate": 3.3745856688074826e-05, + "loss": 0.0052, + "step": 351830 + }, + { + "epoch": 1.78, + "learning_rate": 3.373828899506082e-05, + "loss": 0.004, + "step": 351840 + }, + { + "epoch": 1.78, + "learning_rate": 3.37307213020468e-05, + "loss": 0.0054, + "step": 351850 + }, + { + "epoch": 1.78, + "learning_rate": 3.37231536090328e-05, + "loss": 0.0081, + "step": 351860 + }, + { + "epoch": 1.78, + "learning_rate": 3.3715585916018785e-05, + "loss": 0.0075, + "step": 351870 + }, + { + "epoch": 1.78, + "learning_rate": 3.3708018223004773e-05, + "loss": 0.0047, + "step": 351880 + }, + { + "epoch": 1.78, + "learning_rate": 3.370045052999076e-05, + "loss": 0.0107, + "step": 351890 + }, + { + "epoch": 1.78, + "learning_rate": 3.369288283697676e-05, + "loss": 0.0055, + "step": 351900 + }, + { + "epoch": 1.78, + "learning_rate": 3.3685315143962745e-05, + "loss": 0.0044, + "step": 351910 + }, + { + "epoch": 1.78, + "learning_rate": 3.367774745094873e-05, + "loss": 0.0042, + "step": 351920 + }, + { + "epoch": 1.78, + "learning_rate": 3.367017975793472e-05, + "loss": 0.0069, + "step": 351930 + }, + { + "epoch": 1.78, + "learning_rate": 3.3662612064920716e-05, + "loss": 0.0058, + "step": 351940 + }, + { + "epoch": 1.78, + "learning_rate": 3.3655044371906704e-05, + "loss": 0.007, + "step": 351950 + }, + { + "epoch": 1.78, + "learning_rate": 3.364747667889269e-05, + "loss": 0.0055, + "step": 351960 + }, + { + "epoch": 1.78, + "learning_rate": 3.363990898587868e-05, + "loss": 0.0078, + "step": 351970 + }, + { + "epoch": 1.78, + "learning_rate": 3.3632341292864676e-05, + "loss": 0.0082, + "step": 351980 + }, + { + "epoch": 1.78, + "learning_rate": 3.3624773599850664e-05, + "loss": 0.0066, + "step": 351990 + }, + { + "epoch": 1.78, + "learning_rate": 3.361720590683665e-05, + "loss": 0.0054, + "step": 352000 + }, + { + "epoch": 1.78, + "eval_cer": 0.9144343512465224, + "eval_loss": 0.0045296261087059975, + "eval_runtime": 116.5512, + "eval_samples_per_second": 17.16, + "eval_steps_per_second": 4.29, + "step": 352000 + }, + { + "epoch": 1.78, + "learning_rate": 3.360963821382264e-05, + "loss": 0.005, + "step": 352010 + }, + { + "epoch": 1.78, + "learning_rate": 3.360207052080863e-05, + "loss": 0.0078, + "step": 352020 + }, + { + "epoch": 1.78, + "learning_rate": 3.359450282779462e-05, + "loss": 0.0063, + "step": 352030 + }, + { + "epoch": 1.78, + "learning_rate": 3.3586935134780605e-05, + "loss": 0.0055, + "step": 352040 + }, + { + "epoch": 1.78, + "learning_rate": 3.35793674417666e-05, + "loss": 0.0039, + "step": 352050 + }, + { + "epoch": 1.78, + "learning_rate": 3.357179974875259e-05, + "loss": 0.0047, + "step": 352060 + }, + { + "epoch": 1.78, + "learning_rate": 3.356423205573858e-05, + "loss": 0.0048, + "step": 352070 + }, + { + "epoch": 1.78, + "learning_rate": 3.3556664362724565e-05, + "loss": 0.0067, + "step": 352080 + }, + { + "epoch": 1.78, + "learning_rate": 3.354909666971056e-05, + "loss": 0.0095, + "step": 352090 + }, + { + "epoch": 1.78, + "learning_rate": 3.354152897669655e-05, + "loss": 0.005, + "step": 352100 + }, + { + "epoch": 1.78, + "learning_rate": 3.3533961283682536e-05, + "loss": 0.0059, + "step": 352110 + }, + { + "epoch": 1.78, + "learning_rate": 3.352639359066853e-05, + "loss": 0.0076, + "step": 352120 + }, + { + "epoch": 1.78, + "learning_rate": 3.351882589765452e-05, + "loss": 0.0042, + "step": 352130 + }, + { + "epoch": 1.78, + "learning_rate": 3.351125820464051e-05, + "loss": 0.0074, + "step": 352140 + }, + { + "epoch": 1.78, + "learning_rate": 3.3503690511626496e-05, + "loss": 0.0046, + "step": 352150 + }, + { + "epoch": 1.78, + "learning_rate": 3.349612281861249e-05, + "loss": 0.0053, + "step": 352160 + }, + { + "epoch": 1.78, + "learning_rate": 3.348855512559847e-05, + "loss": 0.0071, + "step": 352170 + }, + { + "epoch": 1.78, + "learning_rate": 3.348098743258446e-05, + "loss": 0.0051, + "step": 352180 + }, + { + "epoch": 1.78, + "learning_rate": 3.3473419739570456e-05, + "loss": 0.0065, + "step": 352190 + }, + { + "epoch": 1.78, + "learning_rate": 3.3465852046556444e-05, + "loss": 0.0063, + "step": 352200 + }, + { + "epoch": 1.78, + "learning_rate": 3.345828435354243e-05, + "loss": 0.0072, + "step": 352210 + }, + { + "epoch": 1.78, + "learning_rate": 3.345071666052842e-05, + "loss": 0.0077, + "step": 352220 + }, + { + "epoch": 1.78, + "learning_rate": 3.3443148967514415e-05, + "loss": 0.0075, + "step": 352230 + }, + { + "epoch": 1.78, + "learning_rate": 3.3435581274500403e-05, + "loss": 0.0054, + "step": 352240 + }, + { + "epoch": 1.78, + "learning_rate": 3.342801358148639e-05, + "loss": 0.0065, + "step": 352250 + }, + { + "epoch": 1.78, + "learning_rate": 3.342044588847238e-05, + "loss": 0.0053, + "step": 352260 + }, + { + "epoch": 1.78, + "learning_rate": 3.3412878195458375e-05, + "loss": 0.007, + "step": 352270 + }, + { + "epoch": 1.78, + "learning_rate": 3.340531050244436e-05, + "loss": 0.0059, + "step": 352280 + }, + { + "epoch": 1.78, + "learning_rate": 3.339774280943035e-05, + "loss": 0.0067, + "step": 352290 + }, + { + "epoch": 1.78, + "learning_rate": 3.339017511641634e-05, + "loss": 0.0048, + "step": 352300 + }, + { + "epoch": 1.78, + "learning_rate": 3.3382607423402335e-05, + "loss": 0.0072, + "step": 352310 + }, + { + "epoch": 1.78, + "learning_rate": 3.337503973038832e-05, + "loss": 0.007, + "step": 352320 + }, + { + "epoch": 1.78, + "learning_rate": 3.336747203737431e-05, + "loss": 0.0072, + "step": 352330 + }, + { + "epoch": 1.78, + "learning_rate": 3.33599043443603e-05, + "loss": 0.0063, + "step": 352340 + }, + { + "epoch": 1.78, + "learning_rate": 3.335233665134629e-05, + "loss": 0.0044, + "step": 352350 + }, + { + "epoch": 1.78, + "learning_rate": 3.3344768958332276e-05, + "loss": 0.0051, + "step": 352360 + }, + { + "epoch": 1.78, + "learning_rate": 3.333720126531827e-05, + "loss": 0.0069, + "step": 352370 + }, + { + "epoch": 1.78, + "learning_rate": 3.332963357230426e-05, + "loss": 0.0052, + "step": 352380 + }, + { + "epoch": 1.78, + "learning_rate": 3.332206587929025e-05, + "loss": 0.0093, + "step": 352390 + }, + { + "epoch": 1.78, + "learning_rate": 3.3314498186276235e-05, + "loss": 0.0068, + "step": 352400 + }, + { + "epoch": 1.78, + "learning_rate": 3.330693049326223e-05, + "loss": 0.0053, + "step": 352410 + }, + { + "epoch": 1.78, + "learning_rate": 3.329936280024822e-05, + "loss": 0.0084, + "step": 352420 + }, + { + "epoch": 1.78, + "learning_rate": 3.329179510723421e-05, + "loss": 0.0045, + "step": 352430 + }, + { + "epoch": 1.78, + "learning_rate": 3.3284227414220195e-05, + "loss": 0.006, + "step": 352440 + }, + { + "epoch": 1.78, + "learning_rate": 3.327665972120619e-05, + "loss": 0.0049, + "step": 352450 + }, + { + "epoch": 1.78, + "learning_rate": 3.326909202819218e-05, + "loss": 0.0075, + "step": 352460 + }, + { + "epoch": 1.78, + "learning_rate": 3.3261524335178166e-05, + "loss": 0.0065, + "step": 352470 + }, + { + "epoch": 1.78, + "learning_rate": 3.3253956642164155e-05, + "loss": 0.0058, + "step": 352480 + }, + { + "epoch": 1.78, + "learning_rate": 3.324638894915014e-05, + "loss": 0.0062, + "step": 352490 + }, + { + "epoch": 1.78, + "learning_rate": 3.323882125613613e-05, + "loss": 0.0051, + "step": 352500 + }, + { + "epoch": 1.78, + "learning_rate": 3.3231253563122126e-05, + "loss": 0.0049, + "step": 352510 + }, + { + "epoch": 1.78, + "learning_rate": 3.3223685870108114e-05, + "loss": 0.006, + "step": 352520 + }, + { + "epoch": 1.78, + "learning_rate": 3.32161181770941e-05, + "loss": 0.0061, + "step": 352530 + }, + { + "epoch": 1.78, + "learning_rate": 3.320855048408009e-05, + "loss": 0.0051, + "step": 352540 + }, + { + "epoch": 1.78, + "learning_rate": 3.3200982791066086e-05, + "loss": 0.0095, + "step": 352550 + }, + { + "epoch": 1.78, + "learning_rate": 3.3193415098052074e-05, + "loss": 0.0056, + "step": 352560 + }, + { + "epoch": 1.78, + "learning_rate": 3.318584740503806e-05, + "loss": 0.0069, + "step": 352570 + }, + { + "epoch": 1.78, + "learning_rate": 3.317827971202405e-05, + "loss": 0.0063, + "step": 352580 + }, + { + "epoch": 1.78, + "learning_rate": 3.3170712019010045e-05, + "loss": 0.0052, + "step": 352590 + }, + { + "epoch": 1.78, + "learning_rate": 3.3163144325996034e-05, + "loss": 0.008, + "step": 352600 + }, + { + "epoch": 1.78, + "learning_rate": 3.315557663298202e-05, + "loss": 0.0064, + "step": 352610 + }, + { + "epoch": 1.78, + "learning_rate": 3.314800893996801e-05, + "loss": 0.0057, + "step": 352620 + }, + { + "epoch": 1.78, + "learning_rate": 3.3140441246954005e-05, + "loss": 0.0068, + "step": 352630 + }, + { + "epoch": 1.78, + "learning_rate": 3.3132873553939986e-05, + "loss": 0.007, + "step": 352640 + }, + { + "epoch": 1.78, + "learning_rate": 3.312530586092598e-05, + "loss": 0.0043, + "step": 352650 + }, + { + "epoch": 1.78, + "learning_rate": 3.311773816791197e-05, + "loss": 0.0061, + "step": 352660 + }, + { + "epoch": 1.78, + "learning_rate": 3.311017047489796e-05, + "loss": 0.0048, + "step": 352670 + }, + { + "epoch": 1.78, + "learning_rate": 3.3102602781883946e-05, + "loss": 0.0068, + "step": 352680 + }, + { + "epoch": 1.78, + "learning_rate": 3.309503508886994e-05, + "loss": 0.0057, + "step": 352690 + }, + { + "epoch": 1.78, + "learning_rate": 3.308746739585593e-05, + "loss": 0.0065, + "step": 352700 + }, + { + "epoch": 1.78, + "learning_rate": 3.307989970284192e-05, + "loss": 0.0067, + "step": 352710 + }, + { + "epoch": 1.78, + "learning_rate": 3.3072332009827906e-05, + "loss": 0.0057, + "step": 352720 + }, + { + "epoch": 1.78, + "learning_rate": 3.30647643168139e-05, + "loss": 0.005, + "step": 352730 + }, + { + "epoch": 1.78, + "learning_rate": 3.305719662379989e-05, + "loss": 0.0053, + "step": 352740 + }, + { + "epoch": 1.78, + "learning_rate": 3.304962893078588e-05, + "loss": 0.0055, + "step": 352750 + }, + { + "epoch": 1.78, + "learning_rate": 3.3042061237771865e-05, + "loss": 0.0074, + "step": 352760 + }, + { + "epoch": 1.78, + "learning_rate": 3.303449354475786e-05, + "loss": 0.0051, + "step": 352770 + }, + { + "epoch": 1.78, + "learning_rate": 3.302692585174385e-05, + "loss": 0.0059, + "step": 352780 + }, + { + "epoch": 1.78, + "learning_rate": 3.301935815872984e-05, + "loss": 0.0053, + "step": 352790 + }, + { + "epoch": 1.78, + "learning_rate": 3.3011790465715825e-05, + "loss": 0.0064, + "step": 352800 + }, + { + "epoch": 1.78, + "learning_rate": 3.300422277270181e-05, + "loss": 0.0094, + "step": 352810 + }, + { + "epoch": 1.78, + "learning_rate": 3.29966550796878e-05, + "loss": 0.0074, + "step": 352820 + }, + { + "epoch": 1.78, + "learning_rate": 3.2989087386673796e-05, + "loss": 0.0062, + "step": 352830 + }, + { + "epoch": 1.78, + "learning_rate": 3.2981519693659785e-05, + "loss": 0.0058, + "step": 352840 + }, + { + "epoch": 1.78, + "learning_rate": 3.297395200064577e-05, + "loss": 0.0072, + "step": 352850 + }, + { + "epoch": 1.78, + "learning_rate": 3.296638430763176e-05, + "loss": 0.0064, + "step": 352860 + }, + { + "epoch": 1.78, + "learning_rate": 3.2958816614617756e-05, + "loss": 0.0061, + "step": 352870 + }, + { + "epoch": 1.78, + "learning_rate": 3.2951248921603744e-05, + "loss": 0.0046, + "step": 352880 + }, + { + "epoch": 1.78, + "learning_rate": 3.294368122858973e-05, + "loss": 0.0049, + "step": 352890 + }, + { + "epoch": 1.78, + "learning_rate": 3.293611353557572e-05, + "loss": 0.0062, + "step": 352900 + }, + { + "epoch": 1.78, + "learning_rate": 3.2928545842561716e-05, + "loss": 0.0092, + "step": 352910 + }, + { + "epoch": 1.78, + "learning_rate": 3.2920978149547704e-05, + "loss": 0.0059, + "step": 352920 + }, + { + "epoch": 1.78, + "learning_rate": 3.291341045653369e-05, + "loss": 0.0047, + "step": 352930 + }, + { + "epoch": 1.78, + "learning_rate": 3.290584276351968e-05, + "loss": 0.0057, + "step": 352940 + }, + { + "epoch": 1.78, + "learning_rate": 3.289827507050567e-05, + "loss": 0.006, + "step": 352950 + }, + { + "epoch": 1.78, + "learning_rate": 3.289070737749166e-05, + "loss": 0.0046, + "step": 352960 + }, + { + "epoch": 1.78, + "learning_rate": 3.2883139684477645e-05, + "loss": 0.0061, + "step": 352970 + }, + { + "epoch": 1.78, + "learning_rate": 3.287557199146364e-05, + "loss": 0.0057, + "step": 352980 + }, + { + "epoch": 1.78, + "learning_rate": 3.286800429844963e-05, + "loss": 0.0086, + "step": 352990 + }, + { + "epoch": 1.78, + "learning_rate": 3.2860436605435617e-05, + "loss": 0.0081, + "step": 353000 + }, + { + "epoch": 1.78, + "eval_cer": 0.9144139729278888, + "eval_loss": 0.0045607974752783775, + "eval_runtime": 116.7751, + "eval_samples_per_second": 17.127, + "eval_steps_per_second": 4.282, + "step": 353000 + }, + { + "epoch": 1.78, + "learning_rate": 3.2852868912421605e-05, + "loss": 0.0066, + "step": 353010 + }, + { + "epoch": 1.78, + "learning_rate": 3.28453012194076e-05, + "loss": 0.0069, + "step": 353020 + }, + { + "epoch": 1.78, + "learning_rate": 3.283773352639359e-05, + "loss": 0.0071, + "step": 353030 + }, + { + "epoch": 1.78, + "learning_rate": 3.2830165833379576e-05, + "loss": 0.009, + "step": 353040 + }, + { + "epoch": 1.78, + "learning_rate": 3.2822598140365564e-05, + "loss": 0.0079, + "step": 353050 + }, + { + "epoch": 1.78, + "learning_rate": 3.281503044735156e-05, + "loss": 0.0056, + "step": 353060 + }, + { + "epoch": 1.78, + "learning_rate": 3.280746275433755e-05, + "loss": 0.0065, + "step": 353070 + }, + { + "epoch": 1.78, + "learning_rate": 3.2799895061323536e-05, + "loss": 0.0054, + "step": 353080 + }, + { + "epoch": 1.78, + "learning_rate": 3.279232736830953e-05, + "loss": 0.0054, + "step": 353090 + }, + { + "epoch": 1.78, + "learning_rate": 3.278475967529552e-05, + "loss": 0.0043, + "step": 353100 + }, + { + "epoch": 1.78, + "learning_rate": 3.27771919822815e-05, + "loss": 0.0075, + "step": 353110 + }, + { + "epoch": 1.78, + "learning_rate": 3.2769624289267496e-05, + "loss": 0.0059, + "step": 353120 + }, + { + "epoch": 1.78, + "learning_rate": 3.2762056596253484e-05, + "loss": 0.006, + "step": 353130 + }, + { + "epoch": 1.78, + "learning_rate": 3.275448890323947e-05, + "loss": 0.0052, + "step": 353140 + }, + { + "epoch": 1.78, + "learning_rate": 3.274692121022546e-05, + "loss": 0.0079, + "step": 353150 + }, + { + "epoch": 1.78, + "learning_rate": 3.2739353517211455e-05, + "loss": 0.0156, + "step": 353160 + }, + { + "epoch": 1.78, + "learning_rate": 3.273178582419744e-05, + "loss": 0.0114, + "step": 353170 + }, + { + "epoch": 1.78, + "learning_rate": 3.272421813118343e-05, + "loss": 0.0084, + "step": 353180 + }, + { + "epoch": 1.78, + "learning_rate": 3.271665043816942e-05, + "loss": 0.0069, + "step": 353190 + }, + { + "epoch": 1.78, + "learning_rate": 3.2709082745155415e-05, + "loss": 0.0052, + "step": 353200 + }, + { + "epoch": 1.78, + "learning_rate": 3.27015150521414e-05, + "loss": 0.0043, + "step": 353210 + }, + { + "epoch": 1.78, + "learning_rate": 3.269394735912739e-05, + "loss": 0.0046, + "step": 353220 + }, + { + "epoch": 1.78, + "learning_rate": 3.268637966611338e-05, + "loss": 0.0058, + "step": 353230 + }, + { + "epoch": 1.78, + "learning_rate": 3.2678811973099374e-05, + "loss": 0.0052, + "step": 353240 + }, + { + "epoch": 1.78, + "learning_rate": 3.267124428008536e-05, + "loss": 0.0074, + "step": 353250 + }, + { + "epoch": 1.78, + "learning_rate": 3.266367658707135e-05, + "loss": 0.0065, + "step": 353260 + }, + { + "epoch": 1.78, + "learning_rate": 3.265610889405734e-05, + "loss": 0.0044, + "step": 353270 + }, + { + "epoch": 1.78, + "learning_rate": 3.264854120104333e-05, + "loss": 0.0045, + "step": 353280 + }, + { + "epoch": 1.78, + "learning_rate": 3.2640973508029316e-05, + "loss": 0.0074, + "step": 353290 + }, + { + "epoch": 1.78, + "learning_rate": 3.263340581501531e-05, + "loss": 0.0061, + "step": 353300 + }, + { + "epoch": 1.78, + "learning_rate": 3.26258381220013e-05, + "loss": 0.007, + "step": 353310 + }, + { + "epoch": 1.78, + "learning_rate": 3.261827042898729e-05, + "loss": 0.007, + "step": 353320 + }, + { + "epoch": 1.78, + "learning_rate": 3.2610702735973275e-05, + "loss": 0.0055, + "step": 353330 + }, + { + "epoch": 1.78, + "learning_rate": 3.260313504295927e-05, + "loss": 0.0072, + "step": 353340 + }, + { + "epoch": 1.78, + "learning_rate": 3.259556734994526e-05, + "loss": 0.006, + "step": 353350 + }, + { + "epoch": 1.78, + "learning_rate": 3.258799965693125e-05, + "loss": 0.0064, + "step": 353360 + }, + { + "epoch": 1.78, + "learning_rate": 3.2580431963917235e-05, + "loss": 0.0087, + "step": 353370 + }, + { + "epoch": 1.78, + "learning_rate": 3.257286427090323e-05, + "loss": 0.0064, + "step": 353380 + }, + { + "epoch": 1.78, + "learning_rate": 3.256529657788922e-05, + "loss": 0.0054, + "step": 353390 + }, + { + "epoch": 1.78, + "learning_rate": 3.2557728884875206e-05, + "loss": 0.0041, + "step": 353400 + }, + { + "epoch": 1.78, + "learning_rate": 3.2550161191861195e-05, + "loss": 0.0052, + "step": 353410 + }, + { + "epoch": 1.78, + "learning_rate": 3.254259349884719e-05, + "loss": 0.0048, + "step": 353420 + }, + { + "epoch": 1.78, + "learning_rate": 3.253502580583317e-05, + "loss": 0.0059, + "step": 353430 + }, + { + "epoch": 1.78, + "learning_rate": 3.2527458112819166e-05, + "loss": 0.0035, + "step": 353440 + }, + { + "epoch": 1.78, + "learning_rate": 3.2519890419805154e-05, + "loss": 0.0087, + "step": 353450 + }, + { + "epoch": 1.78, + "learning_rate": 3.251232272679114e-05, + "loss": 0.0055, + "step": 353460 + }, + { + "epoch": 1.78, + "learning_rate": 3.250475503377713e-05, + "loss": 0.0065, + "step": 353470 + }, + { + "epoch": 1.78, + "learning_rate": 3.2497187340763126e-05, + "loss": 0.0058, + "step": 353480 + }, + { + "epoch": 1.78, + "learning_rate": 3.2489619647749114e-05, + "loss": 0.0078, + "step": 353490 + }, + { + "epoch": 1.78, + "learning_rate": 3.24820519547351e-05, + "loss": 0.005, + "step": 353500 + }, + { + "epoch": 1.78, + "learning_rate": 3.247448426172109e-05, + "loss": 0.0069, + "step": 353510 + }, + { + "epoch": 1.78, + "learning_rate": 3.2466916568707085e-05, + "loss": 0.0073, + "step": 353520 + }, + { + "epoch": 1.78, + "learning_rate": 3.2459348875693073e-05, + "loss": 0.0044, + "step": 353530 + }, + { + "epoch": 1.78, + "learning_rate": 3.245178118267906e-05, + "loss": 0.005, + "step": 353540 + }, + { + "epoch": 1.78, + "learning_rate": 3.244421348966505e-05, + "loss": 0.0048, + "step": 353550 + }, + { + "epoch": 1.78, + "learning_rate": 3.2436645796651045e-05, + "loss": 0.0063, + "step": 353560 + }, + { + "epoch": 1.78, + "learning_rate": 3.242907810363703e-05, + "loss": 0.0058, + "step": 353570 + }, + { + "epoch": 1.78, + "learning_rate": 3.242151041062302e-05, + "loss": 0.0054, + "step": 353580 + }, + { + "epoch": 1.78, + "learning_rate": 3.241394271760901e-05, + "loss": 0.0058, + "step": 353590 + }, + { + "epoch": 1.78, + "learning_rate": 3.2406375024595e-05, + "loss": 0.0062, + "step": 353600 + }, + { + "epoch": 1.78, + "learning_rate": 3.2398807331580986e-05, + "loss": 0.0054, + "step": 353610 + }, + { + "epoch": 1.78, + "learning_rate": 3.239123963856698e-05, + "loss": 0.0071, + "step": 353620 + }, + { + "epoch": 1.78, + "learning_rate": 3.238367194555297e-05, + "loss": 0.0046, + "step": 353630 + }, + { + "epoch": 1.78, + "learning_rate": 3.237610425253896e-05, + "loss": 0.0053, + "step": 353640 + }, + { + "epoch": 1.78, + "learning_rate": 3.2368536559524946e-05, + "loss": 0.0085, + "step": 353650 + }, + { + "epoch": 1.78, + "learning_rate": 3.236096886651094e-05, + "loss": 0.0094, + "step": 353660 + }, + { + "epoch": 1.78, + "learning_rate": 3.235340117349693e-05, + "loss": 0.0066, + "step": 353670 + }, + { + "epoch": 1.78, + "learning_rate": 3.234583348048292e-05, + "loss": 0.0042, + "step": 353680 + }, + { + "epoch": 1.78, + "learning_rate": 3.2338265787468905e-05, + "loss": 0.0064, + "step": 353690 + }, + { + "epoch": 1.78, + "learning_rate": 3.23306980944549e-05, + "loss": 0.0064, + "step": 353700 + }, + { + "epoch": 1.78, + "learning_rate": 3.232313040144089e-05, + "loss": 0.0065, + "step": 353710 + }, + { + "epoch": 1.78, + "learning_rate": 3.231556270842688e-05, + "loss": 0.0071, + "step": 353720 + }, + { + "epoch": 1.78, + "learning_rate": 3.2307995015412865e-05, + "loss": 0.005, + "step": 353730 + }, + { + "epoch": 1.78, + "learning_rate": 3.230042732239885e-05, + "loss": 0.0076, + "step": 353740 + }, + { + "epoch": 1.78, + "learning_rate": 3.229285962938484e-05, + "loss": 0.0079, + "step": 353750 + }, + { + "epoch": 1.78, + "learning_rate": 3.228529193637083e-05, + "loss": 0.0043, + "step": 353760 + }, + { + "epoch": 1.78, + "learning_rate": 3.2277724243356825e-05, + "loss": 0.0055, + "step": 353770 + }, + { + "epoch": 1.78, + "learning_rate": 3.227015655034281e-05, + "loss": 0.0067, + "step": 353780 + }, + { + "epoch": 1.78, + "learning_rate": 3.22625888573288e-05, + "loss": 0.0056, + "step": 353790 + }, + { + "epoch": 1.78, + "learning_rate": 3.2255021164314796e-05, + "loss": 0.0065, + "step": 353800 + }, + { + "epoch": 1.79, + "learning_rate": 3.2247453471300784e-05, + "loss": 0.0066, + "step": 353810 + }, + { + "epoch": 1.79, + "learning_rate": 3.223988577828677e-05, + "loss": 0.0061, + "step": 353820 + }, + { + "epoch": 1.79, + "learning_rate": 3.223231808527276e-05, + "loss": 0.0085, + "step": 353830 + }, + { + "epoch": 1.79, + "learning_rate": 3.2224750392258756e-05, + "loss": 0.0033, + "step": 353840 + }, + { + "epoch": 1.79, + "learning_rate": 3.2217182699244744e-05, + "loss": 0.0059, + "step": 353850 + }, + { + "epoch": 1.79, + "learning_rate": 3.220961500623073e-05, + "loss": 0.0062, + "step": 353860 + }, + { + "epoch": 1.79, + "learning_rate": 3.220204731321672e-05, + "loss": 0.0058, + "step": 353870 + }, + { + "epoch": 1.79, + "learning_rate": 3.2194479620202715e-05, + "loss": 0.0045, + "step": 353880 + }, + { + "epoch": 1.79, + "learning_rate": 3.2186911927188704e-05, + "loss": 0.0052, + "step": 353890 + }, + { + "epoch": 1.79, + "learning_rate": 3.2179344234174685e-05, + "loss": 0.0056, + "step": 353900 + }, + { + "epoch": 1.79, + "learning_rate": 3.217177654116068e-05, + "loss": 0.0062, + "step": 353910 + }, + { + "epoch": 1.79, + "learning_rate": 3.216420884814667e-05, + "loss": 0.0062, + "step": 353920 + }, + { + "epoch": 1.79, + "learning_rate": 3.2156641155132656e-05, + "loss": 0.0081, + "step": 353930 + }, + { + "epoch": 1.79, + "learning_rate": 3.2149073462118645e-05, + "loss": 0.0058, + "step": 353940 + }, + { + "epoch": 1.79, + "learning_rate": 3.214150576910464e-05, + "loss": 0.0044, + "step": 353950 + }, + { + "epoch": 1.79, + "learning_rate": 3.213393807609063e-05, + "loss": 0.0054, + "step": 353960 + }, + { + "epoch": 1.79, + "learning_rate": 3.2126370383076616e-05, + "loss": 0.0076, + "step": 353970 + }, + { + "epoch": 1.79, + "learning_rate": 3.2118802690062604e-05, + "loss": 0.0058, + "step": 353980 + }, + { + "epoch": 1.79, + "learning_rate": 3.21112349970486e-05, + "loss": 0.0069, + "step": 353990 + }, + { + "epoch": 1.79, + "learning_rate": 3.210366730403459e-05, + "loss": 0.0051, + "step": 354000 + }, + { + "epoch": 1.79, + "eval_cer": 0.9144197953046413, + "eval_loss": 0.004529756028205156, + "eval_runtime": 116.782, + "eval_samples_per_second": 17.126, + "eval_steps_per_second": 4.281, + "step": 354000 + }, + { + "epoch": 1.79, + "learning_rate": 3.2096099611020576e-05, + "loss": 0.0069, + "step": 354010 + }, + { + "epoch": 1.79, + "learning_rate": 3.2088531918006564e-05, + "loss": 0.0073, + "step": 354020 + }, + { + "epoch": 1.79, + "learning_rate": 3.208096422499256e-05, + "loss": 0.0055, + "step": 354030 + }, + { + "epoch": 1.79, + "learning_rate": 3.207339653197855e-05, + "loss": 0.0066, + "step": 354040 + }, + { + "epoch": 1.79, + "learning_rate": 3.2065828838964535e-05, + "loss": 0.0061, + "step": 354050 + }, + { + "epoch": 1.79, + "learning_rate": 3.2058261145950524e-05, + "loss": 0.0063, + "step": 354060 + }, + { + "epoch": 1.79, + "learning_rate": 3.205069345293651e-05, + "loss": 0.0078, + "step": 354070 + }, + { + "epoch": 1.79, + "learning_rate": 3.20431257599225e-05, + "loss": 0.0059, + "step": 354080 + }, + { + "epoch": 1.79, + "learning_rate": 3.2035558066908495e-05, + "loss": 0.0059, + "step": 354090 + }, + { + "epoch": 1.79, + "learning_rate": 3.202799037389448e-05, + "loss": 0.0063, + "step": 354100 + }, + { + "epoch": 1.79, + "learning_rate": 3.202042268088047e-05, + "loss": 0.0072, + "step": 354110 + }, + { + "epoch": 1.79, + "learning_rate": 3.201285498786646e-05, + "loss": 0.0064, + "step": 354120 + }, + { + "epoch": 1.79, + "learning_rate": 3.2005287294852455e-05, + "loss": 0.0045, + "step": 354130 + }, + { + "epoch": 1.79, + "learning_rate": 3.199771960183844e-05, + "loss": 0.0072, + "step": 354140 + }, + { + "epoch": 1.79, + "learning_rate": 3.199015190882443e-05, + "loss": 0.0056, + "step": 354150 + }, + { + "epoch": 1.79, + "learning_rate": 3.198258421581042e-05, + "loss": 0.0113, + "step": 354160 + }, + { + "epoch": 1.79, + "learning_rate": 3.1975016522796414e-05, + "loss": 0.0064, + "step": 354170 + }, + { + "epoch": 1.79, + "learning_rate": 3.19674488297824e-05, + "loss": 0.0082, + "step": 354180 + }, + { + "epoch": 1.79, + "learning_rate": 3.195988113676839e-05, + "loss": 0.0063, + "step": 354190 + }, + { + "epoch": 1.79, + "learning_rate": 3.195231344375438e-05, + "loss": 0.0056, + "step": 354200 + }, + { + "epoch": 1.79, + "learning_rate": 3.194474575074037e-05, + "loss": 0.0058, + "step": 354210 + }, + { + "epoch": 1.79, + "learning_rate": 3.1937178057726355e-05, + "loss": 0.0054, + "step": 354220 + }, + { + "epoch": 1.79, + "learning_rate": 3.192961036471235e-05, + "loss": 0.0048, + "step": 354230 + }, + { + "epoch": 1.79, + "learning_rate": 3.192204267169834e-05, + "loss": 0.0055, + "step": 354240 + }, + { + "epoch": 1.79, + "learning_rate": 3.191447497868433e-05, + "loss": 0.0057, + "step": 354250 + }, + { + "epoch": 1.79, + "learning_rate": 3.1906907285670315e-05, + "loss": 0.0071, + "step": 354260 + }, + { + "epoch": 1.79, + "learning_rate": 3.189933959265631e-05, + "loss": 0.0059, + "step": 354270 + }, + { + "epoch": 1.79, + "learning_rate": 3.18917718996423e-05, + "loss": 0.0064, + "step": 354280 + }, + { + "epoch": 1.79, + "learning_rate": 3.1884204206628287e-05, + "loss": 0.0066, + "step": 354290 + }, + { + "epoch": 1.79, + "learning_rate": 3.1876636513614275e-05, + "loss": 0.0067, + "step": 354300 + }, + { + "epoch": 1.79, + "learning_rate": 3.186906882060027e-05, + "loss": 0.0059, + "step": 354310 + }, + { + "epoch": 1.79, + "learning_rate": 3.186150112758626e-05, + "loss": 0.007, + "step": 354320 + }, + { + "epoch": 1.79, + "learning_rate": 3.1853933434572246e-05, + "loss": 0.0065, + "step": 354330 + }, + { + "epoch": 1.79, + "learning_rate": 3.1846365741558234e-05, + "loss": 0.0062, + "step": 354340 + }, + { + "epoch": 1.79, + "learning_rate": 3.183879804854423e-05, + "loss": 0.0077, + "step": 354350 + }, + { + "epoch": 1.79, + "learning_rate": 3.183123035553022e-05, + "loss": 0.0062, + "step": 354360 + }, + { + "epoch": 1.79, + "learning_rate": 3.1823662662516206e-05, + "loss": 0.0074, + "step": 354370 + }, + { + "epoch": 1.79, + "learning_rate": 3.1816094969502194e-05, + "loss": 0.0086, + "step": 354380 + }, + { + "epoch": 1.79, + "learning_rate": 3.180852727648818e-05, + "loss": 0.0063, + "step": 354390 + }, + { + "epoch": 1.79, + "learning_rate": 3.180095958347417e-05, + "loss": 0.0074, + "step": 354400 + }, + { + "epoch": 1.79, + "learning_rate": 3.1793391890460165e-05, + "loss": 0.0051, + "step": 354410 + }, + { + "epoch": 1.79, + "learning_rate": 3.1785824197446154e-05, + "loss": 0.0077, + "step": 354420 + }, + { + "epoch": 1.79, + "learning_rate": 3.177825650443214e-05, + "loss": 0.0073, + "step": 354430 + }, + { + "epoch": 1.79, + "learning_rate": 3.177068881141813e-05, + "loss": 0.0068, + "step": 354440 + }, + { + "epoch": 1.79, + "learning_rate": 3.1763121118404125e-05, + "loss": 0.0048, + "step": 354450 + }, + { + "epoch": 1.79, + "learning_rate": 3.175555342539011e-05, + "loss": 0.0071, + "step": 354460 + }, + { + "epoch": 1.79, + "learning_rate": 3.17479857323761e-05, + "loss": 0.0048, + "step": 354470 + }, + { + "epoch": 1.79, + "learning_rate": 3.174041803936209e-05, + "loss": 0.0056, + "step": 354480 + }, + { + "epoch": 1.79, + "learning_rate": 3.1732850346348085e-05, + "loss": 0.0059, + "step": 354490 + }, + { + "epoch": 1.79, + "learning_rate": 3.172528265333407e-05, + "loss": 0.0053, + "step": 354500 + }, + { + "epoch": 1.79, + "learning_rate": 3.171771496032006e-05, + "loss": 0.005, + "step": 354510 + }, + { + "epoch": 1.79, + "learning_rate": 3.171014726730605e-05, + "loss": 0.007, + "step": 354520 + }, + { + "epoch": 1.79, + "learning_rate": 3.170257957429204e-05, + "loss": 0.0067, + "step": 354530 + }, + { + "epoch": 1.79, + "learning_rate": 3.1695011881278026e-05, + "loss": 0.005, + "step": 354540 + }, + { + "epoch": 1.79, + "learning_rate": 3.168744418826402e-05, + "loss": 0.0076, + "step": 354550 + }, + { + "epoch": 1.79, + "learning_rate": 3.167987649525001e-05, + "loss": 0.0054, + "step": 354560 + }, + { + "epoch": 1.79, + "learning_rate": 3.1672308802236e-05, + "loss": 0.004, + "step": 354570 + }, + { + "epoch": 1.79, + "learning_rate": 3.1664741109221986e-05, + "loss": 0.0068, + "step": 354580 + }, + { + "epoch": 1.79, + "learning_rate": 3.165717341620798e-05, + "loss": 0.0065, + "step": 354590 + }, + { + "epoch": 1.79, + "learning_rate": 3.164960572319397e-05, + "loss": 0.0076, + "step": 354600 + }, + { + "epoch": 1.79, + "learning_rate": 3.164203803017996e-05, + "loss": 0.0072, + "step": 354610 + }, + { + "epoch": 1.79, + "learning_rate": 3.1634470337165945e-05, + "loss": 0.0065, + "step": 354620 + }, + { + "epoch": 1.79, + "learning_rate": 3.162690264415194e-05, + "loss": 0.0055, + "step": 354630 + }, + { + "epoch": 1.79, + "learning_rate": 3.161933495113793e-05, + "loss": 0.0057, + "step": 354640 + }, + { + "epoch": 1.79, + "learning_rate": 3.1611767258123917e-05, + "loss": 0.0048, + "step": 354650 + }, + { + "epoch": 1.79, + "learning_rate": 3.1604199565109905e-05, + "loss": 0.0067, + "step": 354660 + }, + { + "epoch": 1.79, + "learning_rate": 3.15966318720959e-05, + "loss": 0.0064, + "step": 354670 + }, + { + "epoch": 1.79, + "learning_rate": 3.158906417908188e-05, + "loss": 0.0059, + "step": 354680 + }, + { + "epoch": 1.79, + "learning_rate": 3.158149648606787e-05, + "loss": 0.0044, + "step": 354690 + }, + { + "epoch": 1.79, + "learning_rate": 3.1573928793053864e-05, + "loss": 0.0069, + "step": 354700 + }, + { + "epoch": 1.79, + "learning_rate": 3.156636110003985e-05, + "loss": 0.0073, + "step": 354710 + }, + { + "epoch": 1.79, + "learning_rate": 3.155879340702584e-05, + "loss": 0.0057, + "step": 354720 + }, + { + "epoch": 1.79, + "learning_rate": 3.155122571401183e-05, + "loss": 0.0064, + "step": 354730 + }, + { + "epoch": 1.79, + "learning_rate": 3.1543658020997824e-05, + "loss": 0.0053, + "step": 354740 + }, + { + "epoch": 1.79, + "learning_rate": 3.153609032798381e-05, + "loss": 0.0062, + "step": 354750 + }, + { + "epoch": 1.79, + "learning_rate": 3.15285226349698e-05, + "loss": 0.0087, + "step": 354760 + }, + { + "epoch": 1.79, + "learning_rate": 3.1520954941955796e-05, + "loss": 0.0073, + "step": 354770 + }, + { + "epoch": 1.79, + "learning_rate": 3.1513387248941784e-05, + "loss": 0.0048, + "step": 354780 + }, + { + "epoch": 1.79, + "learning_rate": 3.150581955592777e-05, + "loss": 0.0047, + "step": 354790 + }, + { + "epoch": 1.79, + "learning_rate": 3.149825186291376e-05, + "loss": 0.0066, + "step": 354800 + }, + { + "epoch": 1.79, + "learning_rate": 3.1490684169899755e-05, + "loss": 0.0053, + "step": 354810 + }, + { + "epoch": 1.79, + "learning_rate": 3.1483116476885743e-05, + "loss": 0.0066, + "step": 354820 + }, + { + "epoch": 1.79, + "learning_rate": 3.147554878387173e-05, + "loss": 0.0065, + "step": 354830 + }, + { + "epoch": 1.79, + "learning_rate": 3.146798109085772e-05, + "loss": 0.006, + "step": 354840 + }, + { + "epoch": 1.79, + "learning_rate": 3.146041339784371e-05, + "loss": 0.0055, + "step": 354850 + }, + { + "epoch": 1.79, + "learning_rate": 3.1452845704829696e-05, + "loss": 0.0048, + "step": 354860 + }, + { + "epoch": 1.79, + "learning_rate": 3.1445278011815685e-05, + "loss": 0.0065, + "step": 354870 + }, + { + "epoch": 1.79, + "learning_rate": 3.143771031880168e-05, + "loss": 0.0061, + "step": 354880 + }, + { + "epoch": 1.79, + "learning_rate": 3.143014262578767e-05, + "loss": 0.0064, + "step": 354890 + }, + { + "epoch": 1.79, + "learning_rate": 3.1422574932773656e-05, + "loss": 0.008, + "step": 354900 + }, + { + "epoch": 1.79, + "learning_rate": 3.1415007239759644e-05, + "loss": 0.0046, + "step": 354910 + }, + { + "epoch": 1.79, + "learning_rate": 3.140743954674564e-05, + "loss": 0.0072, + "step": 354920 + }, + { + "epoch": 1.79, + "learning_rate": 3.139987185373163e-05, + "loss": 0.0054, + "step": 354930 + }, + { + "epoch": 1.79, + "learning_rate": 3.1392304160717616e-05, + "loss": 0.0056, + "step": 354940 + }, + { + "epoch": 1.79, + "learning_rate": 3.1384736467703604e-05, + "loss": 0.0065, + "step": 354950 + }, + { + "epoch": 1.79, + "learning_rate": 3.13771687746896e-05, + "loss": 0.0073, + "step": 354960 + }, + { + "epoch": 1.79, + "learning_rate": 3.136960108167559e-05, + "loss": 0.0052, + "step": 354970 + }, + { + "epoch": 1.79, + "learning_rate": 3.1362033388661575e-05, + "loss": 0.0064, + "step": 354980 + }, + { + "epoch": 1.79, + "learning_rate": 3.1354465695647563e-05, + "loss": 0.0048, + "step": 354990 + }, + { + "epoch": 1.79, + "learning_rate": 3.134689800263355e-05, + "loss": 0.006, + "step": 355000 + }, + { + "epoch": 1.79, + "eval_cer": 0.9144265880775191, + "eval_loss": 0.004483331926167011, + "eval_runtime": 116.7694, + "eval_samples_per_second": 17.128, + "eval_steps_per_second": 4.282, + "step": 355000 + }, + { + "epoch": 1.79, + "learning_rate": 3.133933030961954e-05, + "loss": 0.0064, + "step": 355010 + }, + { + "epoch": 1.79, + "learning_rate": 3.1331762616605535e-05, + "loss": 0.0053, + "step": 355020 + }, + { + "epoch": 1.79, + "learning_rate": 3.132419492359152e-05, + "loss": 0.0061, + "step": 355030 + }, + { + "epoch": 1.79, + "learning_rate": 3.131662723057751e-05, + "loss": 0.0045, + "step": 355040 + }, + { + "epoch": 1.79, + "learning_rate": 3.13090595375635e-05, + "loss": 0.0057, + "step": 355050 + }, + { + "epoch": 1.79, + "learning_rate": 3.1301491844549495e-05, + "loss": 0.0053, + "step": 355060 + }, + { + "epoch": 1.79, + "learning_rate": 3.129392415153548e-05, + "loss": 0.0064, + "step": 355070 + }, + { + "epoch": 1.79, + "learning_rate": 3.128635645852147e-05, + "loss": 0.0051, + "step": 355080 + }, + { + "epoch": 1.79, + "learning_rate": 3.127878876550746e-05, + "loss": 0.0088, + "step": 355090 + }, + { + "epoch": 1.79, + "learning_rate": 3.1271221072493454e-05, + "loss": 0.0071, + "step": 355100 + }, + { + "epoch": 1.79, + "learning_rate": 3.126365337947944e-05, + "loss": 0.0065, + "step": 355110 + }, + { + "epoch": 1.79, + "learning_rate": 3.125608568646543e-05, + "loss": 0.0063, + "step": 355120 + }, + { + "epoch": 1.79, + "learning_rate": 3.124851799345142e-05, + "loss": 0.0055, + "step": 355130 + }, + { + "epoch": 1.79, + "learning_rate": 3.1240950300437414e-05, + "loss": 0.0042, + "step": 355140 + }, + { + "epoch": 1.79, + "learning_rate": 3.1233382607423395e-05, + "loss": 0.0053, + "step": 355150 + }, + { + "epoch": 1.79, + "learning_rate": 3.122581491440939e-05, + "loss": 0.0043, + "step": 355160 + }, + { + "epoch": 1.79, + "learning_rate": 3.121824722139538e-05, + "loss": 0.0063, + "step": 355170 + }, + { + "epoch": 1.79, + "learning_rate": 3.121067952838137e-05, + "loss": 0.007, + "step": 355180 + }, + { + "epoch": 1.79, + "learning_rate": 3.1203111835367355e-05, + "loss": 0.0072, + "step": 355190 + }, + { + "epoch": 1.79, + "learning_rate": 3.119554414235335e-05, + "loss": 0.0075, + "step": 355200 + }, + { + "epoch": 1.79, + "learning_rate": 3.118797644933934e-05, + "loss": 0.006, + "step": 355210 + }, + { + "epoch": 1.79, + "learning_rate": 3.1180408756325326e-05, + "loss": 0.0059, + "step": 355220 + }, + { + "epoch": 1.79, + "learning_rate": 3.1172841063311315e-05, + "loss": 0.0076, + "step": 355230 + }, + { + "epoch": 1.79, + "learning_rate": 3.116527337029731e-05, + "loss": 0.0064, + "step": 355240 + }, + { + "epoch": 1.79, + "learning_rate": 3.11577056772833e-05, + "loss": 0.0044, + "step": 355250 + }, + { + "epoch": 1.79, + "learning_rate": 3.1150137984269286e-05, + "loss": 0.0054, + "step": 355260 + }, + { + "epoch": 1.79, + "learning_rate": 3.1142570291255274e-05, + "loss": 0.0054, + "step": 355270 + }, + { + "epoch": 1.79, + "learning_rate": 3.113500259824127e-05, + "loss": 0.0055, + "step": 355280 + }, + { + "epoch": 1.79, + "learning_rate": 3.112743490522726e-05, + "loss": 0.0071, + "step": 355290 + }, + { + "epoch": 1.79, + "learning_rate": 3.1119867212213246e-05, + "loss": 0.0045, + "step": 355300 + }, + { + "epoch": 1.79, + "learning_rate": 3.1112299519199234e-05, + "loss": 0.0075, + "step": 355310 + }, + { + "epoch": 1.79, + "learning_rate": 3.110473182618522e-05, + "loss": 0.0058, + "step": 355320 + }, + { + "epoch": 1.79, + "learning_rate": 3.109716413317121e-05, + "loss": 0.0053, + "step": 355330 + }, + { + "epoch": 1.79, + "learning_rate": 3.1089596440157205e-05, + "loss": 0.0053, + "step": 355340 + }, + { + "epoch": 1.79, + "learning_rate": 3.1082028747143194e-05, + "loss": 0.0032, + "step": 355350 + }, + { + "epoch": 1.79, + "learning_rate": 3.107446105412918e-05, + "loss": 0.0064, + "step": 355360 + }, + { + "epoch": 1.79, + "learning_rate": 3.106689336111517e-05, + "loss": 0.0048, + "step": 355370 + }, + { + "epoch": 1.79, + "learning_rate": 3.1059325668101165e-05, + "loss": 0.0061, + "step": 355380 + }, + { + "epoch": 1.79, + "learning_rate": 3.105175797508715e-05, + "loss": 0.0046, + "step": 355390 + }, + { + "epoch": 1.79, + "learning_rate": 3.104419028207314e-05, + "loss": 0.0058, + "step": 355400 + }, + { + "epoch": 1.79, + "learning_rate": 3.103662258905913e-05, + "loss": 0.009, + "step": 355410 + }, + { + "epoch": 1.79, + "learning_rate": 3.1029054896045125e-05, + "loss": 0.0056, + "step": 355420 + }, + { + "epoch": 1.79, + "learning_rate": 3.102148720303111e-05, + "loss": 0.0058, + "step": 355430 + }, + { + "epoch": 1.79, + "learning_rate": 3.10139195100171e-05, + "loss": 0.0049, + "step": 355440 + }, + { + "epoch": 1.79, + "learning_rate": 3.100635181700309e-05, + "loss": 0.0083, + "step": 355450 + }, + { + "epoch": 1.79, + "learning_rate": 3.0998784123989084e-05, + "loss": 0.0058, + "step": 355460 + }, + { + "epoch": 1.79, + "learning_rate": 3.0991216430975066e-05, + "loss": 0.0056, + "step": 355470 + }, + { + "epoch": 1.79, + "learning_rate": 3.098364873796106e-05, + "loss": 0.0054, + "step": 355480 + }, + { + "epoch": 1.79, + "learning_rate": 3.097608104494705e-05, + "loss": 0.0093, + "step": 355490 + }, + { + "epoch": 1.79, + "learning_rate": 3.096851335193304e-05, + "loss": 0.0048, + "step": 355500 + }, + { + "epoch": 1.79, + "learning_rate": 3.0960945658919025e-05, + "loss": 0.0056, + "step": 355510 + }, + { + "epoch": 1.79, + "learning_rate": 3.095337796590502e-05, + "loss": 0.0061, + "step": 355520 + }, + { + "epoch": 1.79, + "learning_rate": 3.094581027289101e-05, + "loss": 0.0058, + "step": 355530 + }, + { + "epoch": 1.79, + "learning_rate": 3.0938242579877e-05, + "loss": 0.0074, + "step": 355540 + }, + { + "epoch": 1.79, + "learning_rate": 3.0930674886862985e-05, + "loss": 0.006, + "step": 355550 + }, + { + "epoch": 1.79, + "learning_rate": 3.092310719384898e-05, + "loss": 0.0052, + "step": 355560 + }, + { + "epoch": 1.79, + "learning_rate": 3.091553950083497e-05, + "loss": 0.0059, + "step": 355570 + }, + { + "epoch": 1.79, + "learning_rate": 3.0907971807820956e-05, + "loss": 0.0047, + "step": 355580 + }, + { + "epoch": 1.79, + "learning_rate": 3.0900404114806945e-05, + "loss": 0.0061, + "step": 355590 + }, + { + "epoch": 1.79, + "learning_rate": 3.089283642179294e-05, + "loss": 0.0061, + "step": 355600 + }, + { + "epoch": 1.79, + "learning_rate": 3.088526872877893e-05, + "loss": 0.009, + "step": 355610 + }, + { + "epoch": 1.79, + "learning_rate": 3.0877701035764916e-05, + "loss": 0.0062, + "step": 355620 + }, + { + "epoch": 1.79, + "learning_rate": 3.0870133342750904e-05, + "loss": 0.0045, + "step": 355630 + }, + { + "epoch": 1.79, + "learning_rate": 3.086256564973689e-05, + "loss": 0.0058, + "step": 355640 + }, + { + "epoch": 1.79, + "learning_rate": 3.085499795672288e-05, + "loss": 0.0058, + "step": 355650 + }, + { + "epoch": 1.79, + "learning_rate": 3.084743026370887e-05, + "loss": 0.006, + "step": 355660 + }, + { + "epoch": 1.79, + "learning_rate": 3.0839862570694864e-05, + "loss": 0.0056, + "step": 355670 + }, + { + "epoch": 1.79, + "learning_rate": 3.083229487768085e-05, + "loss": 0.0071, + "step": 355680 + }, + { + "epoch": 1.79, + "learning_rate": 3.082472718466684e-05, + "loss": 0.006, + "step": 355690 + }, + { + "epoch": 1.79, + "learning_rate": 3.081715949165283e-05, + "loss": 0.0052, + "step": 355700 + }, + { + "epoch": 1.79, + "learning_rate": 3.0809591798638824e-05, + "loss": 0.0056, + "step": 355710 + }, + { + "epoch": 1.79, + "learning_rate": 3.080202410562481e-05, + "loss": 0.0051, + "step": 355720 + }, + { + "epoch": 1.79, + "learning_rate": 3.07944564126108e-05, + "loss": 0.007, + "step": 355730 + }, + { + "epoch": 1.79, + "learning_rate": 3.0786888719596795e-05, + "loss": 0.0045, + "step": 355740 + }, + { + "epoch": 1.79, + "learning_rate": 3.077932102658278e-05, + "loss": 0.0052, + "step": 355750 + }, + { + "epoch": 1.79, + "learning_rate": 3.077175333356877e-05, + "loss": 0.007, + "step": 355760 + }, + { + "epoch": 1.79, + "learning_rate": 3.076418564055476e-05, + "loss": 0.0086, + "step": 355770 + }, + { + "epoch": 1.79, + "learning_rate": 3.075661794754075e-05, + "loss": 0.0046, + "step": 355780 + }, + { + "epoch": 1.79, + "learning_rate": 3.0749050254526736e-05, + "loss": 0.0052, + "step": 355790 + }, + { + "epoch": 1.8, + "learning_rate": 3.0741482561512724e-05, + "loss": 0.0052, + "step": 355800 + }, + { + "epoch": 1.8, + "learning_rate": 3.073391486849872e-05, + "loss": 0.0052, + "step": 355810 + }, + { + "epoch": 1.8, + "learning_rate": 3.072634717548471e-05, + "loss": 0.0061, + "step": 355820 + }, + { + "epoch": 1.8, + "learning_rate": 3.0718779482470696e-05, + "loss": 0.0046, + "step": 355830 + }, + { + "epoch": 1.8, + "learning_rate": 3.0711211789456684e-05, + "loss": 0.0049, + "step": 355840 + }, + { + "epoch": 1.8, + "learning_rate": 3.070364409644268e-05, + "loss": 0.0061, + "step": 355850 + }, + { + "epoch": 1.8, + "learning_rate": 3.069607640342867e-05, + "loss": 0.0077, + "step": 355860 + }, + { + "epoch": 1.8, + "learning_rate": 3.0688508710414655e-05, + "loss": 0.0044, + "step": 355870 + }, + { + "epoch": 1.8, + "learning_rate": 3.0680941017400644e-05, + "loss": 0.0064, + "step": 355880 + }, + { + "epoch": 1.8, + "learning_rate": 3.067337332438664e-05, + "loss": 0.0053, + "step": 355890 + }, + { + "epoch": 1.8, + "learning_rate": 3.066580563137263e-05, + "loss": 0.0044, + "step": 355900 + }, + { + "epoch": 1.8, + "learning_rate": 3.0658237938358615e-05, + "loss": 0.0062, + "step": 355910 + }, + { + "epoch": 1.8, + "learning_rate": 3.06506702453446e-05, + "loss": 0.0064, + "step": 355920 + }, + { + "epoch": 1.8, + "learning_rate": 3.06431025523306e-05, + "loss": 0.0071, + "step": 355930 + }, + { + "epoch": 1.8, + "learning_rate": 3.063553485931658e-05, + "loss": 0.0051, + "step": 355940 + }, + { + "epoch": 1.8, + "learning_rate": 3.0627967166302575e-05, + "loss": 0.0045, + "step": 355950 + }, + { + "epoch": 1.8, + "learning_rate": 3.062039947328856e-05, + "loss": 0.0048, + "step": 355960 + }, + { + "epoch": 1.8, + "learning_rate": 3.061283178027455e-05, + "loss": 0.0049, + "step": 355970 + }, + { + "epoch": 1.8, + "learning_rate": 3.060526408726054e-05, + "loss": 0.0086, + "step": 355980 + }, + { + "epoch": 1.8, + "learning_rate": 3.0597696394246534e-05, + "loss": 0.0049, + "step": 355990 + }, + { + "epoch": 1.8, + "learning_rate": 3.059012870123252e-05, + "loss": 0.005, + "step": 356000 + }, + { + "epoch": 1.8, + "eval_cer": 0.9144130025317635, + "eval_loss": 0.0044956691563129425, + "eval_runtime": 116.7755, + "eval_samples_per_second": 17.127, + "eval_steps_per_second": 4.282, + "step": 356000 + }, + { + "epoch": 1.8, + "learning_rate": 3.058256100821851e-05, + "loss": 0.0047, + "step": 356010 + }, + { + "epoch": 1.8, + "learning_rate": 3.05749933152045e-05, + "loss": 0.0055, + "step": 356020 + }, + { + "epoch": 1.8, + "learning_rate": 3.0567425622190494e-05, + "loss": 0.0052, + "step": 356030 + }, + { + "epoch": 1.8, + "learning_rate": 3.055985792917648e-05, + "loss": 0.006, + "step": 356040 + }, + { + "epoch": 1.8, + "learning_rate": 3.055229023616247e-05, + "loss": 0.0087, + "step": 356050 + }, + { + "epoch": 1.8, + "learning_rate": 3.054472254314846e-05, + "loss": 0.0071, + "step": 356060 + }, + { + "epoch": 1.8, + "learning_rate": 3.0537154850134454e-05, + "loss": 0.0055, + "step": 356070 + }, + { + "epoch": 1.8, + "learning_rate": 3.052958715712044e-05, + "loss": 0.0057, + "step": 356080 + }, + { + "epoch": 1.8, + "learning_rate": 3.052201946410643e-05, + "loss": 0.0051, + "step": 356090 + }, + { + "epoch": 1.8, + "learning_rate": 3.051445177109242e-05, + "loss": 0.0056, + "step": 356100 + }, + { + "epoch": 1.8, + "learning_rate": 3.0506884078078407e-05, + "loss": 0.0062, + "step": 356110 + }, + { + "epoch": 1.8, + "learning_rate": 3.0499316385064398e-05, + "loss": 0.0046, + "step": 356120 + }, + { + "epoch": 1.8, + "learning_rate": 3.0491748692050386e-05, + "loss": 0.0079, + "step": 356130 + }, + { + "epoch": 1.8, + "learning_rate": 3.0484180999036378e-05, + "loss": 0.0063, + "step": 356140 + }, + { + "epoch": 1.8, + "learning_rate": 3.0476613306022366e-05, + "loss": 0.0073, + "step": 356150 + }, + { + "epoch": 1.8, + "learning_rate": 3.0469045613008358e-05, + "loss": 0.0049, + "step": 356160 + }, + { + "epoch": 1.8, + "learning_rate": 3.0461477919994346e-05, + "loss": 0.0083, + "step": 356170 + }, + { + "epoch": 1.8, + "learning_rate": 3.0453910226980338e-05, + "loss": 0.0052, + "step": 356180 + }, + { + "epoch": 1.8, + "learning_rate": 3.0446342533966326e-05, + "loss": 0.004, + "step": 356190 + }, + { + "epoch": 1.8, + "learning_rate": 3.0438774840952318e-05, + "loss": 0.0066, + "step": 356200 + }, + { + "epoch": 1.8, + "learning_rate": 3.0431207147938306e-05, + "loss": 0.0066, + "step": 356210 + }, + { + "epoch": 1.8, + "learning_rate": 3.0423639454924297e-05, + "loss": 0.0064, + "step": 356220 + }, + { + "epoch": 1.8, + "learning_rate": 3.0416071761910286e-05, + "loss": 0.0062, + "step": 356230 + }, + { + "epoch": 1.8, + "learning_rate": 3.0408504068896277e-05, + "loss": 0.0067, + "step": 356240 + }, + { + "epoch": 1.8, + "learning_rate": 3.0400936375882262e-05, + "loss": 0.0047, + "step": 356250 + }, + { + "epoch": 1.8, + "learning_rate": 3.0393368682868254e-05, + "loss": 0.0056, + "step": 356260 + }, + { + "epoch": 1.8, + "learning_rate": 3.0385800989854242e-05, + "loss": 0.0048, + "step": 356270 + }, + { + "epoch": 1.8, + "learning_rate": 3.0378233296840233e-05, + "loss": 0.0092, + "step": 356280 + }, + { + "epoch": 1.8, + "learning_rate": 3.037066560382622e-05, + "loss": 0.0062, + "step": 356290 + }, + { + "epoch": 1.8, + "learning_rate": 3.0363097910812213e-05, + "loss": 0.0042, + "step": 356300 + }, + { + "epoch": 1.8, + "learning_rate": 3.03555302177982e-05, + "loss": 0.0073, + "step": 356310 + }, + { + "epoch": 1.8, + "learning_rate": 3.0347962524784193e-05, + "loss": 0.0077, + "step": 356320 + }, + { + "epoch": 1.8, + "learning_rate": 3.034039483177018e-05, + "loss": 0.0072, + "step": 356330 + }, + { + "epoch": 1.8, + "learning_rate": 3.0332827138756173e-05, + "loss": 0.006, + "step": 356340 + }, + { + "epoch": 1.8, + "learning_rate": 3.032525944574216e-05, + "loss": 0.0058, + "step": 356350 + }, + { + "epoch": 1.8, + "learning_rate": 3.0317691752728153e-05, + "loss": 0.0056, + "step": 356360 + }, + { + "epoch": 1.8, + "learning_rate": 3.031012405971414e-05, + "loss": 0.0055, + "step": 356370 + }, + { + "epoch": 1.8, + "learning_rate": 3.0302556366700133e-05, + "loss": 0.0091, + "step": 356380 + }, + { + "epoch": 1.8, + "learning_rate": 3.029498867368612e-05, + "loss": 0.0079, + "step": 356390 + }, + { + "epoch": 1.8, + "learning_rate": 3.0287420980672112e-05, + "loss": 0.0073, + "step": 356400 + }, + { + "epoch": 1.8, + "learning_rate": 3.0279853287658097e-05, + "loss": 0.005, + "step": 356410 + }, + { + "epoch": 1.8, + "learning_rate": 3.0272285594644085e-05, + "loss": 0.0058, + "step": 356420 + }, + { + "epoch": 1.8, + "learning_rate": 3.0264717901630077e-05, + "loss": 0.0065, + "step": 356430 + }, + { + "epoch": 1.8, + "learning_rate": 3.0257150208616065e-05, + "loss": 0.0065, + "step": 356440 + }, + { + "epoch": 1.8, + "learning_rate": 3.0249582515602057e-05, + "loss": 0.0057, + "step": 356450 + }, + { + "epoch": 1.8, + "learning_rate": 3.024201482258805e-05, + "loss": 0.0058, + "step": 356460 + }, + { + "epoch": 1.8, + "learning_rate": 3.0234447129574037e-05, + "loss": 0.0057, + "step": 356470 + }, + { + "epoch": 1.8, + "learning_rate": 3.0226879436560028e-05, + "loss": 0.0058, + "step": 356480 + }, + { + "epoch": 1.8, + "learning_rate": 3.0219311743546017e-05, + "loss": 0.0075, + "step": 356490 + }, + { + "epoch": 1.8, + "learning_rate": 3.0211744050532008e-05, + "loss": 0.004, + "step": 356500 + }, + { + "epoch": 1.8, + "learning_rate": 3.0204176357517996e-05, + "loss": 0.0067, + "step": 356510 + }, + { + "epoch": 1.8, + "learning_rate": 3.0196608664503988e-05, + "loss": 0.0055, + "step": 356520 + }, + { + "epoch": 1.8, + "learning_rate": 3.0189040971489976e-05, + "loss": 0.0104, + "step": 356530 + }, + { + "epoch": 1.8, + "learning_rate": 3.0181473278475968e-05, + "loss": 0.0058, + "step": 356540 + }, + { + "epoch": 1.8, + "learning_rate": 3.0173905585461956e-05, + "loss": 0.0038, + "step": 356550 + }, + { + "epoch": 1.8, + "learning_rate": 3.0166337892447948e-05, + "loss": 0.0057, + "step": 356560 + }, + { + "epoch": 1.8, + "learning_rate": 3.0158770199433932e-05, + "loss": 0.0031, + "step": 356570 + }, + { + "epoch": 1.8, + "learning_rate": 3.015120250641992e-05, + "loss": 0.0049, + "step": 356580 + }, + { + "epoch": 1.8, + "learning_rate": 3.0143634813405912e-05, + "loss": 0.0059, + "step": 356590 + }, + { + "epoch": 1.8, + "learning_rate": 3.01360671203919e-05, + "loss": 0.0049, + "step": 356600 + }, + { + "epoch": 1.8, + "learning_rate": 3.0128499427377892e-05, + "loss": 0.0063, + "step": 356610 + }, + { + "epoch": 1.8, + "learning_rate": 3.012093173436388e-05, + "loss": 0.0051, + "step": 356620 + }, + { + "epoch": 1.8, + "learning_rate": 3.0113364041349872e-05, + "loss": 0.006, + "step": 356630 + }, + { + "epoch": 1.8, + "learning_rate": 3.010579634833586e-05, + "loss": 0.0051, + "step": 356640 + }, + { + "epoch": 1.8, + "learning_rate": 3.0098228655321852e-05, + "loss": 0.0052, + "step": 356650 + }, + { + "epoch": 1.8, + "learning_rate": 3.009066096230784e-05, + "loss": 0.0044, + "step": 356660 + }, + { + "epoch": 1.8, + "learning_rate": 3.008309326929383e-05, + "loss": 0.0072, + "step": 356670 + }, + { + "epoch": 1.8, + "learning_rate": 3.007552557627982e-05, + "loss": 0.0056, + "step": 356680 + }, + { + "epoch": 1.8, + "learning_rate": 3.006795788326581e-05, + "loss": 0.0071, + "step": 356690 + }, + { + "epoch": 1.8, + "learning_rate": 3.00603901902518e-05, + "loss": 0.0054, + "step": 356700 + }, + { + "epoch": 1.8, + "learning_rate": 3.005282249723779e-05, + "loss": 0.0047, + "step": 356710 + }, + { + "epoch": 1.8, + "learning_rate": 3.0045254804223783e-05, + "loss": 0.0075, + "step": 356720 + }, + { + "epoch": 1.8, + "learning_rate": 3.0037687111209768e-05, + "loss": 0.0047, + "step": 356730 + }, + { + "epoch": 1.8, + "learning_rate": 3.0030119418195756e-05, + "loss": 0.0061, + "step": 356740 + }, + { + "epoch": 1.8, + "learning_rate": 3.0022551725181747e-05, + "loss": 0.0066, + "step": 356750 + }, + { + "epoch": 1.8, + "learning_rate": 3.0014984032167736e-05, + "loss": 0.0065, + "step": 356760 + }, + { + "epoch": 1.8, + "learning_rate": 3.0007416339153727e-05, + "loss": 0.0051, + "step": 356770 + }, + { + "epoch": 1.8, + "learning_rate": 2.9999848646139716e-05, + "loss": 0.0065, + "step": 356780 + }, + { + "epoch": 1.8, + "learning_rate": 2.9992280953125707e-05, + "loss": 0.0065, + "step": 356790 + }, + { + "epoch": 1.8, + "learning_rate": 2.9984713260111695e-05, + "loss": 0.005, + "step": 356800 + }, + { + "epoch": 1.8, + "learning_rate": 2.9977145567097687e-05, + "loss": 0.0071, + "step": 356810 + }, + { + "epoch": 1.8, + "learning_rate": 2.9969577874083675e-05, + "loss": 0.0053, + "step": 356820 + }, + { + "epoch": 1.8, + "learning_rate": 2.9962010181069667e-05, + "loss": 0.0059, + "step": 356830 + }, + { + "epoch": 1.8, + "learning_rate": 2.9954442488055655e-05, + "loss": 0.0051, + "step": 356840 + }, + { + "epoch": 1.8, + "learning_rate": 2.9946874795041647e-05, + "loss": 0.0067, + "step": 356850 + }, + { + "epoch": 1.8, + "learning_rate": 2.9939307102027635e-05, + "loss": 0.0061, + "step": 356860 + }, + { + "epoch": 1.8, + "learning_rate": 2.9931739409013626e-05, + "loss": 0.0066, + "step": 356870 + }, + { + "epoch": 1.8, + "learning_rate": 2.992417171599961e-05, + "loss": 0.0053, + "step": 356880 + }, + { + "epoch": 1.8, + "learning_rate": 2.9916604022985603e-05, + "loss": 0.0063, + "step": 356890 + }, + { + "epoch": 1.8, + "learning_rate": 2.990903632997159e-05, + "loss": 0.0073, + "step": 356900 + }, + { + "epoch": 1.8, + "learning_rate": 2.9901468636957583e-05, + "loss": 0.008, + "step": 356910 + }, + { + "epoch": 1.8, + "learning_rate": 2.989390094394357e-05, + "loss": 0.0055, + "step": 356920 + }, + { + "epoch": 1.8, + "learning_rate": 2.9886333250929563e-05, + "loss": 0.0048, + "step": 356930 + }, + { + "epoch": 1.8, + "learning_rate": 2.987876555791555e-05, + "loss": 0.0065, + "step": 356940 + }, + { + "epoch": 1.8, + "learning_rate": 2.9871197864901542e-05, + "loss": 0.0063, + "step": 356950 + }, + { + "epoch": 1.8, + "learning_rate": 2.986363017188753e-05, + "loss": 0.0072, + "step": 356960 + }, + { + "epoch": 1.8, + "learning_rate": 2.9856062478873522e-05, + "loss": 0.0048, + "step": 356970 + }, + { + "epoch": 1.8, + "learning_rate": 2.984849478585951e-05, + "loss": 0.0053, + "step": 356980 + }, + { + "epoch": 1.8, + "learning_rate": 2.9840927092845502e-05, + "loss": 0.0047, + "step": 356990 + }, + { + "epoch": 1.8, + "learning_rate": 2.983335939983149e-05, + "loss": 0.0061, + "step": 357000 + }, + { + "epoch": 1.8, + "eval_cer": 0.9144139729278888, + "eval_loss": 0.004504029173403978, + "eval_runtime": 116.8007, + "eval_samples_per_second": 17.123, + "eval_steps_per_second": 4.281, + "step": 357000 + }, + { + "epoch": 1.8, + "learning_rate": 2.9825791706817482e-05, + "loss": 0.0057, + "step": 357010 + }, + { + "epoch": 1.8, + "learning_rate": 2.981822401380347e-05, + "loss": 0.0074, + "step": 357020 + }, + { + "epoch": 1.8, + "learning_rate": 2.981065632078946e-05, + "loss": 0.0063, + "step": 357030 + }, + { + "epoch": 1.8, + "learning_rate": 2.9803088627775446e-05, + "loss": 0.0048, + "step": 357040 + }, + { + "epoch": 1.8, + "learning_rate": 2.9795520934761438e-05, + "loss": 0.0068, + "step": 357050 + }, + { + "epoch": 1.8, + "learning_rate": 2.9787953241747426e-05, + "loss": 0.0072, + "step": 357060 + }, + { + "epoch": 1.8, + "learning_rate": 2.9780385548733418e-05, + "loss": 0.006, + "step": 357070 + }, + { + "epoch": 1.8, + "learning_rate": 2.9772817855719406e-05, + "loss": 0.0052, + "step": 357080 + }, + { + "epoch": 1.8, + "learning_rate": 2.9765250162705398e-05, + "loss": 0.0061, + "step": 357090 + }, + { + "epoch": 1.8, + "learning_rate": 2.9757682469691386e-05, + "loss": 0.0069, + "step": 357100 + }, + { + "epoch": 1.8, + "learning_rate": 2.9750114776677378e-05, + "loss": 0.0077, + "step": 357110 + }, + { + "epoch": 1.8, + "learning_rate": 2.9742547083663366e-05, + "loss": 0.0031, + "step": 357120 + }, + { + "epoch": 1.8, + "learning_rate": 2.9734979390649357e-05, + "loss": 0.0046, + "step": 357130 + }, + { + "epoch": 1.8, + "learning_rate": 2.9727411697635346e-05, + "loss": 0.0067, + "step": 357140 + }, + { + "epoch": 1.8, + "learning_rate": 2.9719844004621337e-05, + "loss": 0.0053, + "step": 357150 + }, + { + "epoch": 1.8, + "learning_rate": 2.9712276311607325e-05, + "loss": 0.0041, + "step": 357160 + }, + { + "epoch": 1.8, + "learning_rate": 2.9704708618593317e-05, + "loss": 0.0084, + "step": 357170 + }, + { + "epoch": 1.8, + "learning_rate": 2.9697140925579305e-05, + "loss": 0.005, + "step": 357180 + }, + { + "epoch": 1.8, + "learning_rate": 2.9689573232565297e-05, + "loss": 0.0074, + "step": 357190 + }, + { + "epoch": 1.8, + "learning_rate": 2.968200553955128e-05, + "loss": 0.011, + "step": 357200 + }, + { + "epoch": 1.8, + "learning_rate": 2.9674437846537273e-05, + "loss": 0.0068, + "step": 357210 + }, + { + "epoch": 1.8, + "learning_rate": 2.966687015352326e-05, + "loss": 0.0044, + "step": 357220 + }, + { + "epoch": 1.8, + "learning_rate": 2.9659302460509253e-05, + "loss": 0.0077, + "step": 357230 + }, + { + "epoch": 1.8, + "learning_rate": 2.965173476749524e-05, + "loss": 0.0072, + "step": 357240 + }, + { + "epoch": 1.8, + "learning_rate": 2.9644167074481233e-05, + "loss": 0.0061, + "step": 357250 + }, + { + "epoch": 1.8, + "learning_rate": 2.963659938146722e-05, + "loss": 0.0044, + "step": 357260 + }, + { + "epoch": 1.8, + "learning_rate": 2.9629031688453213e-05, + "loss": 0.0044, + "step": 357270 + }, + { + "epoch": 1.8, + "learning_rate": 2.96214639954392e-05, + "loss": 0.008, + "step": 357280 + }, + { + "epoch": 1.8, + "learning_rate": 2.9613896302425193e-05, + "loss": 0.0048, + "step": 357290 + }, + { + "epoch": 1.8, + "learning_rate": 2.960632860941118e-05, + "loss": 0.0053, + "step": 357300 + }, + { + "epoch": 1.8, + "learning_rate": 2.9598760916397172e-05, + "loss": 0.0058, + "step": 357310 + }, + { + "epoch": 1.8, + "learning_rate": 2.959119322338316e-05, + "loss": 0.0065, + "step": 357320 + }, + { + "epoch": 1.8, + "learning_rate": 2.9583625530369152e-05, + "loss": 0.0045, + "step": 357330 + }, + { + "epoch": 1.8, + "learning_rate": 2.957605783735514e-05, + "loss": 0.0059, + "step": 357340 + }, + { + "epoch": 1.8, + "learning_rate": 2.9568490144341125e-05, + "loss": 0.0061, + "step": 357350 + }, + { + "epoch": 1.8, + "learning_rate": 2.9560922451327117e-05, + "loss": 0.0051, + "step": 357360 + }, + { + "epoch": 1.8, + "learning_rate": 2.9553354758313105e-05, + "loss": 0.0058, + "step": 357370 + }, + { + "epoch": 1.8, + "learning_rate": 2.9545787065299097e-05, + "loss": 0.0067, + "step": 357380 + }, + { + "epoch": 1.8, + "learning_rate": 2.9538219372285085e-05, + "loss": 0.0051, + "step": 357390 + }, + { + "epoch": 1.8, + "learning_rate": 2.9530651679271077e-05, + "loss": 0.0057, + "step": 357400 + }, + { + "epoch": 1.8, + "learning_rate": 2.9523083986257065e-05, + "loss": 0.0065, + "step": 357410 + }, + { + "epoch": 1.8, + "learning_rate": 2.9515516293243056e-05, + "loss": 0.0054, + "step": 357420 + }, + { + "epoch": 1.8, + "learning_rate": 2.9507948600229048e-05, + "loss": 0.0049, + "step": 357430 + }, + { + "epoch": 1.8, + "learning_rate": 2.9500380907215036e-05, + "loss": 0.0047, + "step": 357440 + }, + { + "epoch": 1.8, + "learning_rate": 2.9492813214201028e-05, + "loss": 0.0056, + "step": 357450 + }, + { + "epoch": 1.8, + "learning_rate": 2.9485245521187016e-05, + "loss": 0.0084, + "step": 357460 + }, + { + "epoch": 1.8, + "learning_rate": 2.9477677828173008e-05, + "loss": 0.0066, + "step": 357470 + }, + { + "epoch": 1.8, + "learning_rate": 2.9470110135158996e-05, + "loss": 0.007, + "step": 357480 + }, + { + "epoch": 1.8, + "learning_rate": 2.9462542442144987e-05, + "loss": 0.0054, + "step": 357490 + }, + { + "epoch": 1.8, + "learning_rate": 2.9454974749130976e-05, + "loss": 0.0049, + "step": 357500 + }, + { + "epoch": 1.8, + "learning_rate": 2.944740705611696e-05, + "loss": 0.0056, + "step": 357510 + }, + { + "epoch": 1.8, + "learning_rate": 2.9439839363102952e-05, + "loss": 0.006, + "step": 357520 + }, + { + "epoch": 1.8, + "learning_rate": 2.943227167008894e-05, + "loss": 0.0063, + "step": 357530 + }, + { + "epoch": 1.8, + "learning_rate": 2.9424703977074932e-05, + "loss": 0.0048, + "step": 357540 + }, + { + "epoch": 1.8, + "learning_rate": 2.941713628406092e-05, + "loss": 0.0061, + "step": 357550 + }, + { + "epoch": 1.8, + "learning_rate": 2.9409568591046912e-05, + "loss": 0.006, + "step": 357560 + }, + { + "epoch": 1.8, + "learning_rate": 2.94020008980329e-05, + "loss": 0.0059, + "step": 357570 + }, + { + "epoch": 1.8, + "learning_rate": 2.939443320501889e-05, + "loss": 0.0077, + "step": 357580 + }, + { + "epoch": 1.8, + "learning_rate": 2.938686551200488e-05, + "loss": 0.0057, + "step": 357590 + }, + { + "epoch": 1.8, + "learning_rate": 2.937929781899087e-05, + "loss": 0.0061, + "step": 357600 + }, + { + "epoch": 1.8, + "learning_rate": 2.937173012597686e-05, + "loss": 0.0055, + "step": 357610 + }, + { + "epoch": 1.8, + "learning_rate": 2.936416243296285e-05, + "loss": 0.0061, + "step": 357620 + }, + { + "epoch": 1.8, + "learning_rate": 2.935659473994884e-05, + "loss": 0.0054, + "step": 357630 + }, + { + "epoch": 1.8, + "learning_rate": 2.934902704693483e-05, + "loss": 0.0048, + "step": 357640 + }, + { + "epoch": 1.8, + "learning_rate": 2.934145935392082e-05, + "loss": 0.0059, + "step": 357650 + }, + { + "epoch": 1.8, + "learning_rate": 2.933389166090681e-05, + "loss": 0.0051, + "step": 357660 + }, + { + "epoch": 1.8, + "learning_rate": 2.9326323967892796e-05, + "loss": 0.0069, + "step": 357670 + }, + { + "epoch": 1.8, + "learning_rate": 2.9318756274878787e-05, + "loss": 0.0069, + "step": 357680 + }, + { + "epoch": 1.8, + "learning_rate": 2.9311188581864776e-05, + "loss": 0.0061, + "step": 357690 + }, + { + "epoch": 1.8, + "learning_rate": 2.9303620888850767e-05, + "loss": 0.0049, + "step": 357700 + }, + { + "epoch": 1.8, + "learning_rate": 2.9296053195836755e-05, + "loss": 0.007, + "step": 357710 + }, + { + "epoch": 1.8, + "learning_rate": 2.9288485502822747e-05, + "loss": 0.0053, + "step": 357720 + }, + { + "epoch": 1.8, + "learning_rate": 2.9280917809808735e-05, + "loss": 0.0079, + "step": 357730 + }, + { + "epoch": 1.8, + "learning_rate": 2.9273350116794727e-05, + "loss": 0.0074, + "step": 357740 + }, + { + "epoch": 1.8, + "learning_rate": 2.9265782423780715e-05, + "loss": 0.0097, + "step": 357750 + }, + { + "epoch": 1.8, + "learning_rate": 2.9258214730766707e-05, + "loss": 0.0051, + "step": 357760 + }, + { + "epoch": 1.8, + "learning_rate": 2.9250647037752695e-05, + "loss": 0.0054, + "step": 357770 + }, + { + "epoch": 1.81, + "learning_rate": 2.9243079344738686e-05, + "loss": 0.0065, + "step": 357780 + }, + { + "epoch": 1.81, + "learning_rate": 2.9235511651724675e-05, + "loss": 0.0065, + "step": 357790 + }, + { + "epoch": 1.81, + "learning_rate": 2.9227943958710666e-05, + "loss": 0.0074, + "step": 357800 + }, + { + "epoch": 1.81, + "learning_rate": 2.9220376265696655e-05, + "loss": 0.0054, + "step": 357810 + }, + { + "epoch": 1.81, + "learning_rate": 2.9212808572682643e-05, + "loss": 0.0062, + "step": 357820 + }, + { + "epoch": 1.81, + "learning_rate": 2.920524087966863e-05, + "loss": 0.0064, + "step": 357830 + }, + { + "epoch": 1.81, + "learning_rate": 2.9197673186654623e-05, + "loss": 0.0068, + "step": 357840 + }, + { + "epoch": 1.81, + "learning_rate": 2.919010549364061e-05, + "loss": 0.0054, + "step": 357850 + }, + { + "epoch": 1.81, + "learning_rate": 2.9182537800626602e-05, + "loss": 0.0061, + "step": 357860 + }, + { + "epoch": 1.81, + "learning_rate": 2.917497010761259e-05, + "loss": 0.0075, + "step": 357870 + }, + { + "epoch": 1.81, + "learning_rate": 2.9167402414598582e-05, + "loss": 0.0053, + "step": 357880 + }, + { + "epoch": 1.81, + "learning_rate": 2.915983472158457e-05, + "loss": 0.0065, + "step": 357890 + }, + { + "epoch": 1.81, + "learning_rate": 2.9152267028570562e-05, + "loss": 0.0058, + "step": 357900 + }, + { + "epoch": 1.81, + "learning_rate": 2.914469933555655e-05, + "loss": 0.0052, + "step": 357910 + }, + { + "epoch": 1.81, + "learning_rate": 2.9137131642542542e-05, + "loss": 0.0056, + "step": 357920 + }, + { + "epoch": 1.81, + "learning_rate": 2.912956394952853e-05, + "loss": 0.0074, + "step": 357930 + }, + { + "epoch": 1.81, + "learning_rate": 2.912199625651452e-05, + "loss": 0.0075, + "step": 357940 + }, + { + "epoch": 1.81, + "learning_rate": 2.911442856350051e-05, + "loss": 0.0053, + "step": 357950 + }, + { + "epoch": 1.81, + "learning_rate": 2.91068608704865e-05, + "loss": 0.0077, + "step": 357960 + }, + { + "epoch": 1.81, + "learning_rate": 2.909929317747249e-05, + "loss": 0.0072, + "step": 357970 + }, + { + "epoch": 1.81, + "learning_rate": 2.9091725484458478e-05, + "loss": 0.0036, + "step": 357980 + }, + { + "epoch": 1.81, + "learning_rate": 2.9084157791444466e-05, + "loss": 0.0061, + "step": 357990 + }, + { + "epoch": 1.81, + "learning_rate": 2.9076590098430458e-05, + "loss": 0.0079, + "step": 358000 + }, + { + "epoch": 1.81, + "eval_cer": 0.9144353216426477, + "eval_loss": 0.004471032880246639, + "eval_runtime": 116.5217, + "eval_samples_per_second": 17.164, + "eval_steps_per_second": 4.291, + "step": 358000 + }, + { + "epoch": 1.81, + "learning_rate": 2.9069022405416446e-05, + "loss": 0.0062, + "step": 358010 + }, + { + "epoch": 1.81, + "learning_rate": 2.9061454712402438e-05, + "loss": 0.007, + "step": 358020 + }, + { + "epoch": 1.81, + "learning_rate": 2.9053887019388426e-05, + "loss": 0.0066, + "step": 358030 + }, + { + "epoch": 1.81, + "learning_rate": 2.9046319326374417e-05, + "loss": 0.0092, + "step": 358040 + }, + { + "epoch": 1.81, + "learning_rate": 2.9038751633360406e-05, + "loss": 0.0076, + "step": 358050 + }, + { + "epoch": 1.81, + "learning_rate": 2.9031183940346397e-05, + "loss": 0.0057, + "step": 358060 + }, + { + "epoch": 1.81, + "learning_rate": 2.9023616247332385e-05, + "loss": 0.0057, + "step": 358070 + }, + { + "epoch": 1.81, + "learning_rate": 2.9016048554318377e-05, + "loss": 0.005, + "step": 358080 + }, + { + "epoch": 1.81, + "learning_rate": 2.9008480861304365e-05, + "loss": 0.0064, + "step": 358090 + }, + { + "epoch": 1.81, + "learning_rate": 2.9000913168290357e-05, + "loss": 0.0067, + "step": 358100 + }, + { + "epoch": 1.81, + "learning_rate": 2.8993345475276345e-05, + "loss": 0.0092, + "step": 358110 + }, + { + "epoch": 1.81, + "learning_rate": 2.8985777782262337e-05, + "loss": 0.006, + "step": 358120 + }, + { + "epoch": 1.81, + "learning_rate": 2.8978210089248325e-05, + "loss": 0.0065, + "step": 358130 + }, + { + "epoch": 1.81, + "learning_rate": 2.8970642396234313e-05, + "loss": 0.0053, + "step": 358140 + }, + { + "epoch": 1.81, + "learning_rate": 2.89630747032203e-05, + "loss": 0.0052, + "step": 358150 + }, + { + "epoch": 1.81, + "learning_rate": 2.8955507010206293e-05, + "loss": 0.0041, + "step": 358160 + }, + { + "epoch": 1.81, + "learning_rate": 2.894793931719228e-05, + "loss": 0.005, + "step": 358170 + }, + { + "epoch": 1.81, + "learning_rate": 2.8940371624178273e-05, + "loss": 0.0078, + "step": 358180 + }, + { + "epoch": 1.81, + "learning_rate": 2.893280393116426e-05, + "loss": 0.0055, + "step": 358190 + }, + { + "epoch": 1.81, + "learning_rate": 2.8925236238150253e-05, + "loss": 0.0056, + "step": 358200 + }, + { + "epoch": 1.81, + "learning_rate": 2.891766854513624e-05, + "loss": 0.0062, + "step": 358210 + }, + { + "epoch": 1.81, + "learning_rate": 2.8910100852122232e-05, + "loss": 0.0051, + "step": 358220 + }, + { + "epoch": 1.81, + "learning_rate": 2.890253315910822e-05, + "loss": 0.0067, + "step": 358230 + }, + { + "epoch": 1.81, + "learning_rate": 2.8894965466094212e-05, + "loss": 0.0067, + "step": 358240 + }, + { + "epoch": 1.81, + "learning_rate": 2.88873977730802e-05, + "loss": 0.0075, + "step": 358250 + }, + { + "epoch": 1.81, + "learning_rate": 2.8879830080066192e-05, + "loss": 0.0066, + "step": 358260 + }, + { + "epoch": 1.81, + "learning_rate": 2.887226238705218e-05, + "loss": 0.0061, + "step": 358270 + }, + { + "epoch": 1.81, + "learning_rate": 2.8864694694038172e-05, + "loss": 0.0055, + "step": 358280 + }, + { + "epoch": 1.81, + "learning_rate": 2.885712700102416e-05, + "loss": 0.0077, + "step": 358290 + }, + { + "epoch": 1.81, + "learning_rate": 2.8849559308010145e-05, + "loss": 0.0058, + "step": 358300 + }, + { + "epoch": 1.81, + "learning_rate": 2.8841991614996137e-05, + "loss": 0.0062, + "step": 358310 + }, + { + "epoch": 1.81, + "learning_rate": 2.8834423921982125e-05, + "loss": 0.0038, + "step": 358320 + }, + { + "epoch": 1.81, + "learning_rate": 2.8826856228968116e-05, + "loss": 0.0077, + "step": 358330 + }, + { + "epoch": 1.81, + "learning_rate": 2.8819288535954105e-05, + "loss": 0.0065, + "step": 358340 + }, + { + "epoch": 1.81, + "learning_rate": 2.8811720842940096e-05, + "loss": 0.0053, + "step": 358350 + }, + { + "epoch": 1.81, + "learning_rate": 2.8804153149926084e-05, + "loss": 0.0059, + "step": 358360 + }, + { + "epoch": 1.81, + "learning_rate": 2.8796585456912076e-05, + "loss": 0.0056, + "step": 358370 + }, + { + "epoch": 1.81, + "learning_rate": 2.8789017763898064e-05, + "loss": 0.0081, + "step": 358380 + }, + { + "epoch": 1.81, + "learning_rate": 2.8781450070884056e-05, + "loss": 0.0075, + "step": 358390 + }, + { + "epoch": 1.81, + "learning_rate": 2.8773882377870048e-05, + "loss": 0.0079, + "step": 358400 + }, + { + "epoch": 1.81, + "learning_rate": 2.8766314684856036e-05, + "loss": 0.0058, + "step": 358410 + }, + { + "epoch": 1.81, + "learning_rate": 2.8758746991842027e-05, + "loss": 0.0059, + "step": 358420 + }, + { + "epoch": 1.81, + "learning_rate": 2.8751179298828016e-05, + "loss": 0.0052, + "step": 358430 + }, + { + "epoch": 1.81, + "learning_rate": 2.8743611605814007e-05, + "loss": 0.0047, + "step": 358440 + }, + { + "epoch": 1.81, + "learning_rate": 2.8736043912799992e-05, + "loss": 0.0057, + "step": 358450 + }, + { + "epoch": 1.81, + "learning_rate": 2.872847621978598e-05, + "loss": 0.0066, + "step": 358460 + }, + { + "epoch": 1.81, + "learning_rate": 2.8720908526771972e-05, + "loss": 0.0065, + "step": 358470 + }, + { + "epoch": 1.81, + "learning_rate": 2.871334083375796e-05, + "loss": 0.0056, + "step": 358480 + }, + { + "epoch": 1.81, + "learning_rate": 2.870577314074395e-05, + "loss": 0.0066, + "step": 358490 + }, + { + "epoch": 1.81, + "learning_rate": 2.869820544772994e-05, + "loss": 0.0057, + "step": 358500 + }, + { + "epoch": 1.81, + "learning_rate": 2.869063775471593e-05, + "loss": 0.006, + "step": 358510 + }, + { + "epoch": 1.81, + "learning_rate": 2.868307006170192e-05, + "loss": 0.0064, + "step": 358520 + }, + { + "epoch": 1.81, + "learning_rate": 2.867550236868791e-05, + "loss": 0.0069, + "step": 358530 + }, + { + "epoch": 1.81, + "learning_rate": 2.86679346756739e-05, + "loss": 0.0065, + "step": 358540 + }, + { + "epoch": 1.81, + "learning_rate": 2.866036698265989e-05, + "loss": 0.0046, + "step": 358550 + }, + { + "epoch": 1.81, + "learning_rate": 2.865279928964588e-05, + "loss": 0.0058, + "step": 358560 + }, + { + "epoch": 1.81, + "learning_rate": 2.864523159663187e-05, + "loss": 0.0069, + "step": 358570 + }, + { + "epoch": 1.81, + "learning_rate": 2.863766390361786e-05, + "loss": 0.0066, + "step": 358580 + }, + { + "epoch": 1.81, + "learning_rate": 2.863009621060385e-05, + "loss": 0.0065, + "step": 358590 + }, + { + "epoch": 1.81, + "learning_rate": 2.862252851758984e-05, + "loss": 0.0074, + "step": 358600 + }, + { + "epoch": 1.81, + "learning_rate": 2.8614960824575827e-05, + "loss": 0.0041, + "step": 358610 + }, + { + "epoch": 1.81, + "learning_rate": 2.8607393131561815e-05, + "loss": 0.0051, + "step": 358620 + }, + { + "epoch": 1.81, + "learning_rate": 2.8599825438547807e-05, + "loss": 0.0069, + "step": 358630 + }, + { + "epoch": 1.81, + "learning_rate": 2.8592257745533795e-05, + "loss": 0.0049, + "step": 358640 + }, + { + "epoch": 1.81, + "learning_rate": 2.8584690052519787e-05, + "loss": 0.0074, + "step": 358650 + }, + { + "epoch": 1.81, + "learning_rate": 2.8577122359505775e-05, + "loss": 0.0068, + "step": 358660 + }, + { + "epoch": 1.81, + "learning_rate": 2.8569554666491767e-05, + "loss": 0.0071, + "step": 358670 + }, + { + "epoch": 1.81, + "learning_rate": 2.8561986973477755e-05, + "loss": 0.0072, + "step": 358680 + }, + { + "epoch": 1.81, + "learning_rate": 2.8554419280463747e-05, + "loss": 0.0061, + "step": 358690 + }, + { + "epoch": 1.81, + "learning_rate": 2.8546851587449735e-05, + "loss": 0.006, + "step": 358700 + }, + { + "epoch": 1.81, + "learning_rate": 2.8539283894435726e-05, + "loss": 0.0052, + "step": 358710 + }, + { + "epoch": 1.81, + "learning_rate": 2.8531716201421715e-05, + "loss": 0.0063, + "step": 358720 + }, + { + "epoch": 1.81, + "learning_rate": 2.8524148508407706e-05, + "loss": 0.0047, + "step": 358730 + }, + { + "epoch": 1.81, + "learning_rate": 2.8516580815393694e-05, + "loss": 0.0073, + "step": 358740 + }, + { + "epoch": 1.81, + "learning_rate": 2.8509013122379686e-05, + "loss": 0.0047, + "step": 358750 + }, + { + "epoch": 1.81, + "learning_rate": 2.8501445429365674e-05, + "loss": 0.0063, + "step": 358760 + }, + { + "epoch": 1.81, + "learning_rate": 2.8493877736351662e-05, + "loss": 0.0066, + "step": 358770 + }, + { + "epoch": 1.81, + "learning_rate": 2.848631004333765e-05, + "loss": 0.0092, + "step": 358780 + }, + { + "epoch": 1.81, + "learning_rate": 2.8478742350323642e-05, + "loss": 0.0044, + "step": 358790 + }, + { + "epoch": 1.81, + "learning_rate": 2.847117465730963e-05, + "loss": 0.0055, + "step": 358800 + }, + { + "epoch": 1.81, + "learning_rate": 2.8463606964295622e-05, + "loss": 0.0067, + "step": 358810 + }, + { + "epoch": 1.81, + "learning_rate": 2.845603927128161e-05, + "loss": 0.0046, + "step": 358820 + }, + { + "epoch": 1.81, + "learning_rate": 2.8448471578267602e-05, + "loss": 0.0059, + "step": 358830 + }, + { + "epoch": 1.81, + "learning_rate": 2.844090388525359e-05, + "loss": 0.0054, + "step": 358840 + }, + { + "epoch": 1.81, + "learning_rate": 2.8433336192239582e-05, + "loss": 0.0067, + "step": 358850 + }, + { + "epoch": 1.81, + "learning_rate": 2.842576849922557e-05, + "loss": 0.0062, + "step": 358860 + }, + { + "epoch": 1.81, + "learning_rate": 2.841820080621156e-05, + "loss": 0.008, + "step": 358870 + }, + { + "epoch": 1.81, + "learning_rate": 2.841063311319755e-05, + "loss": 0.0059, + "step": 358880 + }, + { + "epoch": 1.81, + "learning_rate": 2.840306542018354e-05, + "loss": 0.0058, + "step": 358890 + }, + { + "epoch": 1.81, + "learning_rate": 2.839549772716953e-05, + "loss": 0.0058, + "step": 358900 + }, + { + "epoch": 1.81, + "learning_rate": 2.838793003415552e-05, + "loss": 0.0068, + "step": 358910 + }, + { + "epoch": 1.81, + "learning_rate": 2.8380362341141506e-05, + "loss": 0.0058, + "step": 358920 + }, + { + "epoch": 1.81, + "learning_rate": 2.8372794648127498e-05, + "loss": 0.0049, + "step": 358930 + }, + { + "epoch": 1.81, + "learning_rate": 2.8365226955113486e-05, + "loss": 0.0073, + "step": 358940 + }, + { + "epoch": 1.81, + "learning_rate": 2.8357659262099477e-05, + "loss": 0.0047, + "step": 358950 + }, + { + "epoch": 1.81, + "learning_rate": 2.8350091569085466e-05, + "loss": 0.0046, + "step": 358960 + }, + { + "epoch": 1.81, + "learning_rate": 2.8342523876071457e-05, + "loss": 0.004, + "step": 358970 + }, + { + "epoch": 1.81, + "learning_rate": 2.8334956183057446e-05, + "loss": 0.0052, + "step": 358980 + }, + { + "epoch": 1.81, + "learning_rate": 2.8327388490043437e-05, + "loss": 0.0059, + "step": 358990 + }, + { + "epoch": 1.81, + "learning_rate": 2.8319820797029425e-05, + "loss": 0.0065, + "step": 359000 + }, + { + "epoch": 1.81, + "eval_cer": 0.9144217360968921, + "eval_loss": 0.004385951440781355, + "eval_runtime": 116.7254, + "eval_samples_per_second": 17.134, + "eval_steps_per_second": 4.284, + "step": 359000 + }, + { + "epoch": 1.81, + "learning_rate": 2.8312253104015417e-05, + "loss": 0.0066, + "step": 359010 + }, + { + "epoch": 1.81, + "learning_rate": 2.8304685411001405e-05, + "loss": 0.0076, + "step": 359020 + }, + { + "epoch": 1.81, + "learning_rate": 2.8297117717987397e-05, + "loss": 0.0056, + "step": 359030 + }, + { + "epoch": 1.81, + "learning_rate": 2.8289550024973385e-05, + "loss": 0.0047, + "step": 359040 + }, + { + "epoch": 1.81, + "learning_rate": 2.8281982331959377e-05, + "loss": 0.0052, + "step": 359050 + }, + { + "epoch": 1.81, + "learning_rate": 2.8274414638945365e-05, + "loss": 0.0079, + "step": 359060 + }, + { + "epoch": 1.81, + "learning_rate": 2.8266846945931356e-05, + "loss": 0.0053, + "step": 359070 + }, + { + "epoch": 1.81, + "learning_rate": 2.825927925291734e-05, + "loss": 0.0071, + "step": 359080 + }, + { + "epoch": 1.81, + "learning_rate": 2.825171155990333e-05, + "loss": 0.0071, + "step": 359090 + }, + { + "epoch": 1.81, + "learning_rate": 2.824414386688932e-05, + "loss": 0.0053, + "step": 359100 + }, + { + "epoch": 1.81, + "learning_rate": 2.8236576173875313e-05, + "loss": 0.0052, + "step": 359110 + }, + { + "epoch": 1.81, + "learning_rate": 2.82290084808613e-05, + "loss": 0.0076, + "step": 359120 + }, + { + "epoch": 1.81, + "learning_rate": 2.8221440787847293e-05, + "loss": 0.0054, + "step": 359130 + }, + { + "epoch": 1.81, + "learning_rate": 2.821387309483328e-05, + "loss": 0.0067, + "step": 359140 + }, + { + "epoch": 1.81, + "learning_rate": 2.8206305401819272e-05, + "loss": 0.0045, + "step": 359150 + }, + { + "epoch": 1.81, + "learning_rate": 2.819873770880526e-05, + "loss": 0.0044, + "step": 359160 + }, + { + "epoch": 1.81, + "learning_rate": 2.8191170015791252e-05, + "loss": 0.004, + "step": 359170 + }, + { + "epoch": 1.81, + "learning_rate": 2.818360232277724e-05, + "loss": 0.0063, + "step": 359180 + }, + { + "epoch": 1.81, + "learning_rate": 2.8176034629763232e-05, + "loss": 0.0052, + "step": 359190 + }, + { + "epoch": 1.81, + "learning_rate": 2.816846693674922e-05, + "loss": 0.005, + "step": 359200 + }, + { + "epoch": 1.81, + "learning_rate": 2.8160899243735212e-05, + "loss": 0.007, + "step": 359210 + }, + { + "epoch": 1.81, + "learning_rate": 2.81533315507212e-05, + "loss": 0.0076, + "step": 359220 + }, + { + "epoch": 1.81, + "learning_rate": 2.814576385770719e-05, + "loss": 0.0062, + "step": 359230 + }, + { + "epoch": 1.81, + "learning_rate": 2.8138196164693176e-05, + "loss": 0.0054, + "step": 359240 + }, + { + "epoch": 1.81, + "learning_rate": 2.8130628471679165e-05, + "loss": 0.0068, + "step": 359250 + }, + { + "epoch": 1.81, + "learning_rate": 2.8123060778665156e-05, + "loss": 0.0081, + "step": 359260 + }, + { + "epoch": 1.81, + "learning_rate": 2.8115493085651145e-05, + "loss": 0.0052, + "step": 359270 + }, + { + "epoch": 1.81, + "learning_rate": 2.8107925392637136e-05, + "loss": 0.0054, + "step": 359280 + }, + { + "epoch": 1.81, + "learning_rate": 2.8100357699623124e-05, + "loss": 0.0065, + "step": 359290 + }, + { + "epoch": 1.81, + "learning_rate": 2.8092790006609116e-05, + "loss": 0.0041, + "step": 359300 + }, + { + "epoch": 1.81, + "learning_rate": 2.8085222313595104e-05, + "loss": 0.0068, + "step": 359310 + }, + { + "epoch": 1.81, + "learning_rate": 2.8077654620581096e-05, + "loss": 0.0066, + "step": 359320 + }, + { + "epoch": 1.81, + "learning_rate": 2.8070086927567084e-05, + "loss": 0.0066, + "step": 359330 + }, + { + "epoch": 1.81, + "learning_rate": 2.8062519234553076e-05, + "loss": 0.0041, + "step": 359340 + }, + { + "epoch": 1.81, + "learning_rate": 2.8054951541539064e-05, + "loss": 0.006, + "step": 359350 + }, + { + "epoch": 1.81, + "learning_rate": 2.8047383848525055e-05, + "loss": 0.0081, + "step": 359360 + }, + { + "epoch": 1.81, + "learning_rate": 2.8039816155511047e-05, + "loss": 0.0053, + "step": 359370 + }, + { + "epoch": 1.81, + "learning_rate": 2.8032248462497035e-05, + "loss": 0.0066, + "step": 359380 + }, + { + "epoch": 1.81, + "learning_rate": 2.8024680769483027e-05, + "loss": 0.0047, + "step": 359390 + }, + { + "epoch": 1.81, + "learning_rate": 2.801711307646901e-05, + "loss": 0.0052, + "step": 359400 + }, + { + "epoch": 1.81, + "learning_rate": 2.8009545383455e-05, + "loss": 0.0101, + "step": 359410 + }, + { + "epoch": 1.81, + "learning_rate": 2.800197769044099e-05, + "loss": 0.0105, + "step": 359420 + }, + { + "epoch": 1.81, + "learning_rate": 2.799440999742698e-05, + "loss": 0.0047, + "step": 359430 + }, + { + "epoch": 1.81, + "learning_rate": 2.798684230441297e-05, + "loss": 0.0063, + "step": 359440 + }, + { + "epoch": 1.81, + "learning_rate": 2.797927461139896e-05, + "loss": 0.0055, + "step": 359450 + }, + { + "epoch": 1.81, + "learning_rate": 2.797170691838495e-05, + "loss": 0.0061, + "step": 359460 + }, + { + "epoch": 1.81, + "learning_rate": 2.796413922537094e-05, + "loss": 0.0055, + "step": 359470 + }, + { + "epoch": 1.81, + "learning_rate": 2.795657153235693e-05, + "loss": 0.0067, + "step": 359480 + }, + { + "epoch": 1.81, + "learning_rate": 2.794900383934292e-05, + "loss": 0.0061, + "step": 359490 + }, + { + "epoch": 1.81, + "learning_rate": 2.794143614632891e-05, + "loss": 0.0044, + "step": 359500 + }, + { + "epoch": 1.81, + "learning_rate": 2.79338684533149e-05, + "loss": 0.0049, + "step": 359510 + }, + { + "epoch": 1.81, + "learning_rate": 2.792630076030089e-05, + "loss": 0.0061, + "step": 359520 + }, + { + "epoch": 1.81, + "learning_rate": 2.791873306728688e-05, + "loss": 0.0046, + "step": 359530 + }, + { + "epoch": 1.81, + "learning_rate": 2.791116537427287e-05, + "loss": 0.0055, + "step": 359540 + }, + { + "epoch": 1.81, + "learning_rate": 2.7903597681258855e-05, + "loss": 0.0067, + "step": 359550 + }, + { + "epoch": 1.81, + "learning_rate": 2.7896029988244847e-05, + "loss": 0.0064, + "step": 359560 + }, + { + "epoch": 1.81, + "learning_rate": 2.7888462295230835e-05, + "loss": 0.0055, + "step": 359570 + }, + { + "epoch": 1.81, + "learning_rate": 2.7880894602216827e-05, + "loss": 0.0054, + "step": 359580 + }, + { + "epoch": 1.81, + "learning_rate": 2.7873326909202815e-05, + "loss": 0.0102, + "step": 359590 + }, + { + "epoch": 1.81, + "learning_rate": 2.7865759216188807e-05, + "loss": 0.0068, + "step": 359600 + }, + { + "epoch": 1.81, + "learning_rate": 2.7858191523174795e-05, + "loss": 0.0067, + "step": 359610 + }, + { + "epoch": 1.81, + "learning_rate": 2.7850623830160786e-05, + "loss": 0.0047, + "step": 359620 + }, + { + "epoch": 1.81, + "learning_rate": 2.7843056137146775e-05, + "loss": 0.0068, + "step": 359630 + }, + { + "epoch": 1.81, + "learning_rate": 2.7835488444132766e-05, + "loss": 0.0063, + "step": 359640 + }, + { + "epoch": 1.81, + "learning_rate": 2.7827920751118754e-05, + "loss": 0.008, + "step": 359650 + }, + { + "epoch": 1.81, + "learning_rate": 2.7820353058104746e-05, + "loss": 0.0058, + "step": 359660 + }, + { + "epoch": 1.81, + "learning_rate": 2.7812785365090734e-05, + "loss": 0.0055, + "step": 359670 + }, + { + "epoch": 1.81, + "learning_rate": 2.7805217672076726e-05, + "loss": 0.0066, + "step": 359680 + }, + { + "epoch": 1.81, + "learning_rate": 2.7797649979062714e-05, + "loss": 0.0077, + "step": 359690 + }, + { + "epoch": 1.81, + "learning_rate": 2.7790082286048706e-05, + "loss": 0.0082, + "step": 359700 + }, + { + "epoch": 1.81, + "learning_rate": 2.778251459303469e-05, + "loss": 0.0055, + "step": 359710 + }, + { + "epoch": 1.81, + "learning_rate": 2.7774946900020682e-05, + "loss": 0.0069, + "step": 359720 + }, + { + "epoch": 1.81, + "learning_rate": 2.776737920700667e-05, + "loss": 0.0083, + "step": 359730 + }, + { + "epoch": 1.81, + "learning_rate": 2.7759811513992662e-05, + "loss": 0.0053, + "step": 359740 + }, + { + "epoch": 1.81, + "learning_rate": 2.775224382097865e-05, + "loss": 0.0048, + "step": 359750 + }, + { + "epoch": 1.82, + "learning_rate": 2.7744676127964642e-05, + "loss": 0.0055, + "step": 359760 + }, + { + "epoch": 1.82, + "learning_rate": 2.773710843495063e-05, + "loss": 0.006, + "step": 359770 + }, + { + "epoch": 1.82, + "learning_rate": 2.772954074193662e-05, + "loss": 0.0056, + "step": 359780 + }, + { + "epoch": 1.82, + "learning_rate": 2.772197304892261e-05, + "loss": 0.0043, + "step": 359790 + }, + { + "epoch": 1.82, + "learning_rate": 2.77144053559086e-05, + "loss": 0.0061, + "step": 359800 + }, + { + "epoch": 1.82, + "learning_rate": 2.770683766289459e-05, + "loss": 0.0079, + "step": 359810 + }, + { + "epoch": 1.82, + "learning_rate": 2.769926996988058e-05, + "loss": 0.0067, + "step": 359820 + }, + { + "epoch": 1.82, + "learning_rate": 2.769170227686657e-05, + "loss": 0.0063, + "step": 359830 + }, + { + "epoch": 1.82, + "learning_rate": 2.768413458385256e-05, + "loss": 0.0048, + "step": 359840 + }, + { + "epoch": 1.82, + "learning_rate": 2.767656689083855e-05, + "loss": 0.0062, + "step": 359850 + }, + { + "epoch": 1.82, + "learning_rate": 2.766899919782454e-05, + "loss": 0.0091, + "step": 359860 + }, + { + "epoch": 1.82, + "learning_rate": 2.7661431504810526e-05, + "loss": 0.0055, + "step": 359870 + }, + { + "epoch": 1.82, + "learning_rate": 2.7653863811796517e-05, + "loss": 0.0074, + "step": 359880 + }, + { + "epoch": 1.82, + "learning_rate": 2.7646296118782506e-05, + "loss": 0.0074, + "step": 359890 + }, + { + "epoch": 1.82, + "learning_rate": 2.7638728425768497e-05, + "loss": 0.006, + "step": 359900 + }, + { + "epoch": 1.82, + "learning_rate": 2.7631160732754485e-05, + "loss": 0.005, + "step": 359910 + }, + { + "epoch": 1.82, + "learning_rate": 2.7623593039740477e-05, + "loss": 0.0066, + "step": 359920 + }, + { + "epoch": 1.82, + "learning_rate": 2.7616025346726465e-05, + "loss": 0.0063, + "step": 359930 + }, + { + "epoch": 1.82, + "learning_rate": 2.7608457653712457e-05, + "loss": 0.0047, + "step": 359940 + }, + { + "epoch": 1.82, + "learning_rate": 2.7600889960698445e-05, + "loss": 0.0057, + "step": 359950 + }, + { + "epoch": 1.82, + "learning_rate": 2.7593322267684437e-05, + "loss": 0.0074, + "step": 359960 + }, + { + "epoch": 1.82, + "learning_rate": 2.7585754574670425e-05, + "loss": 0.007, + "step": 359970 + }, + { + "epoch": 1.82, + "learning_rate": 2.7578186881656416e-05, + "loss": 0.0047, + "step": 359980 + }, + { + "epoch": 1.82, + "learning_rate": 2.7570619188642405e-05, + "loss": 0.0048, + "step": 359990 + }, + { + "epoch": 1.82, + "learning_rate": 2.7563051495628396e-05, + "loss": 0.0062, + "step": 360000 + }, + { + "epoch": 1.82, + "eval_cer": 0.9144062097588856, + "eval_loss": 0.0043929265812039375, + "eval_runtime": 116.599, + "eval_samples_per_second": 17.153, + "eval_steps_per_second": 4.288, + "step": 360000 + }, + { + "epoch": 1.82, + "learning_rate": 2.7555483802614385e-05, + "loss": 0.0062, + "step": 360010 + }, + { + "epoch": 1.82, + "learning_rate": 2.754791610960037e-05, + "loss": 0.0045, + "step": 360020 + }, + { + "epoch": 1.82, + "learning_rate": 2.754034841658636e-05, + "loss": 0.0056, + "step": 360030 + }, + { + "epoch": 1.82, + "learning_rate": 2.753278072357235e-05, + "loss": 0.0054, + "step": 360040 + }, + { + "epoch": 1.82, + "learning_rate": 2.752521303055834e-05, + "loss": 0.0068, + "step": 360050 + }, + { + "epoch": 1.82, + "learning_rate": 2.751764533754433e-05, + "loss": 0.0068, + "step": 360060 + }, + { + "epoch": 1.82, + "learning_rate": 2.751007764453032e-05, + "loss": 0.0061, + "step": 360070 + }, + { + "epoch": 1.82, + "learning_rate": 2.7502509951516312e-05, + "loss": 0.0055, + "step": 360080 + }, + { + "epoch": 1.82, + "learning_rate": 2.74949422585023e-05, + "loss": 0.0047, + "step": 360090 + }, + { + "epoch": 1.82, + "learning_rate": 2.7487374565488292e-05, + "loss": 0.0057, + "step": 360100 + }, + { + "epoch": 1.82, + "learning_rate": 2.747980687247428e-05, + "loss": 0.0058, + "step": 360110 + }, + { + "epoch": 1.82, + "learning_rate": 2.7472239179460272e-05, + "loss": 0.0076, + "step": 360120 + }, + { + "epoch": 1.82, + "learning_rate": 2.746467148644626e-05, + "loss": 0.0048, + "step": 360130 + }, + { + "epoch": 1.82, + "learning_rate": 2.745710379343225e-05, + "loss": 0.0059, + "step": 360140 + }, + { + "epoch": 1.82, + "learning_rate": 2.744953610041824e-05, + "loss": 0.0064, + "step": 360150 + }, + { + "epoch": 1.82, + "learning_rate": 2.744196840740423e-05, + "loss": 0.0056, + "step": 360160 + }, + { + "epoch": 1.82, + "learning_rate": 2.743440071439022e-05, + "loss": 0.0048, + "step": 360170 + }, + { + "epoch": 1.82, + "learning_rate": 2.7426833021376205e-05, + "loss": 0.0056, + "step": 360180 + }, + { + "epoch": 1.82, + "learning_rate": 2.7419265328362196e-05, + "loss": 0.0053, + "step": 360190 + }, + { + "epoch": 1.82, + "learning_rate": 2.7411697635348184e-05, + "loss": 0.0065, + "step": 360200 + }, + { + "epoch": 1.82, + "learning_rate": 2.7404129942334176e-05, + "loss": 0.0051, + "step": 360210 + }, + { + "epoch": 1.82, + "learning_rate": 2.7396562249320164e-05, + "loss": 0.0063, + "step": 360220 + }, + { + "epoch": 1.82, + "learning_rate": 2.7388994556306156e-05, + "loss": 0.0052, + "step": 360230 + }, + { + "epoch": 1.82, + "learning_rate": 2.7381426863292144e-05, + "loss": 0.0051, + "step": 360240 + }, + { + "epoch": 1.82, + "learning_rate": 2.7373859170278136e-05, + "loss": 0.0059, + "step": 360250 + }, + { + "epoch": 1.82, + "learning_rate": 2.7366291477264124e-05, + "loss": 0.0054, + "step": 360260 + }, + { + "epoch": 1.82, + "learning_rate": 2.7358723784250115e-05, + "loss": 0.0048, + "step": 360270 + }, + { + "epoch": 1.82, + "learning_rate": 2.7351156091236104e-05, + "loss": 0.0048, + "step": 360280 + }, + { + "epoch": 1.82, + "learning_rate": 2.7343588398222095e-05, + "loss": 0.0056, + "step": 360290 + }, + { + "epoch": 1.82, + "learning_rate": 2.7336020705208084e-05, + "loss": 0.0051, + "step": 360300 + }, + { + "epoch": 1.82, + "learning_rate": 2.7328453012194075e-05, + "loss": 0.0045, + "step": 360310 + }, + { + "epoch": 1.82, + "learning_rate": 2.7320885319180063e-05, + "loss": 0.0113, + "step": 360320 + }, + { + "epoch": 1.82, + "learning_rate": 2.7313317626166055e-05, + "loss": 0.0082, + "step": 360330 + }, + { + "epoch": 1.82, + "learning_rate": 2.730574993315204e-05, + "loss": 0.0063, + "step": 360340 + }, + { + "epoch": 1.82, + "learning_rate": 2.729818224013803e-05, + "loss": 0.006, + "step": 360350 + }, + { + "epoch": 1.82, + "learning_rate": 2.729061454712402e-05, + "loss": 0.0074, + "step": 360360 + }, + { + "epoch": 1.82, + "learning_rate": 2.728304685411001e-05, + "loss": 0.0053, + "step": 360370 + }, + { + "epoch": 1.82, + "learning_rate": 2.7275479161096e-05, + "loss": 0.0054, + "step": 360380 + }, + { + "epoch": 1.82, + "learning_rate": 2.726791146808199e-05, + "loss": 0.0063, + "step": 360390 + }, + { + "epoch": 1.82, + "learning_rate": 2.726034377506798e-05, + "loss": 0.0048, + "step": 360400 + }, + { + "epoch": 1.82, + "learning_rate": 2.725277608205397e-05, + "loss": 0.0064, + "step": 360410 + }, + { + "epoch": 1.82, + "learning_rate": 2.724520838903996e-05, + "loss": 0.0049, + "step": 360420 + }, + { + "epoch": 1.82, + "learning_rate": 2.723764069602595e-05, + "loss": 0.0059, + "step": 360430 + }, + { + "epoch": 1.82, + "learning_rate": 2.723007300301194e-05, + "loss": 0.0106, + "step": 360440 + }, + { + "epoch": 1.82, + "learning_rate": 2.722250530999793e-05, + "loss": 0.0067, + "step": 360450 + }, + { + "epoch": 1.82, + "learning_rate": 2.721493761698392e-05, + "loss": 0.0059, + "step": 360460 + }, + { + "epoch": 1.82, + "learning_rate": 2.720736992396991e-05, + "loss": 0.008, + "step": 360470 + }, + { + "epoch": 1.82, + "learning_rate": 2.71998022309559e-05, + "loss": 0.0051, + "step": 360480 + }, + { + "epoch": 1.82, + "learning_rate": 2.719223453794189e-05, + "loss": 0.0041, + "step": 360490 + }, + { + "epoch": 1.82, + "learning_rate": 2.7184666844927875e-05, + "loss": 0.0056, + "step": 360500 + }, + { + "epoch": 1.82, + "learning_rate": 2.7177099151913867e-05, + "loss": 0.0052, + "step": 360510 + }, + { + "epoch": 1.82, + "learning_rate": 2.7169531458899855e-05, + "loss": 0.0053, + "step": 360520 + }, + { + "epoch": 1.82, + "learning_rate": 2.7161963765885846e-05, + "loss": 0.0062, + "step": 360530 + }, + { + "epoch": 1.82, + "learning_rate": 2.7154396072871835e-05, + "loss": 0.0051, + "step": 360540 + }, + { + "epoch": 1.82, + "learning_rate": 2.7146828379857826e-05, + "loss": 0.0052, + "step": 360550 + }, + { + "epoch": 1.82, + "learning_rate": 2.7139260686843814e-05, + "loss": 0.0064, + "step": 360560 + }, + { + "epoch": 1.82, + "learning_rate": 2.7131692993829806e-05, + "loss": 0.0047, + "step": 360570 + }, + { + "epoch": 1.82, + "learning_rate": 2.7124125300815794e-05, + "loss": 0.0066, + "step": 360580 + }, + { + "epoch": 1.82, + "learning_rate": 2.7116557607801786e-05, + "loss": 0.0045, + "step": 360590 + }, + { + "epoch": 1.82, + "learning_rate": 2.7108989914787774e-05, + "loss": 0.0078, + "step": 360600 + }, + { + "epoch": 1.82, + "learning_rate": 2.7101422221773766e-05, + "loss": 0.0072, + "step": 360610 + }, + { + "epoch": 1.82, + "learning_rate": 2.7093854528759754e-05, + "loss": 0.0058, + "step": 360620 + }, + { + "epoch": 1.82, + "learning_rate": 2.7086286835745746e-05, + "loss": 0.0043, + "step": 360630 + }, + { + "epoch": 1.82, + "learning_rate": 2.7078719142731734e-05, + "loss": 0.0078, + "step": 360640 + }, + { + "epoch": 1.82, + "learning_rate": 2.7071151449717722e-05, + "loss": 0.0047, + "step": 360650 + }, + { + "epoch": 1.82, + "learning_rate": 2.706358375670371e-05, + "loss": 0.0066, + "step": 360660 + }, + { + "epoch": 1.82, + "learning_rate": 2.7056016063689702e-05, + "loss": 0.0058, + "step": 360670 + }, + { + "epoch": 1.82, + "learning_rate": 2.704844837067569e-05, + "loss": 0.005, + "step": 360680 + }, + { + "epoch": 1.82, + "learning_rate": 2.704088067766168e-05, + "loss": 0.0067, + "step": 360690 + }, + { + "epoch": 1.82, + "learning_rate": 2.703331298464767e-05, + "loss": 0.0082, + "step": 360700 + }, + { + "epoch": 1.82, + "learning_rate": 2.702574529163366e-05, + "loss": 0.0062, + "step": 360710 + }, + { + "epoch": 1.82, + "learning_rate": 2.701817759861965e-05, + "loss": 0.013, + "step": 360720 + }, + { + "epoch": 1.82, + "learning_rate": 2.701060990560564e-05, + "loss": 0.0068, + "step": 360730 + }, + { + "epoch": 1.82, + "learning_rate": 2.700304221259163e-05, + "loss": 0.0064, + "step": 360740 + }, + { + "epoch": 1.82, + "learning_rate": 2.699547451957762e-05, + "loss": 0.0074, + "step": 360750 + }, + { + "epoch": 1.82, + "learning_rate": 2.698790682656361e-05, + "loss": 0.0058, + "step": 360760 + }, + { + "epoch": 1.82, + "learning_rate": 2.69803391335496e-05, + "loss": 0.0029, + "step": 360770 + }, + { + "epoch": 1.82, + "learning_rate": 2.697277144053559e-05, + "loss": 0.0085, + "step": 360780 + }, + { + "epoch": 1.82, + "learning_rate": 2.696520374752158e-05, + "loss": 0.0093, + "step": 360790 + }, + { + "epoch": 1.82, + "learning_rate": 2.695763605450757e-05, + "loss": 0.0061, + "step": 360800 + }, + { + "epoch": 1.82, + "learning_rate": 2.6950068361493557e-05, + "loss": 0.0061, + "step": 360810 + }, + { + "epoch": 1.82, + "learning_rate": 2.6942500668479545e-05, + "loss": 0.0066, + "step": 360820 + }, + { + "epoch": 1.82, + "learning_rate": 2.6934932975465537e-05, + "loss": 0.0062, + "step": 360830 + }, + { + "epoch": 1.82, + "learning_rate": 2.6927365282451525e-05, + "loss": 0.0064, + "step": 360840 + }, + { + "epoch": 1.82, + "learning_rate": 2.6919797589437517e-05, + "loss": 0.005, + "step": 360850 + }, + { + "epoch": 1.82, + "learning_rate": 2.6912229896423505e-05, + "loss": 0.0067, + "step": 360860 + }, + { + "epoch": 1.82, + "learning_rate": 2.6904662203409497e-05, + "loss": 0.005, + "step": 360870 + }, + { + "epoch": 1.82, + "learning_rate": 2.6897094510395485e-05, + "loss": 0.0059, + "step": 360880 + }, + { + "epoch": 1.82, + "learning_rate": 2.6889526817381477e-05, + "loss": 0.005, + "step": 360890 + }, + { + "epoch": 1.82, + "learning_rate": 2.6881959124367465e-05, + "loss": 0.0093, + "step": 360900 + }, + { + "epoch": 1.82, + "learning_rate": 2.6874391431353456e-05, + "loss": 0.0057, + "step": 360910 + }, + { + "epoch": 1.82, + "learning_rate": 2.6866823738339445e-05, + "loss": 0.0088, + "step": 360920 + }, + { + "epoch": 1.82, + "learning_rate": 2.6859256045325436e-05, + "loss": 0.0055, + "step": 360930 + }, + { + "epoch": 1.82, + "learning_rate": 2.6851688352311424e-05, + "loss": 0.0049, + "step": 360940 + }, + { + "epoch": 1.82, + "learning_rate": 2.6844120659297416e-05, + "loss": 0.0049, + "step": 360950 + }, + { + "epoch": 1.82, + "learning_rate": 2.6836552966283404e-05, + "loss": 0.0059, + "step": 360960 + }, + { + "epoch": 1.82, + "learning_rate": 2.682898527326939e-05, + "loss": 0.0042, + "step": 360970 + }, + { + "epoch": 1.82, + "learning_rate": 2.682141758025538e-05, + "loss": 0.0071, + "step": 360980 + }, + { + "epoch": 1.82, + "learning_rate": 2.681384988724137e-05, + "loss": 0.0062, + "step": 360990 + }, + { + "epoch": 1.82, + "learning_rate": 2.680628219422736e-05, + "loss": 0.0057, + "step": 361000 + }, + { + "epoch": 1.82, + "eval_cer": 0.9144256176813937, + "eval_loss": 0.004407630767673254, + "eval_runtime": 116.7425, + "eval_samples_per_second": 17.132, + "eval_steps_per_second": 4.283, + "step": 361000 + }, + { + "epoch": 1.82, + "learning_rate": 2.679871450121335e-05, + "loss": 0.0085, + "step": 361010 + }, + { + "epoch": 1.82, + "learning_rate": 2.679114680819934e-05, + "loss": 0.0054, + "step": 361020 + }, + { + "epoch": 1.82, + "learning_rate": 2.678357911518533e-05, + "loss": 0.0053, + "step": 361030 + }, + { + "epoch": 1.82, + "learning_rate": 2.677601142217132e-05, + "loss": 0.0045, + "step": 361040 + }, + { + "epoch": 1.82, + "learning_rate": 2.6768443729157312e-05, + "loss": 0.0075, + "step": 361050 + }, + { + "epoch": 1.82, + "learning_rate": 2.67608760361433e-05, + "loss": 0.0074, + "step": 361060 + }, + { + "epoch": 1.82, + "learning_rate": 2.675330834312929e-05, + "loss": 0.0052, + "step": 361070 + }, + { + "epoch": 1.82, + "learning_rate": 2.674574065011528e-05, + "loss": 0.0078, + "step": 361080 + }, + { + "epoch": 1.82, + "learning_rate": 2.673817295710127e-05, + "loss": 0.0057, + "step": 361090 + }, + { + "epoch": 1.82, + "learning_rate": 2.673060526408726e-05, + "loss": 0.0061, + "step": 361100 + }, + { + "epoch": 1.82, + "learning_rate": 2.672303757107325e-05, + "loss": 0.0063, + "step": 361110 + }, + { + "epoch": 1.82, + "learning_rate": 2.6715469878059236e-05, + "loss": 0.0055, + "step": 361120 + }, + { + "epoch": 1.82, + "learning_rate": 2.6707902185045224e-05, + "loss": 0.0046, + "step": 361130 + }, + { + "epoch": 1.82, + "learning_rate": 2.6700334492031216e-05, + "loss": 0.005, + "step": 361140 + }, + { + "epoch": 1.82, + "learning_rate": 2.6692766799017204e-05, + "loss": 0.0045, + "step": 361150 + }, + { + "epoch": 1.82, + "learning_rate": 2.6685199106003196e-05, + "loss": 0.0059, + "step": 361160 + }, + { + "epoch": 1.82, + "learning_rate": 2.6677631412989184e-05, + "loss": 0.006, + "step": 361170 + }, + { + "epoch": 1.82, + "learning_rate": 2.6670063719975176e-05, + "loss": 0.0058, + "step": 361180 + }, + { + "epoch": 1.82, + "learning_rate": 2.6662496026961164e-05, + "loss": 0.0045, + "step": 361190 + }, + { + "epoch": 1.82, + "learning_rate": 2.6654928333947155e-05, + "loss": 0.0069, + "step": 361200 + }, + { + "epoch": 1.82, + "learning_rate": 2.6647360640933144e-05, + "loss": 0.0047, + "step": 361210 + }, + { + "epoch": 1.82, + "learning_rate": 2.6639792947919135e-05, + "loss": 0.0058, + "step": 361220 + }, + { + "epoch": 1.82, + "learning_rate": 2.6632225254905123e-05, + "loss": 0.0072, + "step": 361230 + }, + { + "epoch": 1.82, + "learning_rate": 2.6624657561891115e-05, + "loss": 0.0057, + "step": 361240 + }, + { + "epoch": 1.82, + "learning_rate": 2.6617089868877103e-05, + "loss": 0.006, + "step": 361250 + }, + { + "epoch": 1.82, + "learning_rate": 2.6609522175863095e-05, + "loss": 0.0061, + "step": 361260 + }, + { + "epoch": 1.82, + "learning_rate": 2.6601954482849083e-05, + "loss": 0.0065, + "step": 361270 + }, + { + "epoch": 1.82, + "learning_rate": 2.659438678983507e-05, + "loss": 0.0081, + "step": 361280 + }, + { + "epoch": 1.82, + "learning_rate": 2.658681909682106e-05, + "loss": 0.0053, + "step": 361290 + }, + { + "epoch": 1.82, + "learning_rate": 2.657925140380705e-05, + "loss": 0.0057, + "step": 361300 + }, + { + "epoch": 1.82, + "learning_rate": 2.657168371079304e-05, + "loss": 0.0062, + "step": 361310 + }, + { + "epoch": 1.82, + "learning_rate": 2.656411601777903e-05, + "loss": 0.0067, + "step": 361320 + }, + { + "epoch": 1.82, + "learning_rate": 2.655654832476502e-05, + "loss": 0.0064, + "step": 361330 + }, + { + "epoch": 1.82, + "learning_rate": 2.654898063175101e-05, + "loss": 0.0043, + "step": 361340 + }, + { + "epoch": 1.82, + "learning_rate": 2.6541412938737e-05, + "loss": 0.0062, + "step": 361350 + }, + { + "epoch": 1.82, + "learning_rate": 2.653384524572299e-05, + "loss": 0.0061, + "step": 361360 + }, + { + "epoch": 1.82, + "learning_rate": 2.652627755270898e-05, + "loss": 0.0054, + "step": 361370 + }, + { + "epoch": 1.82, + "learning_rate": 2.651870985969497e-05, + "loss": 0.0057, + "step": 361380 + }, + { + "epoch": 1.82, + "learning_rate": 2.651114216668096e-05, + "loss": 0.0048, + "step": 361390 + }, + { + "epoch": 1.82, + "learning_rate": 2.650357447366695e-05, + "loss": 0.0049, + "step": 361400 + }, + { + "epoch": 1.82, + "learning_rate": 2.649600678065294e-05, + "loss": 0.0063, + "step": 361410 + }, + { + "epoch": 1.82, + "learning_rate": 2.648843908763893e-05, + "loss": 0.0069, + "step": 361420 + }, + { + "epoch": 1.82, + "learning_rate": 2.6480871394624918e-05, + "loss": 0.0058, + "step": 361430 + }, + { + "epoch": 1.82, + "learning_rate": 2.6473303701610906e-05, + "loss": 0.0084, + "step": 361440 + }, + { + "epoch": 1.82, + "learning_rate": 2.6465736008596895e-05, + "loss": 0.0063, + "step": 361450 + }, + { + "epoch": 1.82, + "learning_rate": 2.6458168315582886e-05, + "loss": 0.0062, + "step": 361460 + }, + { + "epoch": 1.82, + "learning_rate": 2.6450600622568875e-05, + "loss": 0.0063, + "step": 361470 + }, + { + "epoch": 1.82, + "learning_rate": 2.6443032929554866e-05, + "loss": 0.0049, + "step": 361480 + }, + { + "epoch": 1.82, + "learning_rate": 2.6435465236540854e-05, + "loss": 0.0056, + "step": 361490 + }, + { + "epoch": 1.82, + "learning_rate": 2.6427897543526846e-05, + "loss": 0.0072, + "step": 361500 + }, + { + "epoch": 1.82, + "learning_rate": 2.6420329850512834e-05, + "loss": 0.0067, + "step": 361510 + }, + { + "epoch": 1.82, + "learning_rate": 2.6412762157498826e-05, + "loss": 0.0039, + "step": 361520 + }, + { + "epoch": 1.82, + "learning_rate": 2.6405194464484814e-05, + "loss": 0.005, + "step": 361530 + }, + { + "epoch": 1.82, + "learning_rate": 2.6397626771470806e-05, + "loss": 0.006, + "step": 361540 + }, + { + "epoch": 1.82, + "learning_rate": 2.6390059078456794e-05, + "loss": 0.005, + "step": 361550 + }, + { + "epoch": 1.82, + "learning_rate": 2.6382491385442785e-05, + "loss": 0.0061, + "step": 361560 + }, + { + "epoch": 1.82, + "learning_rate": 2.6374923692428774e-05, + "loss": 0.006, + "step": 361570 + }, + { + "epoch": 1.82, + "learning_rate": 2.6367355999414765e-05, + "loss": 0.0053, + "step": 361580 + }, + { + "epoch": 1.82, + "learning_rate": 2.6359788306400753e-05, + "loss": 0.0038, + "step": 361590 + }, + { + "epoch": 1.82, + "learning_rate": 2.635222061338674e-05, + "loss": 0.0052, + "step": 361600 + }, + { + "epoch": 1.82, + "learning_rate": 2.634465292037273e-05, + "loss": 0.008, + "step": 361610 + }, + { + "epoch": 1.82, + "learning_rate": 2.633708522735872e-05, + "loss": 0.0053, + "step": 361620 + }, + { + "epoch": 1.82, + "learning_rate": 2.632951753434471e-05, + "loss": 0.0062, + "step": 361630 + }, + { + "epoch": 1.82, + "learning_rate": 2.63219498413307e-05, + "loss": 0.0051, + "step": 361640 + }, + { + "epoch": 1.82, + "learning_rate": 2.631438214831669e-05, + "loss": 0.0066, + "step": 361650 + }, + { + "epoch": 1.82, + "learning_rate": 2.630681445530268e-05, + "loss": 0.0042, + "step": 361660 + }, + { + "epoch": 1.82, + "learning_rate": 2.629924676228867e-05, + "loss": 0.007, + "step": 361670 + }, + { + "epoch": 1.82, + "learning_rate": 2.629167906927466e-05, + "loss": 0.0068, + "step": 361680 + }, + { + "epoch": 1.82, + "learning_rate": 2.628411137626065e-05, + "loss": 0.0044, + "step": 361690 + }, + { + "epoch": 1.82, + "learning_rate": 2.627654368324664e-05, + "loss": 0.0062, + "step": 361700 + }, + { + "epoch": 1.82, + "learning_rate": 2.626897599023263e-05, + "loss": 0.0061, + "step": 361710 + }, + { + "epoch": 1.82, + "learning_rate": 2.626140829721862e-05, + "loss": 0.0074, + "step": 361720 + }, + { + "epoch": 1.82, + "learning_rate": 2.625384060420461e-05, + "loss": 0.0062, + "step": 361730 + }, + { + "epoch": 1.83, + "learning_rate": 2.62462729111906e-05, + "loss": 0.0066, + "step": 361740 + }, + { + "epoch": 1.83, + "learning_rate": 2.6238705218176585e-05, + "loss": 0.0052, + "step": 361750 + }, + { + "epoch": 1.83, + "learning_rate": 2.6231137525162577e-05, + "loss": 0.0045, + "step": 361760 + }, + { + "epoch": 1.83, + "learning_rate": 2.6223569832148565e-05, + "loss": 0.0039, + "step": 361770 + }, + { + "epoch": 1.83, + "learning_rate": 2.6216002139134557e-05, + "loss": 0.0052, + "step": 361780 + }, + { + "epoch": 1.83, + "learning_rate": 2.6208434446120545e-05, + "loss": 0.0055, + "step": 361790 + }, + { + "epoch": 1.83, + "learning_rate": 2.6200866753106537e-05, + "loss": 0.0067, + "step": 361800 + }, + { + "epoch": 1.83, + "learning_rate": 2.6193299060092525e-05, + "loss": 0.0066, + "step": 361810 + }, + { + "epoch": 1.83, + "learning_rate": 2.6185731367078516e-05, + "loss": 0.0093, + "step": 361820 + }, + { + "epoch": 1.83, + "learning_rate": 2.6178163674064505e-05, + "loss": 0.0068, + "step": 361830 + }, + { + "epoch": 1.83, + "learning_rate": 2.6170595981050496e-05, + "loss": 0.0061, + "step": 361840 + }, + { + "epoch": 1.83, + "learning_rate": 2.6163028288036484e-05, + "loss": 0.0065, + "step": 361850 + }, + { + "epoch": 1.83, + "learning_rate": 2.6155460595022476e-05, + "loss": 0.0058, + "step": 361860 + }, + { + "epoch": 1.83, + "learning_rate": 2.6147892902008464e-05, + "loss": 0.0058, + "step": 361870 + }, + { + "epoch": 1.83, + "learning_rate": 2.6140325208994456e-05, + "loss": 0.0068, + "step": 361880 + }, + { + "epoch": 1.83, + "learning_rate": 2.6132757515980444e-05, + "loss": 0.0055, + "step": 361890 + }, + { + "epoch": 1.83, + "learning_rate": 2.6125189822966436e-05, + "loss": 0.0049, + "step": 361900 + }, + { + "epoch": 1.83, + "learning_rate": 2.611762212995242e-05, + "loss": 0.0048, + "step": 361910 + }, + { + "epoch": 1.83, + "learning_rate": 2.611005443693841e-05, + "loss": 0.0061, + "step": 361920 + }, + { + "epoch": 1.83, + "learning_rate": 2.61024867439244e-05, + "loss": 0.0044, + "step": 361930 + }, + { + "epoch": 1.83, + "learning_rate": 2.609491905091039e-05, + "loss": 0.006, + "step": 361940 + }, + { + "epoch": 1.83, + "learning_rate": 2.608735135789638e-05, + "loss": 0.0066, + "step": 361950 + }, + { + "epoch": 1.83, + "learning_rate": 2.607978366488237e-05, + "loss": 0.0086, + "step": 361960 + }, + { + "epoch": 1.83, + "learning_rate": 2.607221597186836e-05, + "loss": 0.0061, + "step": 361970 + }, + { + "epoch": 1.83, + "learning_rate": 2.6064648278854348e-05, + "loss": 0.0078, + "step": 361980 + }, + { + "epoch": 1.83, + "learning_rate": 2.605708058584034e-05, + "loss": 0.0048, + "step": 361990 + }, + { + "epoch": 1.83, + "learning_rate": 2.6049512892826328e-05, + "loss": 0.0065, + "step": 362000 + }, + { + "epoch": 1.83, + "eval_cer": 0.9144314400581461, + "eval_loss": 0.004417457617819309, + "eval_runtime": 116.6172, + "eval_samples_per_second": 17.15, + "eval_steps_per_second": 4.288, + "step": 362000 + }, + { + "epoch": 1.83, + "learning_rate": 2.604194519981232e-05, + "loss": 0.0051, + "step": 362010 + }, + { + "epoch": 1.83, + "learning_rate": 2.603437750679831e-05, + "loss": 0.0065, + "step": 362020 + }, + { + "epoch": 1.83, + "learning_rate": 2.60268098137843e-05, + "loss": 0.0086, + "step": 362030 + }, + { + "epoch": 1.83, + "learning_rate": 2.601924212077029e-05, + "loss": 0.0066, + "step": 362040 + }, + { + "epoch": 1.83, + "learning_rate": 2.601167442775628e-05, + "loss": 0.0053, + "step": 362050 + }, + { + "epoch": 1.83, + "learning_rate": 2.600410673474227e-05, + "loss": 0.0049, + "step": 362060 + }, + { + "epoch": 1.83, + "learning_rate": 2.5996539041728256e-05, + "loss": 0.005, + "step": 362070 + }, + { + "epoch": 1.83, + "learning_rate": 2.5988971348714244e-05, + "loss": 0.0059, + "step": 362080 + }, + { + "epoch": 1.83, + "learning_rate": 2.5981403655700236e-05, + "loss": 0.0065, + "step": 362090 + }, + { + "epoch": 1.83, + "learning_rate": 2.5973835962686224e-05, + "loss": 0.0058, + "step": 362100 + }, + { + "epoch": 1.83, + "learning_rate": 2.5966268269672215e-05, + "loss": 0.0067, + "step": 362110 + }, + { + "epoch": 1.83, + "learning_rate": 2.5958700576658204e-05, + "loss": 0.0067, + "step": 362120 + }, + { + "epoch": 1.83, + "learning_rate": 2.5951132883644195e-05, + "loss": 0.0054, + "step": 362130 + }, + { + "epoch": 1.83, + "learning_rate": 2.5943565190630183e-05, + "loss": 0.0043, + "step": 362140 + }, + { + "epoch": 1.83, + "learning_rate": 2.5935997497616175e-05, + "loss": 0.0057, + "step": 362150 + }, + { + "epoch": 1.83, + "learning_rate": 2.5928429804602163e-05, + "loss": 0.0045, + "step": 362160 + }, + { + "epoch": 1.83, + "learning_rate": 2.5920862111588155e-05, + "loss": 0.006, + "step": 362170 + }, + { + "epoch": 1.83, + "learning_rate": 2.5913294418574143e-05, + "loss": 0.0074, + "step": 362180 + }, + { + "epoch": 1.83, + "learning_rate": 2.5905726725560135e-05, + "loss": 0.0053, + "step": 362190 + }, + { + "epoch": 1.83, + "learning_rate": 2.5898159032546123e-05, + "loss": 0.0063, + "step": 362200 + }, + { + "epoch": 1.83, + "learning_rate": 2.5890591339532115e-05, + "loss": 0.0046, + "step": 362210 + }, + { + "epoch": 1.83, + "learning_rate": 2.58830236465181e-05, + "loss": 0.0072, + "step": 362220 + }, + { + "epoch": 1.83, + "learning_rate": 2.587545595350409e-05, + "loss": 0.0055, + "step": 362230 + }, + { + "epoch": 1.83, + "learning_rate": 2.586788826049008e-05, + "loss": 0.0078, + "step": 362240 + }, + { + "epoch": 1.83, + "learning_rate": 2.586032056747607e-05, + "loss": 0.0065, + "step": 362250 + }, + { + "epoch": 1.83, + "learning_rate": 2.585275287446206e-05, + "loss": 0.0075, + "step": 362260 + }, + { + "epoch": 1.83, + "learning_rate": 2.584518518144805e-05, + "loss": 0.0065, + "step": 362270 + }, + { + "epoch": 1.83, + "learning_rate": 2.583761748843404e-05, + "loss": 0.0063, + "step": 362280 + }, + { + "epoch": 1.83, + "learning_rate": 2.583004979542003e-05, + "loss": 0.0042, + "step": 362290 + }, + { + "epoch": 1.83, + "learning_rate": 2.582248210240602e-05, + "loss": 0.0082, + "step": 362300 + }, + { + "epoch": 1.83, + "learning_rate": 2.581491440939201e-05, + "loss": 0.0085, + "step": 362310 + }, + { + "epoch": 1.83, + "learning_rate": 2.5807346716378e-05, + "loss": 0.0074, + "step": 362320 + }, + { + "epoch": 1.83, + "learning_rate": 2.579977902336399e-05, + "loss": 0.0051, + "step": 362330 + }, + { + "epoch": 1.83, + "learning_rate": 2.5792211330349978e-05, + "loss": 0.0059, + "step": 362340 + }, + { + "epoch": 1.83, + "learning_rate": 2.578464363733597e-05, + "loss": 0.0074, + "step": 362350 + }, + { + "epoch": 1.83, + "learning_rate": 2.5777075944321958e-05, + "loss": 0.0079, + "step": 362360 + }, + { + "epoch": 1.83, + "learning_rate": 2.576950825130795e-05, + "loss": 0.0064, + "step": 362370 + }, + { + "epoch": 1.83, + "learning_rate": 2.5761940558293935e-05, + "loss": 0.0068, + "step": 362380 + }, + { + "epoch": 1.83, + "learning_rate": 2.5754372865279926e-05, + "loss": 0.005, + "step": 362390 + }, + { + "epoch": 1.83, + "learning_rate": 2.5746805172265914e-05, + "loss": 0.0056, + "step": 362400 + }, + { + "epoch": 1.83, + "learning_rate": 2.5739237479251906e-05, + "loss": 0.006, + "step": 362410 + }, + { + "epoch": 1.83, + "learning_rate": 2.5731669786237894e-05, + "loss": 0.0094, + "step": 362420 + }, + { + "epoch": 1.83, + "learning_rate": 2.5724102093223886e-05, + "loss": 0.0069, + "step": 362430 + }, + { + "epoch": 1.83, + "learning_rate": 2.5716534400209874e-05, + "loss": 0.0073, + "step": 362440 + }, + { + "epoch": 1.83, + "learning_rate": 2.5708966707195866e-05, + "loss": 0.0065, + "step": 362450 + }, + { + "epoch": 1.83, + "learning_rate": 2.5701399014181854e-05, + "loss": 0.0045, + "step": 362460 + }, + { + "epoch": 1.83, + "learning_rate": 2.5693831321167845e-05, + "loss": 0.0073, + "step": 362470 + }, + { + "epoch": 1.83, + "learning_rate": 2.5686263628153834e-05, + "loss": 0.0069, + "step": 362480 + }, + { + "epoch": 1.83, + "learning_rate": 2.5678695935139825e-05, + "loss": 0.0059, + "step": 362490 + }, + { + "epoch": 1.83, + "learning_rate": 2.5671128242125814e-05, + "loss": 0.0088, + "step": 362500 + }, + { + "epoch": 1.83, + "learning_rate": 2.5663560549111805e-05, + "loss": 0.0039, + "step": 362510 + }, + { + "epoch": 1.83, + "learning_rate": 2.5655992856097793e-05, + "loss": 0.0061, + "step": 362520 + }, + { + "epoch": 1.83, + "learning_rate": 2.5648425163083785e-05, + "loss": 0.006, + "step": 362530 + }, + { + "epoch": 1.83, + "learning_rate": 2.564085747006977e-05, + "loss": 0.0065, + "step": 362540 + }, + { + "epoch": 1.83, + "learning_rate": 2.563328977705576e-05, + "loss": 0.0036, + "step": 362550 + }, + { + "epoch": 1.83, + "learning_rate": 2.562572208404175e-05, + "loss": 0.0071, + "step": 362560 + }, + { + "epoch": 1.83, + "learning_rate": 2.561815439102774e-05, + "loss": 0.0054, + "step": 362570 + }, + { + "epoch": 1.83, + "learning_rate": 2.561058669801373e-05, + "loss": 0.004, + "step": 362580 + }, + { + "epoch": 1.83, + "learning_rate": 2.560301900499972e-05, + "loss": 0.0061, + "step": 362590 + }, + { + "epoch": 1.83, + "learning_rate": 2.559545131198571e-05, + "loss": 0.0055, + "step": 362600 + }, + { + "epoch": 1.83, + "learning_rate": 2.55878836189717e-05, + "loss": 0.0066, + "step": 362610 + }, + { + "epoch": 1.83, + "learning_rate": 2.558031592595769e-05, + "loss": 0.0054, + "step": 362620 + }, + { + "epoch": 1.83, + "learning_rate": 2.557274823294368e-05, + "loss": 0.0054, + "step": 362630 + }, + { + "epoch": 1.83, + "learning_rate": 2.556518053992967e-05, + "loss": 0.0076, + "step": 362640 + }, + { + "epoch": 1.83, + "learning_rate": 2.555761284691566e-05, + "loss": 0.0058, + "step": 362650 + }, + { + "epoch": 1.83, + "learning_rate": 2.555004515390165e-05, + "loss": 0.0034, + "step": 362660 + }, + { + "epoch": 1.83, + "learning_rate": 2.554247746088764e-05, + "loss": 0.0066, + "step": 362670 + }, + { + "epoch": 1.83, + "learning_rate": 2.553490976787363e-05, + "loss": 0.0059, + "step": 362680 + }, + { + "epoch": 1.83, + "learning_rate": 2.552734207485962e-05, + "loss": 0.0046, + "step": 362690 + }, + { + "epoch": 1.83, + "learning_rate": 2.5519774381845605e-05, + "loss": 0.0078, + "step": 362700 + }, + { + "epoch": 1.83, + "learning_rate": 2.5512206688831593e-05, + "loss": 0.006, + "step": 362710 + }, + { + "epoch": 1.83, + "learning_rate": 2.5504638995817585e-05, + "loss": 0.0065, + "step": 362720 + }, + { + "epoch": 1.83, + "learning_rate": 2.5497071302803576e-05, + "loss": 0.0041, + "step": 362730 + }, + { + "epoch": 1.83, + "learning_rate": 2.5489503609789565e-05, + "loss": 0.0069, + "step": 362740 + }, + { + "epoch": 1.83, + "learning_rate": 2.5481935916775556e-05, + "loss": 0.0054, + "step": 362750 + }, + { + "epoch": 1.83, + "learning_rate": 2.5474368223761544e-05, + "loss": 0.0077, + "step": 362760 + }, + { + "epoch": 1.83, + "learning_rate": 2.5466800530747536e-05, + "loss": 0.0075, + "step": 362770 + }, + { + "epoch": 1.83, + "learning_rate": 2.5459232837733524e-05, + "loss": 0.0047, + "step": 362780 + }, + { + "epoch": 1.83, + "learning_rate": 2.5451665144719516e-05, + "loss": 0.0051, + "step": 362790 + }, + { + "epoch": 1.83, + "learning_rate": 2.5444097451705504e-05, + "loss": 0.0067, + "step": 362800 + }, + { + "epoch": 1.83, + "learning_rate": 2.5436529758691496e-05, + "loss": 0.0065, + "step": 362810 + }, + { + "epoch": 1.83, + "learning_rate": 2.5428962065677484e-05, + "loss": 0.0066, + "step": 362820 + }, + { + "epoch": 1.83, + "learning_rate": 2.5421394372663476e-05, + "loss": 0.0057, + "step": 362830 + }, + { + "epoch": 1.83, + "learning_rate": 2.5413826679649464e-05, + "loss": 0.0092, + "step": 362840 + }, + { + "epoch": 1.83, + "learning_rate": 2.540625898663545e-05, + "loss": 0.0068, + "step": 362850 + }, + { + "epoch": 1.83, + "learning_rate": 2.539869129362144e-05, + "loss": 0.0053, + "step": 362860 + }, + { + "epoch": 1.83, + "learning_rate": 2.539112360060743e-05, + "loss": 0.0053, + "step": 362870 + }, + { + "epoch": 1.83, + "learning_rate": 2.538355590759342e-05, + "loss": 0.0061, + "step": 362880 + }, + { + "epoch": 1.83, + "learning_rate": 2.5375988214579408e-05, + "loss": 0.0059, + "step": 362890 + }, + { + "epoch": 1.83, + "learning_rate": 2.53684205215654e-05, + "loss": 0.0055, + "step": 362900 + }, + { + "epoch": 1.83, + "learning_rate": 2.5360852828551388e-05, + "loss": 0.0081, + "step": 362910 + }, + { + "epoch": 1.83, + "learning_rate": 2.535328513553738e-05, + "loss": 0.0071, + "step": 362920 + }, + { + "epoch": 1.83, + "learning_rate": 2.5345717442523368e-05, + "loss": 0.0067, + "step": 362930 + }, + { + "epoch": 1.83, + "learning_rate": 2.533814974950936e-05, + "loss": 0.0065, + "step": 362940 + }, + { + "epoch": 1.83, + "learning_rate": 2.5330582056495348e-05, + "loss": 0.0061, + "step": 362950 + }, + { + "epoch": 1.83, + "learning_rate": 2.532301436348134e-05, + "loss": 0.004, + "step": 362960 + }, + { + "epoch": 1.83, + "learning_rate": 2.5315446670467328e-05, + "loss": 0.0056, + "step": 362970 + }, + { + "epoch": 1.83, + "learning_rate": 2.530787897745332e-05, + "loss": 0.0048, + "step": 362980 + }, + { + "epoch": 1.83, + "learning_rate": 2.530031128443931e-05, + "loss": 0.0088, + "step": 362990 + }, + { + "epoch": 1.83, + "learning_rate": 2.52927435914253e-05, + "loss": 0.0045, + "step": 363000 + }, + { + "epoch": 1.83, + "eval_cer": 0.9144324104542716, + "eval_loss": 0.004368518013507128, + "eval_runtime": 116.7968, + "eval_samples_per_second": 17.124, + "eval_steps_per_second": 4.281, + "step": 363000 + }, + { + "epoch": 1.83, + "learning_rate": 2.5285175898411284e-05, + "loss": 0.0062, + "step": 363010 + }, + { + "epoch": 1.83, + "learning_rate": 2.5277608205397275e-05, + "loss": 0.0062, + "step": 363020 + }, + { + "epoch": 1.83, + "learning_rate": 2.5270040512383264e-05, + "loss": 0.0061, + "step": 363030 + }, + { + "epoch": 1.83, + "learning_rate": 2.5262472819369255e-05, + "loss": 0.0047, + "step": 363040 + }, + { + "epoch": 1.83, + "learning_rate": 2.5254905126355243e-05, + "loss": 0.0046, + "step": 363050 + }, + { + "epoch": 1.83, + "learning_rate": 2.5247337433341235e-05, + "loss": 0.0072, + "step": 363060 + }, + { + "epoch": 1.83, + "learning_rate": 2.5239769740327223e-05, + "loss": 0.0071, + "step": 363070 + }, + { + "epoch": 1.83, + "learning_rate": 2.5232202047313215e-05, + "loss": 0.0081, + "step": 363080 + }, + { + "epoch": 1.83, + "learning_rate": 2.5224634354299203e-05, + "loss": 0.0079, + "step": 363090 + }, + { + "epoch": 1.83, + "learning_rate": 2.5217066661285195e-05, + "loss": 0.0046, + "step": 363100 + }, + { + "epoch": 1.83, + "learning_rate": 2.5209498968271183e-05, + "loss": 0.0065, + "step": 363110 + }, + { + "epoch": 1.83, + "learning_rate": 2.5201931275257175e-05, + "loss": 0.0054, + "step": 363120 + }, + { + "epoch": 1.83, + "learning_rate": 2.5194363582243163e-05, + "loss": 0.005, + "step": 363130 + }, + { + "epoch": 1.83, + "learning_rate": 2.5186795889229154e-05, + "loss": 0.0062, + "step": 363140 + }, + { + "epoch": 1.83, + "learning_rate": 2.5179228196215143e-05, + "loss": 0.006, + "step": 363150 + }, + { + "epoch": 1.83, + "learning_rate": 2.5171660503201134e-05, + "loss": 0.0087, + "step": 363160 + }, + { + "epoch": 1.83, + "learning_rate": 2.516409281018712e-05, + "loss": 0.0048, + "step": 363170 + }, + { + "epoch": 1.83, + "learning_rate": 2.515652511717311e-05, + "loss": 0.0053, + "step": 363180 + }, + { + "epoch": 1.83, + "learning_rate": 2.51489574241591e-05, + "loss": 0.006, + "step": 363190 + }, + { + "epoch": 1.83, + "learning_rate": 2.514138973114509e-05, + "loss": 0.0057, + "step": 363200 + }, + { + "epoch": 1.83, + "learning_rate": 2.513382203813108e-05, + "loss": 0.0076, + "step": 363210 + }, + { + "epoch": 1.83, + "learning_rate": 2.512625434511707e-05, + "loss": 0.005, + "step": 363220 + }, + { + "epoch": 1.83, + "learning_rate": 2.511868665210306e-05, + "loss": 0.006, + "step": 363230 + }, + { + "epoch": 1.83, + "learning_rate": 2.511111895908905e-05, + "loss": 0.0041, + "step": 363240 + }, + { + "epoch": 1.83, + "learning_rate": 2.510355126607504e-05, + "loss": 0.0079, + "step": 363250 + }, + { + "epoch": 1.83, + "learning_rate": 2.509598357306103e-05, + "loss": 0.0062, + "step": 363260 + }, + { + "epoch": 1.83, + "learning_rate": 2.5088415880047018e-05, + "loss": 0.0057, + "step": 363270 + }, + { + "epoch": 1.83, + "learning_rate": 2.508084818703301e-05, + "loss": 0.0059, + "step": 363280 + }, + { + "epoch": 1.83, + "learning_rate": 2.5073280494018998e-05, + "loss": 0.0076, + "step": 363290 + }, + { + "epoch": 1.83, + "learning_rate": 2.506571280100499e-05, + "loss": 0.0045, + "step": 363300 + }, + { + "epoch": 1.83, + "learning_rate": 2.5058145107990978e-05, + "loss": 0.0058, + "step": 363310 + }, + { + "epoch": 1.83, + "learning_rate": 2.5050577414976966e-05, + "loss": 0.0056, + "step": 363320 + }, + { + "epoch": 1.83, + "learning_rate": 2.5043009721962954e-05, + "loss": 0.0055, + "step": 363330 + }, + { + "epoch": 1.83, + "learning_rate": 2.5035442028948946e-05, + "loss": 0.0068, + "step": 363340 + }, + { + "epoch": 1.83, + "learning_rate": 2.5027874335934934e-05, + "loss": 0.007, + "step": 363350 + }, + { + "epoch": 1.83, + "learning_rate": 2.5020306642920926e-05, + "loss": 0.0048, + "step": 363360 + }, + { + "epoch": 1.83, + "learning_rate": 2.5012738949906914e-05, + "loss": 0.0047, + "step": 363370 + }, + { + "epoch": 1.83, + "learning_rate": 2.5005171256892906e-05, + "loss": 0.0059, + "step": 363380 + }, + { + "epoch": 1.83, + "learning_rate": 2.4997603563878894e-05, + "loss": 0.0045, + "step": 363390 + }, + { + "epoch": 1.83, + "learning_rate": 2.4990035870864885e-05, + "loss": 0.0066, + "step": 363400 + }, + { + "epoch": 1.83, + "learning_rate": 2.4982468177850874e-05, + "loss": 0.0053, + "step": 363410 + }, + { + "epoch": 1.83, + "learning_rate": 2.4974900484836865e-05, + "loss": 0.0041, + "step": 363420 + }, + { + "epoch": 1.83, + "learning_rate": 2.4967332791822853e-05, + "loss": 0.0074, + "step": 363430 + }, + { + "epoch": 1.83, + "learning_rate": 2.4959765098808845e-05, + "loss": 0.0078, + "step": 363440 + }, + { + "epoch": 1.83, + "learning_rate": 2.4952197405794833e-05, + "loss": 0.008, + "step": 363450 + }, + { + "epoch": 1.83, + "learning_rate": 2.4944629712780825e-05, + "loss": 0.0049, + "step": 363460 + }, + { + "epoch": 1.83, + "learning_rate": 2.4937062019766813e-05, + "loss": 0.0061, + "step": 363470 + }, + { + "epoch": 1.83, + "learning_rate": 2.49294943267528e-05, + "loss": 0.0058, + "step": 363480 + }, + { + "epoch": 1.83, + "learning_rate": 2.492192663373879e-05, + "loss": 0.0044, + "step": 363490 + }, + { + "epoch": 1.83, + "learning_rate": 2.491435894072478e-05, + "loss": 0.0055, + "step": 363500 + }, + { + "epoch": 1.83, + "learning_rate": 2.490679124771077e-05, + "loss": 0.0052, + "step": 363510 + }, + { + "epoch": 1.83, + "learning_rate": 2.489922355469676e-05, + "loss": 0.0052, + "step": 363520 + }, + { + "epoch": 1.83, + "learning_rate": 2.489165586168275e-05, + "loss": 0.0049, + "step": 363530 + }, + { + "epoch": 1.83, + "learning_rate": 2.488408816866874e-05, + "loss": 0.0056, + "step": 363540 + }, + { + "epoch": 1.83, + "learning_rate": 2.487652047565473e-05, + "loss": 0.0059, + "step": 363550 + }, + { + "epoch": 1.83, + "learning_rate": 2.486895278264072e-05, + "loss": 0.0062, + "step": 363560 + }, + { + "epoch": 1.83, + "learning_rate": 2.486138508962671e-05, + "loss": 0.0074, + "step": 363570 + }, + { + "epoch": 1.83, + "learning_rate": 2.48538173966127e-05, + "loss": 0.005, + "step": 363580 + }, + { + "epoch": 1.83, + "learning_rate": 2.484624970359869e-05, + "loss": 0.0047, + "step": 363590 + }, + { + "epoch": 1.83, + "learning_rate": 2.483868201058468e-05, + "loss": 0.0092, + "step": 363600 + }, + { + "epoch": 1.83, + "learning_rate": 2.483111431757067e-05, + "loss": 0.0067, + "step": 363610 + }, + { + "epoch": 1.83, + "learning_rate": 2.482354662455666e-05, + "loss": 0.0083, + "step": 363620 + }, + { + "epoch": 1.83, + "learning_rate": 2.4815978931542648e-05, + "loss": 0.006, + "step": 363630 + }, + { + "epoch": 1.83, + "learning_rate": 2.4808411238528633e-05, + "loss": 0.0065, + "step": 363640 + }, + { + "epoch": 1.83, + "learning_rate": 2.4800843545514625e-05, + "loss": 0.0067, + "step": 363650 + }, + { + "epoch": 1.83, + "learning_rate": 2.4793275852500613e-05, + "loss": 0.0042, + "step": 363660 + }, + { + "epoch": 1.83, + "learning_rate": 2.4785708159486605e-05, + "loss": 0.0044, + "step": 363670 + }, + { + "epoch": 1.83, + "learning_rate": 2.4778140466472593e-05, + "loss": 0.0048, + "step": 363680 + }, + { + "epoch": 1.83, + "learning_rate": 2.4770572773458584e-05, + "loss": 0.0057, + "step": 363690 + }, + { + "epoch": 1.83, + "learning_rate": 2.4763005080444576e-05, + "loss": 0.0062, + "step": 363700 + }, + { + "epoch": 1.83, + "learning_rate": 2.4755437387430564e-05, + "loss": 0.0062, + "step": 363710 + }, + { + "epoch": 1.84, + "learning_rate": 2.4747869694416556e-05, + "loss": 0.0048, + "step": 363720 + }, + { + "epoch": 1.84, + "learning_rate": 2.4740302001402544e-05, + "loss": 0.0061, + "step": 363730 + }, + { + "epoch": 1.84, + "learning_rate": 2.4732734308388536e-05, + "loss": 0.0067, + "step": 363740 + }, + { + "epoch": 1.84, + "learning_rate": 2.4725166615374524e-05, + "loss": 0.0059, + "step": 363750 + }, + { + "epoch": 1.84, + "learning_rate": 2.4717598922360515e-05, + "loss": 0.0052, + "step": 363760 + }, + { + "epoch": 1.84, + "learning_rate": 2.4710031229346504e-05, + "loss": 0.0037, + "step": 363770 + }, + { + "epoch": 1.84, + "learning_rate": 2.4702463536332495e-05, + "loss": 0.0053, + "step": 363780 + }, + { + "epoch": 1.84, + "learning_rate": 2.4694895843318483e-05, + "loss": 0.007, + "step": 363790 + }, + { + "epoch": 1.84, + "learning_rate": 2.468732815030447e-05, + "loss": 0.0055, + "step": 363800 + }, + { + "epoch": 1.84, + "learning_rate": 2.467976045729046e-05, + "loss": 0.0065, + "step": 363810 + }, + { + "epoch": 1.84, + "learning_rate": 2.4672192764276448e-05, + "loss": 0.004, + "step": 363820 + }, + { + "epoch": 1.84, + "learning_rate": 2.466462507126244e-05, + "loss": 0.0065, + "step": 363830 + }, + { + "epoch": 1.84, + "learning_rate": 2.4657057378248428e-05, + "loss": 0.007, + "step": 363840 + }, + { + "epoch": 1.84, + "learning_rate": 2.464948968523442e-05, + "loss": 0.0065, + "step": 363850 + }, + { + "epoch": 1.84, + "learning_rate": 2.4641921992220408e-05, + "loss": 0.0046, + "step": 363860 + }, + { + "epoch": 1.84, + "learning_rate": 2.46343542992064e-05, + "loss": 0.0065, + "step": 363870 + }, + { + "epoch": 1.84, + "learning_rate": 2.4626786606192388e-05, + "loss": 0.0052, + "step": 363880 + }, + { + "epoch": 1.84, + "learning_rate": 2.461921891317838e-05, + "loss": 0.0069, + "step": 363890 + }, + { + "epoch": 1.84, + "learning_rate": 2.4611651220164367e-05, + "loss": 0.0072, + "step": 363900 + }, + { + "epoch": 1.84, + "learning_rate": 2.460408352715036e-05, + "loss": 0.0074, + "step": 363910 + }, + { + "epoch": 1.84, + "learning_rate": 2.4596515834136347e-05, + "loss": 0.0058, + "step": 363920 + }, + { + "epoch": 1.84, + "learning_rate": 2.458894814112234e-05, + "loss": 0.0069, + "step": 363930 + }, + { + "epoch": 1.84, + "learning_rate": 2.4581380448108327e-05, + "loss": 0.0073, + "step": 363940 + }, + { + "epoch": 1.84, + "learning_rate": 2.4573812755094315e-05, + "loss": 0.0068, + "step": 363950 + }, + { + "epoch": 1.84, + "learning_rate": 2.4566245062080304e-05, + "loss": 0.0043, + "step": 363960 + }, + { + "epoch": 1.84, + "learning_rate": 2.4558677369066295e-05, + "loss": 0.004, + "step": 363970 + }, + { + "epoch": 1.84, + "learning_rate": 2.4551109676052283e-05, + "loss": 0.0039, + "step": 363980 + }, + { + "epoch": 1.84, + "learning_rate": 2.4543541983038275e-05, + "loss": 0.0056, + "step": 363990 + }, + { + "epoch": 1.84, + "learning_rate": 2.4535974290024263e-05, + "loss": 0.0058, + "step": 364000 + }, + { + "epoch": 1.84, + "eval_cer": 0.9144071801550111, + "eval_loss": 0.004426935221999884, + "eval_runtime": 116.6371, + "eval_samples_per_second": 17.147, + "eval_steps_per_second": 4.287, + "step": 364000 + }, + { + "epoch": 1.84, + "learning_rate": 2.4528406597010255e-05, + "loss": 0.0055, + "step": 364010 + }, + { + "epoch": 1.84, + "learning_rate": 2.4520838903996243e-05, + "loss": 0.006, + "step": 364020 + }, + { + "epoch": 1.84, + "learning_rate": 2.4513271210982235e-05, + "loss": 0.0074, + "step": 364030 + }, + { + "epoch": 1.84, + "learning_rate": 2.4505703517968223e-05, + "loss": 0.0064, + "step": 364040 + }, + { + "epoch": 1.84, + "learning_rate": 2.4498135824954214e-05, + "loss": 0.0067, + "step": 364050 + }, + { + "epoch": 1.84, + "learning_rate": 2.4490568131940203e-05, + "loss": 0.0051, + "step": 364060 + }, + { + "epoch": 1.84, + "learning_rate": 2.4483000438926194e-05, + "loss": 0.0048, + "step": 364070 + }, + { + "epoch": 1.84, + "learning_rate": 2.4475432745912182e-05, + "loss": 0.007, + "step": 364080 + }, + { + "epoch": 1.84, + "learning_rate": 2.4467865052898174e-05, + "loss": 0.0066, + "step": 364090 + }, + { + "epoch": 1.84, + "learning_rate": 2.4460297359884162e-05, + "loss": 0.0058, + "step": 364100 + }, + { + "epoch": 1.84, + "learning_rate": 2.445272966687015e-05, + "loss": 0.0048, + "step": 364110 + }, + { + "epoch": 1.84, + "learning_rate": 2.444516197385614e-05, + "loss": 0.0044, + "step": 364120 + }, + { + "epoch": 1.84, + "learning_rate": 2.443759428084213e-05, + "loss": 0.0064, + "step": 364130 + }, + { + "epoch": 1.84, + "learning_rate": 2.443002658782812e-05, + "loss": 0.0062, + "step": 364140 + }, + { + "epoch": 1.84, + "learning_rate": 2.442245889481411e-05, + "loss": 0.0054, + "step": 364150 + }, + { + "epoch": 1.84, + "learning_rate": 2.44148912018001e-05, + "loss": 0.0049, + "step": 364160 + }, + { + "epoch": 1.84, + "learning_rate": 2.440732350878609e-05, + "loss": 0.0049, + "step": 364170 + }, + { + "epoch": 1.84, + "learning_rate": 2.4399755815772078e-05, + "loss": 0.0063, + "step": 364180 + }, + { + "epoch": 1.84, + "learning_rate": 2.439218812275807e-05, + "loss": 0.0054, + "step": 364190 + }, + { + "epoch": 1.84, + "learning_rate": 2.4384620429744058e-05, + "loss": 0.005, + "step": 364200 + }, + { + "epoch": 1.84, + "learning_rate": 2.437705273673005e-05, + "loss": 0.0052, + "step": 364210 + }, + { + "epoch": 1.84, + "learning_rate": 2.4369485043716038e-05, + "loss": 0.0083, + "step": 364220 + }, + { + "epoch": 1.84, + "learning_rate": 2.436191735070203e-05, + "loss": 0.0056, + "step": 364230 + }, + { + "epoch": 1.84, + "learning_rate": 2.4354349657688018e-05, + "loss": 0.0063, + "step": 364240 + }, + { + "epoch": 1.84, + "learning_rate": 2.434678196467401e-05, + "loss": 0.0061, + "step": 364250 + }, + { + "epoch": 1.84, + "learning_rate": 2.4339214271659998e-05, + "loss": 0.006, + "step": 364260 + }, + { + "epoch": 1.84, + "learning_rate": 2.4331646578645986e-05, + "loss": 0.0062, + "step": 364270 + }, + { + "epoch": 1.84, + "learning_rate": 2.4324078885631974e-05, + "loss": 0.0061, + "step": 364280 + }, + { + "epoch": 1.84, + "learning_rate": 2.4316511192617966e-05, + "loss": 0.005, + "step": 364290 + }, + { + "epoch": 1.84, + "learning_rate": 2.4308943499603954e-05, + "loss": 0.005, + "step": 364300 + }, + { + "epoch": 1.84, + "learning_rate": 2.4301375806589945e-05, + "loss": 0.0085, + "step": 364310 + }, + { + "epoch": 1.84, + "learning_rate": 2.4293808113575934e-05, + "loss": 0.0096, + "step": 364320 + }, + { + "epoch": 1.84, + "learning_rate": 2.4286240420561925e-05, + "loss": 0.0056, + "step": 364330 + }, + { + "epoch": 1.84, + "learning_rate": 2.4278672727547913e-05, + "loss": 0.0081, + "step": 364340 + }, + { + "epoch": 1.84, + "learning_rate": 2.4271105034533905e-05, + "loss": 0.0048, + "step": 364350 + }, + { + "epoch": 1.84, + "learning_rate": 2.4263537341519893e-05, + "loss": 0.0052, + "step": 364360 + }, + { + "epoch": 1.84, + "learning_rate": 2.4255969648505885e-05, + "loss": 0.0048, + "step": 364370 + }, + { + "epoch": 1.84, + "learning_rate": 2.4248401955491873e-05, + "loss": 0.0046, + "step": 364380 + }, + { + "epoch": 1.84, + "learning_rate": 2.4240834262477865e-05, + "loss": 0.0079, + "step": 364390 + }, + { + "epoch": 1.84, + "learning_rate": 2.4233266569463853e-05, + "loss": 0.0051, + "step": 364400 + }, + { + "epoch": 1.84, + "learning_rate": 2.4225698876449845e-05, + "loss": 0.0056, + "step": 364410 + }, + { + "epoch": 1.84, + "learning_rate": 2.421813118343583e-05, + "loss": 0.0053, + "step": 364420 + }, + { + "epoch": 1.84, + "learning_rate": 2.421056349042182e-05, + "loss": 0.0048, + "step": 364430 + }, + { + "epoch": 1.84, + "learning_rate": 2.420299579740781e-05, + "loss": 0.0057, + "step": 364440 + }, + { + "epoch": 1.84, + "learning_rate": 2.41954281043938e-05, + "loss": 0.0048, + "step": 364450 + }, + { + "epoch": 1.84, + "learning_rate": 2.418786041137979e-05, + "loss": 0.0048, + "step": 364460 + }, + { + "epoch": 1.84, + "learning_rate": 2.418029271836578e-05, + "loss": 0.0061, + "step": 364470 + }, + { + "epoch": 1.84, + "learning_rate": 2.417272502535177e-05, + "loss": 0.0056, + "step": 364480 + }, + { + "epoch": 1.84, + "learning_rate": 2.416515733233776e-05, + "loss": 0.0045, + "step": 364490 + }, + { + "epoch": 1.84, + "learning_rate": 2.415758963932375e-05, + "loss": 0.005, + "step": 364500 + }, + { + "epoch": 1.84, + "learning_rate": 2.415002194630974e-05, + "loss": 0.0048, + "step": 364510 + }, + { + "epoch": 1.84, + "learning_rate": 2.414245425329573e-05, + "loss": 0.0047, + "step": 364520 + }, + { + "epoch": 1.84, + "learning_rate": 2.413488656028172e-05, + "loss": 0.0063, + "step": 364530 + }, + { + "epoch": 1.84, + "learning_rate": 2.412731886726771e-05, + "loss": 0.0065, + "step": 364540 + }, + { + "epoch": 1.84, + "learning_rate": 2.41197511742537e-05, + "loss": 0.0071, + "step": 364550 + }, + { + "epoch": 1.84, + "learning_rate": 2.4112183481239688e-05, + "loss": 0.0055, + "step": 364560 + }, + { + "epoch": 1.84, + "learning_rate": 2.410461578822568e-05, + "loss": 0.0047, + "step": 364570 + }, + { + "epoch": 1.84, + "learning_rate": 2.4097048095211665e-05, + "loss": 0.0059, + "step": 364580 + }, + { + "epoch": 1.84, + "learning_rate": 2.4089480402197653e-05, + "loss": 0.0064, + "step": 364590 + }, + { + "epoch": 1.84, + "learning_rate": 2.4081912709183644e-05, + "loss": 0.0052, + "step": 364600 + }, + { + "epoch": 1.84, + "learning_rate": 2.4074345016169633e-05, + "loss": 0.0067, + "step": 364610 + }, + { + "epoch": 1.84, + "learning_rate": 2.4066777323155624e-05, + "loss": 0.0045, + "step": 364620 + }, + { + "epoch": 1.84, + "learning_rate": 2.4059209630141612e-05, + "loss": 0.0077, + "step": 364630 + }, + { + "epoch": 1.84, + "learning_rate": 2.4051641937127604e-05, + "loss": 0.0061, + "step": 364640 + }, + { + "epoch": 1.84, + "learning_rate": 2.4044074244113592e-05, + "loss": 0.0049, + "step": 364650 + }, + { + "epoch": 1.84, + "learning_rate": 2.4036506551099584e-05, + "loss": 0.0055, + "step": 364660 + }, + { + "epoch": 1.84, + "learning_rate": 2.4028938858085575e-05, + "loss": 0.0048, + "step": 364670 + }, + { + "epoch": 1.84, + "learning_rate": 2.4021371165071564e-05, + "loss": 0.0047, + "step": 364680 + }, + { + "epoch": 1.84, + "learning_rate": 2.4013803472057555e-05, + "loss": 0.0062, + "step": 364690 + }, + { + "epoch": 1.84, + "learning_rate": 2.4006235779043544e-05, + "loss": 0.0066, + "step": 364700 + }, + { + "epoch": 1.84, + "learning_rate": 2.3998668086029535e-05, + "loss": 0.0053, + "step": 364710 + }, + { + "epoch": 1.84, + "learning_rate": 2.3991100393015523e-05, + "loss": 0.0043, + "step": 364720 + }, + { + "epoch": 1.84, + "learning_rate": 2.3983532700001515e-05, + "loss": 0.0054, + "step": 364730 + }, + { + "epoch": 1.84, + "learning_rate": 2.39759650069875e-05, + "loss": 0.0055, + "step": 364740 + }, + { + "epoch": 1.84, + "learning_rate": 2.3968397313973488e-05, + "loss": 0.0058, + "step": 364750 + }, + { + "epoch": 1.84, + "learning_rate": 2.396082962095948e-05, + "loss": 0.0056, + "step": 364760 + }, + { + "epoch": 1.84, + "learning_rate": 2.3953261927945468e-05, + "loss": 0.0051, + "step": 364770 + }, + { + "epoch": 1.84, + "learning_rate": 2.394569423493146e-05, + "loss": 0.0061, + "step": 364780 + }, + { + "epoch": 1.84, + "learning_rate": 2.3938126541917448e-05, + "loss": 0.0068, + "step": 364790 + }, + { + "epoch": 1.84, + "learning_rate": 2.393055884890344e-05, + "loss": 0.0056, + "step": 364800 + }, + { + "epoch": 1.84, + "learning_rate": 2.3922991155889427e-05, + "loss": 0.0046, + "step": 364810 + }, + { + "epoch": 1.84, + "learning_rate": 2.391542346287542e-05, + "loss": 0.0066, + "step": 364820 + }, + { + "epoch": 1.84, + "learning_rate": 2.3907855769861407e-05, + "loss": 0.0063, + "step": 364830 + }, + { + "epoch": 1.84, + "learning_rate": 2.39002880768474e-05, + "loss": 0.0067, + "step": 364840 + }, + { + "epoch": 1.84, + "learning_rate": 2.3892720383833387e-05, + "loss": 0.0056, + "step": 364850 + }, + { + "epoch": 1.84, + "learning_rate": 2.388515269081938e-05, + "loss": 0.0039, + "step": 364860 + }, + { + "epoch": 1.84, + "learning_rate": 2.3877584997805367e-05, + "loss": 0.0083, + "step": 364870 + }, + { + "epoch": 1.84, + "learning_rate": 2.387001730479136e-05, + "loss": 0.0064, + "step": 364880 + }, + { + "epoch": 1.84, + "learning_rate": 2.3862449611777343e-05, + "loss": 0.0097, + "step": 364890 + }, + { + "epoch": 1.84, + "learning_rate": 2.3854881918763335e-05, + "loss": 0.0063, + "step": 364900 + }, + { + "epoch": 1.84, + "learning_rate": 2.3847314225749323e-05, + "loss": 0.0059, + "step": 364910 + }, + { + "epoch": 1.84, + "learning_rate": 2.3839746532735315e-05, + "loss": 0.0048, + "step": 364920 + }, + { + "epoch": 1.84, + "learning_rate": 2.3832178839721303e-05, + "loss": 0.0045, + "step": 364930 + }, + { + "epoch": 1.84, + "learning_rate": 2.3824611146707295e-05, + "loss": 0.0064, + "step": 364940 + }, + { + "epoch": 1.84, + "learning_rate": 2.3817043453693283e-05, + "loss": 0.0047, + "step": 364950 + }, + { + "epoch": 1.84, + "learning_rate": 2.3809475760679274e-05, + "loss": 0.0058, + "step": 364960 + }, + { + "epoch": 1.84, + "learning_rate": 2.3801908067665263e-05, + "loss": 0.0059, + "step": 364970 + }, + { + "epoch": 1.84, + "learning_rate": 2.3794340374651254e-05, + "loss": 0.004, + "step": 364980 + }, + { + "epoch": 1.84, + "learning_rate": 2.3786772681637243e-05, + "loss": 0.0045, + "step": 364990 + }, + { + "epoch": 1.84, + "learning_rate": 2.3779204988623234e-05, + "loss": 0.0054, + "step": 365000 + }, + { + "epoch": 1.84, + "eval_cer": 0.9144207657007667, + "eval_loss": 0.0044406414963305, + "eval_runtime": 116.6279, + "eval_samples_per_second": 17.149, + "eval_steps_per_second": 4.287, + "step": 365000 + }, + { + "epoch": 1.84, + "learning_rate": 2.3771637295609222e-05, + "loss": 0.004, + "step": 365010 + }, + { + "epoch": 1.84, + "learning_rate": 2.3764069602595214e-05, + "loss": 0.0067, + "step": 365020 + }, + { + "epoch": 1.84, + "learning_rate": 2.3756501909581202e-05, + "loss": 0.0058, + "step": 365030 + }, + { + "epoch": 1.84, + "learning_rate": 2.3748934216567194e-05, + "loss": 0.0055, + "step": 365040 + }, + { + "epoch": 1.84, + "learning_rate": 2.374136652355318e-05, + "loss": 0.0063, + "step": 365050 + }, + { + "epoch": 1.84, + "learning_rate": 2.373379883053917e-05, + "loss": 0.0056, + "step": 365060 + }, + { + "epoch": 1.84, + "learning_rate": 2.372623113752516e-05, + "loss": 0.007, + "step": 365070 + }, + { + "epoch": 1.84, + "learning_rate": 2.371866344451115e-05, + "loss": 0.0063, + "step": 365080 + }, + { + "epoch": 1.84, + "learning_rate": 2.3711095751497138e-05, + "loss": 0.0058, + "step": 365090 + }, + { + "epoch": 1.84, + "learning_rate": 2.370352805848313e-05, + "loss": 0.0053, + "step": 365100 + }, + { + "epoch": 1.84, + "learning_rate": 2.3695960365469118e-05, + "loss": 0.0065, + "step": 365110 + }, + { + "epoch": 1.84, + "learning_rate": 2.368839267245511e-05, + "loss": 0.0032, + "step": 365120 + }, + { + "epoch": 1.84, + "learning_rate": 2.3680824979441098e-05, + "loss": 0.0056, + "step": 365130 + }, + { + "epoch": 1.84, + "learning_rate": 2.367325728642709e-05, + "loss": 0.0047, + "step": 365140 + }, + { + "epoch": 1.84, + "learning_rate": 2.3665689593413078e-05, + "loss": 0.0051, + "step": 365150 + }, + { + "epoch": 1.84, + "learning_rate": 2.365812190039907e-05, + "loss": 0.0054, + "step": 365160 + }, + { + "epoch": 1.84, + "learning_rate": 2.3650554207385058e-05, + "loss": 0.0056, + "step": 365170 + }, + { + "epoch": 1.84, + "learning_rate": 2.364298651437105e-05, + "loss": 0.0054, + "step": 365180 + }, + { + "epoch": 1.84, + "learning_rate": 2.3635418821357037e-05, + "loss": 0.005, + "step": 365190 + }, + { + "epoch": 1.84, + "learning_rate": 2.362785112834303e-05, + "loss": 0.0056, + "step": 365200 + }, + { + "epoch": 1.84, + "learning_rate": 2.3620283435329014e-05, + "loss": 0.0072, + "step": 365210 + }, + { + "epoch": 1.84, + "learning_rate": 2.3612715742315005e-05, + "loss": 0.0042, + "step": 365220 + }, + { + "epoch": 1.84, + "learning_rate": 2.3605148049300994e-05, + "loss": 0.0073, + "step": 365230 + }, + { + "epoch": 1.84, + "learning_rate": 2.3597580356286985e-05, + "loss": 0.0079, + "step": 365240 + }, + { + "epoch": 1.84, + "learning_rate": 2.3590012663272973e-05, + "loss": 0.0054, + "step": 365250 + }, + { + "epoch": 1.84, + "learning_rate": 2.3582444970258965e-05, + "loss": 0.0055, + "step": 365260 + }, + { + "epoch": 1.84, + "learning_rate": 2.3574877277244953e-05, + "loss": 0.0067, + "step": 365270 + }, + { + "epoch": 1.84, + "learning_rate": 2.3567309584230945e-05, + "loss": 0.0083, + "step": 365280 + }, + { + "epoch": 1.84, + "learning_rate": 2.3559741891216933e-05, + "loss": 0.0051, + "step": 365290 + }, + { + "epoch": 1.84, + "learning_rate": 2.3552174198202925e-05, + "loss": 0.0046, + "step": 365300 + }, + { + "epoch": 1.84, + "learning_rate": 2.3544606505188913e-05, + "loss": 0.0056, + "step": 365310 + }, + { + "epoch": 1.84, + "learning_rate": 2.3537038812174905e-05, + "loss": 0.0059, + "step": 365320 + }, + { + "epoch": 1.84, + "learning_rate": 2.3529471119160893e-05, + "loss": 0.0046, + "step": 365330 + }, + { + "epoch": 1.84, + "learning_rate": 2.3521903426146884e-05, + "loss": 0.0064, + "step": 365340 + }, + { + "epoch": 1.84, + "learning_rate": 2.3514335733132873e-05, + "loss": 0.0057, + "step": 365350 + }, + { + "epoch": 1.84, + "learning_rate": 2.3506768040118864e-05, + "loss": 0.0059, + "step": 365360 + }, + { + "epoch": 1.84, + "learning_rate": 2.349920034710485e-05, + "loss": 0.0049, + "step": 365370 + }, + { + "epoch": 1.84, + "learning_rate": 2.3491632654090837e-05, + "loss": 0.0061, + "step": 365380 + }, + { + "epoch": 1.84, + "learning_rate": 2.348406496107683e-05, + "loss": 0.0052, + "step": 365390 + }, + { + "epoch": 1.84, + "learning_rate": 2.347649726806282e-05, + "loss": 0.0071, + "step": 365400 + }, + { + "epoch": 1.84, + "learning_rate": 2.346892957504881e-05, + "loss": 0.0056, + "step": 365410 + }, + { + "epoch": 1.84, + "learning_rate": 2.34613618820348e-05, + "loss": 0.006, + "step": 365420 + }, + { + "epoch": 1.84, + "learning_rate": 2.345379418902079e-05, + "loss": 0.0054, + "step": 365430 + }, + { + "epoch": 1.84, + "learning_rate": 2.344622649600678e-05, + "loss": 0.0058, + "step": 365440 + }, + { + "epoch": 1.84, + "learning_rate": 2.343865880299277e-05, + "loss": 0.0073, + "step": 365450 + }, + { + "epoch": 1.84, + "learning_rate": 2.343109110997876e-05, + "loss": 0.0074, + "step": 365460 + }, + { + "epoch": 1.84, + "learning_rate": 2.3423523416964748e-05, + "loss": 0.0055, + "step": 365470 + }, + { + "epoch": 1.84, + "learning_rate": 2.341595572395074e-05, + "loss": 0.0062, + "step": 365480 + }, + { + "epoch": 1.84, + "learning_rate": 2.3408388030936728e-05, + "loss": 0.0054, + "step": 365490 + }, + { + "epoch": 1.84, + "learning_rate": 2.340082033792272e-05, + "loss": 0.0058, + "step": 365500 + }, + { + "epoch": 1.84, + "learning_rate": 2.3393252644908708e-05, + "loss": 0.0069, + "step": 365510 + }, + { + "epoch": 1.84, + "learning_rate": 2.3385684951894693e-05, + "loss": 0.0055, + "step": 365520 + }, + { + "epoch": 1.84, + "learning_rate": 2.3378117258880684e-05, + "loss": 0.0055, + "step": 365530 + }, + { + "epoch": 1.84, + "learning_rate": 2.3370549565866672e-05, + "loss": 0.0039, + "step": 365540 + }, + { + "epoch": 1.84, + "learning_rate": 2.3362981872852664e-05, + "loss": 0.0066, + "step": 365550 + }, + { + "epoch": 1.84, + "learning_rate": 2.3355414179838652e-05, + "loss": 0.0055, + "step": 365560 + }, + { + "epoch": 1.84, + "learning_rate": 2.3347846486824644e-05, + "loss": 0.0081, + "step": 365570 + }, + { + "epoch": 1.84, + "learning_rate": 2.3340278793810632e-05, + "loss": 0.0068, + "step": 365580 + }, + { + "epoch": 1.84, + "learning_rate": 2.3332711100796624e-05, + "loss": 0.0064, + "step": 365590 + }, + { + "epoch": 1.84, + "learning_rate": 2.3325143407782612e-05, + "loss": 0.0052, + "step": 365600 + }, + { + "epoch": 1.84, + "learning_rate": 2.3317575714768604e-05, + "loss": 0.0057, + "step": 365610 + }, + { + "epoch": 1.84, + "learning_rate": 2.3310008021754592e-05, + "loss": 0.0037, + "step": 365620 + }, + { + "epoch": 1.84, + "learning_rate": 2.3302440328740583e-05, + "loss": 0.0042, + "step": 365630 + }, + { + "epoch": 1.84, + "learning_rate": 2.3294872635726575e-05, + "loss": 0.0054, + "step": 365640 + }, + { + "epoch": 1.84, + "learning_rate": 2.3287304942712563e-05, + "loss": 0.0048, + "step": 365650 + }, + { + "epoch": 1.84, + "learning_rate": 2.3279737249698555e-05, + "loss": 0.0053, + "step": 365660 + }, + { + "epoch": 1.84, + "learning_rate": 2.3272169556684543e-05, + "loss": 0.0039, + "step": 365670 + }, + { + "epoch": 1.84, + "learning_rate": 2.3264601863670528e-05, + "loss": 0.005, + "step": 365680 + }, + { + "epoch": 1.84, + "learning_rate": 2.325703417065652e-05, + "loss": 0.0067, + "step": 365690 + }, + { + "epoch": 1.84, + "learning_rate": 2.3249466477642508e-05, + "loss": 0.0058, + "step": 365700 + }, + { + "epoch": 1.85, + "learning_rate": 2.32418987846285e-05, + "loss": 0.0065, + "step": 365710 + }, + { + "epoch": 1.85, + "learning_rate": 2.3234331091614488e-05, + "loss": 0.0055, + "step": 365720 + }, + { + "epoch": 1.85, + "learning_rate": 2.322676339860048e-05, + "loss": 0.0078, + "step": 365730 + }, + { + "epoch": 1.85, + "learning_rate": 2.3219195705586467e-05, + "loss": 0.0055, + "step": 365740 + }, + { + "epoch": 1.85, + "learning_rate": 2.321162801257246e-05, + "loss": 0.0074, + "step": 365750 + }, + { + "epoch": 1.85, + "learning_rate": 2.3204060319558447e-05, + "loss": 0.0057, + "step": 365760 + }, + { + "epoch": 1.85, + "learning_rate": 2.319649262654444e-05, + "loss": 0.006, + "step": 365770 + }, + { + "epoch": 1.85, + "learning_rate": 2.3188924933530427e-05, + "loss": 0.0105, + "step": 365780 + }, + { + "epoch": 1.85, + "learning_rate": 2.318135724051642e-05, + "loss": 0.0054, + "step": 365790 + }, + { + "epoch": 1.85, + "learning_rate": 2.3173789547502407e-05, + "loss": 0.0059, + "step": 365800 + }, + { + "epoch": 1.85, + "learning_rate": 2.31662218544884e-05, + "loss": 0.0075, + "step": 365810 + }, + { + "epoch": 1.85, + "learning_rate": 2.3158654161474387e-05, + "loss": 0.0051, + "step": 365820 + }, + { + "epoch": 1.85, + "learning_rate": 2.3151086468460378e-05, + "loss": 0.0066, + "step": 365830 + }, + { + "epoch": 1.85, + "learning_rate": 2.3143518775446363e-05, + "loss": 0.0042, + "step": 365840 + }, + { + "epoch": 1.85, + "learning_rate": 2.3135951082432355e-05, + "loss": 0.0051, + "step": 365850 + }, + { + "epoch": 1.85, + "learning_rate": 2.3128383389418343e-05, + "loss": 0.0064, + "step": 365860 + }, + { + "epoch": 1.85, + "learning_rate": 2.3120815696404335e-05, + "loss": 0.0054, + "step": 365870 + }, + { + "epoch": 1.85, + "learning_rate": 2.3113248003390323e-05, + "loss": 0.0041, + "step": 365880 + }, + { + "epoch": 1.85, + "learning_rate": 2.3105680310376314e-05, + "loss": 0.0057, + "step": 365890 + }, + { + "epoch": 1.85, + "learning_rate": 2.3098112617362303e-05, + "loss": 0.0057, + "step": 365900 + }, + { + "epoch": 1.85, + "learning_rate": 2.3090544924348294e-05, + "loss": 0.0064, + "step": 365910 + }, + { + "epoch": 1.85, + "learning_rate": 2.3082977231334282e-05, + "loss": 0.0051, + "step": 365920 + }, + { + "epoch": 1.85, + "learning_rate": 2.3075409538320274e-05, + "loss": 0.0053, + "step": 365930 + }, + { + "epoch": 1.85, + "learning_rate": 2.3067841845306262e-05, + "loss": 0.0063, + "step": 365940 + }, + { + "epoch": 1.85, + "learning_rate": 2.3060274152292254e-05, + "loss": 0.0064, + "step": 365950 + }, + { + "epoch": 1.85, + "learning_rate": 2.3052706459278242e-05, + "loss": 0.0065, + "step": 365960 + }, + { + "epoch": 1.85, + "learning_rate": 2.3045138766264234e-05, + "loss": 0.0063, + "step": 365970 + }, + { + "epoch": 1.85, + "learning_rate": 2.3037571073250222e-05, + "loss": 0.0052, + "step": 365980 + }, + { + "epoch": 1.85, + "learning_rate": 2.303000338023621e-05, + "loss": 0.0091, + "step": 365990 + }, + { + "epoch": 1.85, + "learning_rate": 2.30224356872222e-05, + "loss": 0.0038, + "step": 366000 + }, + { + "epoch": 1.85, + "eval_cer": 0.914423676889143, + "eval_loss": 0.004396693781018257, + "eval_runtime": 116.8468, + "eval_samples_per_second": 17.116, + "eval_steps_per_second": 4.279, + "step": 366000 + }, + { + "epoch": 1.85, + "learning_rate": 2.301486799420819e-05, + "loss": 0.0056, + "step": 366010 + }, + { + "epoch": 1.85, + "learning_rate": 2.3007300301194178e-05, + "loss": 0.005, + "step": 366020 + }, + { + "epoch": 1.85, + "learning_rate": 2.299973260818017e-05, + "loss": 0.0065, + "step": 366030 + }, + { + "epoch": 1.85, + "learning_rate": 2.2992164915166158e-05, + "loss": 0.0061, + "step": 366040 + }, + { + "epoch": 1.85, + "learning_rate": 2.298459722215215e-05, + "loss": 0.0049, + "step": 366050 + }, + { + "epoch": 1.85, + "learning_rate": 2.2977029529138138e-05, + "loss": 0.0045, + "step": 366060 + }, + { + "epoch": 1.85, + "learning_rate": 2.296946183612413e-05, + "loss": 0.0051, + "step": 366070 + }, + { + "epoch": 1.85, + "learning_rate": 2.2961894143110118e-05, + "loss": 0.006, + "step": 366080 + }, + { + "epoch": 1.85, + "learning_rate": 2.295432645009611e-05, + "loss": 0.0051, + "step": 366090 + }, + { + "epoch": 1.85, + "learning_rate": 2.2946758757082097e-05, + "loss": 0.0056, + "step": 366100 + }, + { + "epoch": 1.85, + "learning_rate": 2.293919106406809e-05, + "loss": 0.0087, + "step": 366110 + }, + { + "epoch": 1.85, + "learning_rate": 2.2931623371054077e-05, + "loss": 0.0076, + "step": 366120 + }, + { + "epoch": 1.85, + "learning_rate": 2.292405567804007e-05, + "loss": 0.0091, + "step": 366130 + }, + { + "epoch": 1.85, + "learning_rate": 2.2916487985026057e-05, + "loss": 0.0043, + "step": 366140 + }, + { + "epoch": 1.85, + "learning_rate": 2.2908920292012045e-05, + "loss": 0.0055, + "step": 366150 + }, + { + "epoch": 1.85, + "learning_rate": 2.2901352598998034e-05, + "loss": 0.0061, + "step": 366160 + }, + { + "epoch": 1.85, + "learning_rate": 2.2893784905984025e-05, + "loss": 0.006, + "step": 366170 + }, + { + "epoch": 1.85, + "learning_rate": 2.2886217212970013e-05, + "loss": 0.0042, + "step": 366180 + }, + { + "epoch": 1.85, + "learning_rate": 2.2878649519956005e-05, + "loss": 0.0045, + "step": 366190 + }, + { + "epoch": 1.85, + "learning_rate": 2.2871081826941993e-05, + "loss": 0.0049, + "step": 366200 + }, + { + "epoch": 1.85, + "learning_rate": 2.2863514133927985e-05, + "loss": 0.0078, + "step": 366210 + }, + { + "epoch": 1.85, + "learning_rate": 2.2855946440913973e-05, + "loss": 0.007, + "step": 366220 + }, + { + "epoch": 1.85, + "learning_rate": 2.2848378747899965e-05, + "loss": 0.0053, + "step": 366230 + }, + { + "epoch": 1.85, + "learning_rate": 2.2840811054885953e-05, + "loss": 0.006, + "step": 366240 + }, + { + "epoch": 1.85, + "learning_rate": 2.2833243361871944e-05, + "loss": 0.0057, + "step": 366250 + }, + { + "epoch": 1.85, + "learning_rate": 2.2825675668857933e-05, + "loss": 0.0073, + "step": 366260 + }, + { + "epoch": 1.85, + "learning_rate": 2.2818107975843924e-05, + "loss": 0.0053, + "step": 366270 + }, + { + "epoch": 1.85, + "learning_rate": 2.2810540282829912e-05, + "loss": 0.005, + "step": 366280 + }, + { + "epoch": 1.85, + "learning_rate": 2.2802972589815904e-05, + "loss": 0.0056, + "step": 366290 + }, + { + "epoch": 1.85, + "learning_rate": 2.2795404896801892e-05, + "loss": 0.0051, + "step": 366300 + }, + { + "epoch": 1.85, + "learning_rate": 2.2787837203787877e-05, + "loss": 0.0057, + "step": 366310 + }, + { + "epoch": 1.85, + "learning_rate": 2.278026951077387e-05, + "loss": 0.0084, + "step": 366320 + }, + { + "epoch": 1.85, + "learning_rate": 2.2772701817759857e-05, + "loss": 0.005, + "step": 366330 + }, + { + "epoch": 1.85, + "learning_rate": 2.276513412474585e-05, + "loss": 0.0068, + "step": 366340 + }, + { + "epoch": 1.85, + "learning_rate": 2.2757566431731837e-05, + "loss": 0.0077, + "step": 366350 + }, + { + "epoch": 1.85, + "learning_rate": 2.274999873871783e-05, + "loss": 0.005, + "step": 366360 + }, + { + "epoch": 1.85, + "learning_rate": 2.274243104570382e-05, + "loss": 0.0065, + "step": 366370 + }, + { + "epoch": 1.85, + "learning_rate": 2.2734863352689808e-05, + "loss": 0.0048, + "step": 366380 + }, + { + "epoch": 1.85, + "learning_rate": 2.27272956596758e-05, + "loss": 0.0069, + "step": 366390 + }, + { + "epoch": 1.85, + "learning_rate": 2.2719727966661788e-05, + "loss": 0.0067, + "step": 366400 + }, + { + "epoch": 1.85, + "learning_rate": 2.271216027364778e-05, + "loss": 0.0062, + "step": 366410 + }, + { + "epoch": 1.85, + "learning_rate": 2.2704592580633768e-05, + "loss": 0.0051, + "step": 366420 + }, + { + "epoch": 1.85, + "learning_rate": 2.269702488761976e-05, + "loss": 0.0047, + "step": 366430 + }, + { + "epoch": 1.85, + "learning_rate": 2.2689457194605748e-05, + "loss": 0.0062, + "step": 366440 + }, + { + "epoch": 1.85, + "learning_rate": 2.268188950159174e-05, + "loss": 0.0053, + "step": 366450 + }, + { + "epoch": 1.85, + "learning_rate": 2.2674321808577728e-05, + "loss": 0.006, + "step": 366460 + }, + { + "epoch": 1.85, + "learning_rate": 2.2666754115563712e-05, + "loss": 0.0065, + "step": 366470 + }, + { + "epoch": 1.85, + "learning_rate": 2.2659186422549704e-05, + "loss": 0.0086, + "step": 366480 + }, + { + "epoch": 1.85, + "learning_rate": 2.2651618729535692e-05, + "loss": 0.0059, + "step": 366490 + }, + { + "epoch": 1.85, + "learning_rate": 2.2644051036521684e-05, + "loss": 0.0064, + "step": 366500 + }, + { + "epoch": 1.85, + "learning_rate": 2.2636483343507672e-05, + "loss": 0.0068, + "step": 366510 + }, + { + "epoch": 1.85, + "learning_rate": 2.2628915650493664e-05, + "loss": 0.0054, + "step": 366520 + }, + { + "epoch": 1.85, + "learning_rate": 2.2621347957479652e-05, + "loss": 0.0053, + "step": 366530 + }, + { + "epoch": 1.85, + "learning_rate": 2.2613780264465643e-05, + "loss": 0.0063, + "step": 366540 + }, + { + "epoch": 1.85, + "learning_rate": 2.260621257145163e-05, + "loss": 0.0059, + "step": 366550 + }, + { + "epoch": 1.85, + "learning_rate": 2.2598644878437623e-05, + "loss": 0.0059, + "step": 366560 + }, + { + "epoch": 1.85, + "learning_rate": 2.259107718542361e-05, + "loss": 0.005, + "step": 366570 + }, + { + "epoch": 1.85, + "learning_rate": 2.2583509492409603e-05, + "loss": 0.0065, + "step": 366580 + }, + { + "epoch": 1.85, + "learning_rate": 2.257594179939559e-05, + "loss": 0.0045, + "step": 366590 + }, + { + "epoch": 1.85, + "learning_rate": 2.2568374106381583e-05, + "loss": 0.0062, + "step": 366600 + }, + { + "epoch": 1.85, + "learning_rate": 2.256080641336757e-05, + "loss": 0.0068, + "step": 366610 + }, + { + "epoch": 1.85, + "learning_rate": 2.255323872035356e-05, + "loss": 0.0078, + "step": 366620 + }, + { + "epoch": 1.85, + "learning_rate": 2.2545671027339548e-05, + "loss": 0.0067, + "step": 366630 + }, + { + "epoch": 1.85, + "learning_rate": 2.253810333432554e-05, + "loss": 0.0056, + "step": 366640 + }, + { + "epoch": 1.85, + "learning_rate": 2.2530535641311527e-05, + "loss": 0.0059, + "step": 366650 + }, + { + "epoch": 1.85, + "learning_rate": 2.252296794829752e-05, + "loss": 0.008, + "step": 366660 + }, + { + "epoch": 1.85, + "learning_rate": 2.2515400255283507e-05, + "loss": 0.0044, + "step": 366670 + }, + { + "epoch": 1.85, + "learning_rate": 2.25078325622695e-05, + "loss": 0.0053, + "step": 366680 + }, + { + "epoch": 1.85, + "learning_rate": 2.2500264869255487e-05, + "loss": 0.0057, + "step": 366690 + }, + { + "epoch": 1.85, + "learning_rate": 2.249269717624148e-05, + "loss": 0.0053, + "step": 366700 + }, + { + "epoch": 1.85, + "learning_rate": 2.2485129483227467e-05, + "loss": 0.0041, + "step": 366710 + }, + { + "epoch": 1.85, + "learning_rate": 2.247756179021346e-05, + "loss": 0.0064, + "step": 366720 + }, + { + "epoch": 1.85, + "learning_rate": 2.2469994097199447e-05, + "loss": 0.007, + "step": 366730 + }, + { + "epoch": 1.85, + "learning_rate": 2.246242640418544e-05, + "loss": 0.0075, + "step": 366740 + }, + { + "epoch": 1.85, + "learning_rate": 2.2454858711171427e-05, + "loss": 0.007, + "step": 366750 + }, + { + "epoch": 1.85, + "learning_rate": 2.2447291018157418e-05, + "loss": 0.0063, + "step": 366760 + }, + { + "epoch": 1.85, + "learning_rate": 2.2439723325143406e-05, + "loss": 0.007, + "step": 366770 + }, + { + "epoch": 1.85, + "learning_rate": 2.2432155632129395e-05, + "loss": 0.0046, + "step": 366780 + }, + { + "epoch": 1.85, + "learning_rate": 2.2424587939115383e-05, + "loss": 0.0059, + "step": 366790 + }, + { + "epoch": 1.85, + "learning_rate": 2.2417020246101374e-05, + "loss": 0.0092, + "step": 366800 + }, + { + "epoch": 1.85, + "learning_rate": 2.2409452553087363e-05, + "loss": 0.0059, + "step": 366810 + }, + { + "epoch": 1.85, + "learning_rate": 2.2401884860073354e-05, + "loss": 0.0065, + "step": 366820 + }, + { + "epoch": 1.85, + "learning_rate": 2.2394317167059342e-05, + "loss": 0.0085, + "step": 366830 + }, + { + "epoch": 1.85, + "learning_rate": 2.2386749474045334e-05, + "loss": 0.0045, + "step": 366840 + }, + { + "epoch": 1.85, + "learning_rate": 2.2379181781031322e-05, + "loss": 0.0069, + "step": 366850 + }, + { + "epoch": 1.85, + "learning_rate": 2.2371614088017314e-05, + "loss": 0.0078, + "step": 366860 + }, + { + "epoch": 1.85, + "learning_rate": 2.2364046395003302e-05, + "loss": 0.0075, + "step": 366870 + }, + { + "epoch": 1.85, + "learning_rate": 2.2356478701989294e-05, + "loss": 0.0053, + "step": 366880 + }, + { + "epoch": 1.85, + "learning_rate": 2.2348911008975282e-05, + "loss": 0.0076, + "step": 366890 + }, + { + "epoch": 1.85, + "learning_rate": 2.2341343315961274e-05, + "loss": 0.0053, + "step": 366900 + }, + { + "epoch": 1.85, + "learning_rate": 2.2333775622947262e-05, + "loss": 0.0082, + "step": 366910 + }, + { + "epoch": 1.85, + "learning_rate": 2.2326207929933253e-05, + "loss": 0.0058, + "step": 366920 + }, + { + "epoch": 1.85, + "learning_rate": 2.231864023691924e-05, + "loss": 0.0041, + "step": 366930 + }, + { + "epoch": 1.85, + "learning_rate": 2.231107254390523e-05, + "loss": 0.0062, + "step": 366940 + }, + { + "epoch": 1.85, + "learning_rate": 2.2303504850891218e-05, + "loss": 0.0054, + "step": 366950 + }, + { + "epoch": 1.85, + "learning_rate": 2.229593715787721e-05, + "loss": 0.0057, + "step": 366960 + }, + { + "epoch": 1.85, + "learning_rate": 2.2288369464863198e-05, + "loss": 0.0066, + "step": 366970 + }, + { + "epoch": 1.85, + "learning_rate": 2.228080177184919e-05, + "loss": 0.0067, + "step": 366980 + }, + { + "epoch": 1.85, + "learning_rate": 2.2273234078835178e-05, + "loss": 0.0079, + "step": 366990 + }, + { + "epoch": 1.85, + "learning_rate": 2.226566638582117e-05, + "loss": 0.0065, + "step": 367000 + }, + { + "epoch": 1.85, + "eval_cer": 0.9144217360968921, + "eval_loss": 0.004412375390529633, + "eval_runtime": 116.7639, + "eval_samples_per_second": 17.129, + "eval_steps_per_second": 4.282, + "step": 367000 + }, + { + "epoch": 1.85, + "learning_rate": 2.2258098692807157e-05, + "loss": 0.0051, + "step": 367010 + }, + { + "epoch": 1.85, + "learning_rate": 2.225053099979315e-05, + "loss": 0.0068, + "step": 367020 + }, + { + "epoch": 1.85, + "learning_rate": 2.2242963306779137e-05, + "loss": 0.0064, + "step": 367030 + }, + { + "epoch": 1.85, + "learning_rate": 2.223539561376513e-05, + "loss": 0.0049, + "step": 367040 + }, + { + "epoch": 1.85, + "learning_rate": 2.2227827920751117e-05, + "loss": 0.0059, + "step": 367050 + }, + { + "epoch": 1.85, + "learning_rate": 2.222026022773711e-05, + "loss": 0.0046, + "step": 367060 + }, + { + "epoch": 1.85, + "learning_rate": 2.2212692534723097e-05, + "loss": 0.0066, + "step": 367070 + }, + { + "epoch": 1.85, + "learning_rate": 2.220512484170909e-05, + "loss": 0.0048, + "step": 367080 + }, + { + "epoch": 1.85, + "learning_rate": 2.2197557148695073e-05, + "loss": 0.0056, + "step": 367090 + }, + { + "epoch": 1.85, + "learning_rate": 2.2189989455681065e-05, + "loss": 0.0052, + "step": 367100 + }, + { + "epoch": 1.85, + "learning_rate": 2.2182421762667053e-05, + "loss": 0.0046, + "step": 367110 + }, + { + "epoch": 1.85, + "learning_rate": 2.2174854069653045e-05, + "loss": 0.007, + "step": 367120 + }, + { + "epoch": 1.85, + "learning_rate": 2.2167286376639033e-05, + "loss": 0.0026, + "step": 367130 + }, + { + "epoch": 1.85, + "learning_rate": 2.2159718683625025e-05, + "loss": 0.0067, + "step": 367140 + }, + { + "epoch": 1.85, + "learning_rate": 2.2152150990611013e-05, + "loss": 0.007, + "step": 367150 + }, + { + "epoch": 1.85, + "learning_rate": 2.2144583297597004e-05, + "loss": 0.0064, + "step": 367160 + }, + { + "epoch": 1.85, + "learning_rate": 2.2137015604582993e-05, + "loss": 0.0058, + "step": 367170 + }, + { + "epoch": 1.85, + "learning_rate": 2.2129447911568984e-05, + "loss": 0.0055, + "step": 367180 + }, + { + "epoch": 1.85, + "learning_rate": 2.2121880218554973e-05, + "loss": 0.0045, + "step": 367190 + }, + { + "epoch": 1.85, + "learning_rate": 2.2114312525540964e-05, + "loss": 0.0054, + "step": 367200 + }, + { + "epoch": 1.85, + "learning_rate": 2.2106744832526952e-05, + "loss": 0.0062, + "step": 367210 + }, + { + "epoch": 1.85, + "learning_rate": 2.2099177139512944e-05, + "loss": 0.0056, + "step": 367220 + }, + { + "epoch": 1.85, + "learning_rate": 2.2091609446498932e-05, + "loss": 0.0058, + "step": 367230 + }, + { + "epoch": 1.85, + "learning_rate": 2.2084041753484924e-05, + "loss": 0.0061, + "step": 367240 + }, + { + "epoch": 1.85, + "learning_rate": 2.207647406047091e-05, + "loss": 0.0057, + "step": 367250 + }, + { + "epoch": 1.85, + "learning_rate": 2.2068906367456897e-05, + "loss": 0.0045, + "step": 367260 + }, + { + "epoch": 1.85, + "learning_rate": 2.206133867444289e-05, + "loss": 0.006, + "step": 367270 + }, + { + "epoch": 1.85, + "learning_rate": 2.2053770981428877e-05, + "loss": 0.0064, + "step": 367280 + }, + { + "epoch": 1.85, + "learning_rate": 2.2046203288414868e-05, + "loss": 0.0075, + "step": 367290 + }, + { + "epoch": 1.85, + "learning_rate": 2.2038635595400856e-05, + "loss": 0.0054, + "step": 367300 + }, + { + "epoch": 1.85, + "learning_rate": 2.2031067902386848e-05, + "loss": 0.0074, + "step": 367310 + }, + { + "epoch": 1.85, + "learning_rate": 2.2023500209372836e-05, + "loss": 0.0048, + "step": 367320 + }, + { + "epoch": 1.85, + "learning_rate": 2.2015932516358828e-05, + "loss": 0.0055, + "step": 367330 + }, + { + "epoch": 1.85, + "learning_rate": 2.200836482334482e-05, + "loss": 0.0049, + "step": 367340 + }, + { + "epoch": 1.85, + "learning_rate": 2.2000797130330808e-05, + "loss": 0.0054, + "step": 367350 + }, + { + "epoch": 1.85, + "learning_rate": 2.19932294373168e-05, + "loss": 0.005, + "step": 367360 + }, + { + "epoch": 1.85, + "learning_rate": 2.1985661744302788e-05, + "loss": 0.0059, + "step": 367370 + }, + { + "epoch": 1.85, + "learning_rate": 2.197809405128878e-05, + "loss": 0.0068, + "step": 367380 + }, + { + "epoch": 1.85, + "learning_rate": 2.1970526358274767e-05, + "loss": 0.005, + "step": 367390 + }, + { + "epoch": 1.85, + "learning_rate": 2.196295866526076e-05, + "loss": 0.0064, + "step": 367400 + }, + { + "epoch": 1.85, + "learning_rate": 2.1955390972246744e-05, + "loss": 0.0073, + "step": 367410 + }, + { + "epoch": 1.85, + "learning_rate": 2.1947823279232732e-05, + "loss": 0.0054, + "step": 367420 + }, + { + "epoch": 1.85, + "learning_rate": 2.1940255586218724e-05, + "loss": 0.0049, + "step": 367430 + }, + { + "epoch": 1.85, + "learning_rate": 2.1932687893204712e-05, + "loss": 0.0059, + "step": 367440 + }, + { + "epoch": 1.85, + "learning_rate": 2.1925120200190703e-05, + "loss": 0.0067, + "step": 367450 + }, + { + "epoch": 1.85, + "learning_rate": 2.1917552507176692e-05, + "loss": 0.0062, + "step": 367460 + }, + { + "epoch": 1.85, + "learning_rate": 2.1909984814162683e-05, + "loss": 0.0061, + "step": 367470 + }, + { + "epoch": 1.85, + "learning_rate": 2.190241712114867e-05, + "loss": 0.0052, + "step": 367480 + }, + { + "epoch": 1.85, + "learning_rate": 2.1894849428134663e-05, + "loss": 0.0086, + "step": 367490 + }, + { + "epoch": 1.85, + "learning_rate": 2.188728173512065e-05, + "loss": 0.0057, + "step": 367500 + }, + { + "epoch": 1.85, + "learning_rate": 2.1879714042106643e-05, + "loss": 0.0056, + "step": 367510 + }, + { + "epoch": 1.85, + "learning_rate": 2.187214634909263e-05, + "loss": 0.0032, + "step": 367520 + }, + { + "epoch": 1.85, + "learning_rate": 2.1864578656078623e-05, + "loss": 0.0067, + "step": 367530 + }, + { + "epoch": 1.85, + "learning_rate": 2.185701096306461e-05, + "loss": 0.0082, + "step": 367540 + }, + { + "epoch": 1.85, + "learning_rate": 2.1849443270050603e-05, + "loss": 0.0057, + "step": 367550 + }, + { + "epoch": 1.85, + "learning_rate": 2.184187557703659e-05, + "loss": 0.0056, + "step": 367560 + }, + { + "epoch": 1.85, + "learning_rate": 2.183430788402258e-05, + "loss": 0.0061, + "step": 367570 + }, + { + "epoch": 1.85, + "learning_rate": 2.1826740191008567e-05, + "loss": 0.0051, + "step": 367580 + }, + { + "epoch": 1.85, + "learning_rate": 2.181917249799456e-05, + "loss": 0.0055, + "step": 367590 + }, + { + "epoch": 1.85, + "learning_rate": 2.1811604804980547e-05, + "loss": 0.0038, + "step": 367600 + }, + { + "epoch": 1.85, + "learning_rate": 2.180403711196654e-05, + "loss": 0.006, + "step": 367610 + }, + { + "epoch": 1.85, + "learning_rate": 2.1796469418952527e-05, + "loss": 0.0061, + "step": 367620 + }, + { + "epoch": 1.85, + "learning_rate": 2.178890172593852e-05, + "loss": 0.0061, + "step": 367630 + }, + { + "epoch": 1.85, + "learning_rate": 2.1781334032924507e-05, + "loss": 0.0063, + "step": 367640 + }, + { + "epoch": 1.85, + "learning_rate": 2.17737663399105e-05, + "loss": 0.0063, + "step": 367650 + }, + { + "epoch": 1.85, + "learning_rate": 2.1766198646896487e-05, + "loss": 0.0059, + "step": 367660 + }, + { + "epoch": 1.85, + "learning_rate": 2.1758630953882478e-05, + "loss": 0.0058, + "step": 367670 + }, + { + "epoch": 1.85, + "learning_rate": 2.1751063260868466e-05, + "loss": 0.0075, + "step": 367680 + }, + { + "epoch": 1.86, + "learning_rate": 2.1743495567854458e-05, + "loss": 0.0063, + "step": 367690 + }, + { + "epoch": 1.86, + "learning_rate": 2.1735927874840446e-05, + "loss": 0.0061, + "step": 367700 + }, + { + "epoch": 1.86, + "learning_rate": 2.1728360181826438e-05, + "loss": 0.0069, + "step": 367710 + }, + { + "epoch": 1.86, + "learning_rate": 2.1720792488812423e-05, + "loss": 0.0046, + "step": 367720 + }, + { + "epoch": 1.86, + "learning_rate": 2.1713224795798414e-05, + "loss": 0.0086, + "step": 367730 + }, + { + "epoch": 1.86, + "learning_rate": 2.1705657102784402e-05, + "loss": 0.006, + "step": 367740 + }, + { + "epoch": 1.86, + "learning_rate": 2.1698089409770394e-05, + "loss": 0.0046, + "step": 367750 + }, + { + "epoch": 1.86, + "learning_rate": 2.1690521716756382e-05, + "loss": 0.0046, + "step": 367760 + }, + { + "epoch": 1.86, + "learning_rate": 2.1682954023742374e-05, + "loss": 0.006, + "step": 367770 + }, + { + "epoch": 1.86, + "learning_rate": 2.1675386330728362e-05, + "loss": 0.0077, + "step": 367780 + }, + { + "epoch": 1.86, + "learning_rate": 2.1667818637714354e-05, + "loss": 0.0052, + "step": 367790 + }, + { + "epoch": 1.86, + "learning_rate": 2.1660250944700342e-05, + "loss": 0.0042, + "step": 367800 + }, + { + "epoch": 1.86, + "learning_rate": 2.1652683251686334e-05, + "loss": 0.0085, + "step": 367810 + }, + { + "epoch": 1.86, + "learning_rate": 2.1645115558672322e-05, + "loss": 0.0065, + "step": 367820 + }, + { + "epoch": 1.86, + "learning_rate": 2.1637547865658313e-05, + "loss": 0.0078, + "step": 367830 + }, + { + "epoch": 1.86, + "learning_rate": 2.16299801726443e-05, + "loss": 0.0047, + "step": 367840 + }, + { + "epoch": 1.86, + "learning_rate": 2.1622412479630293e-05, + "loss": 0.0054, + "step": 367850 + }, + { + "epoch": 1.86, + "learning_rate": 2.161484478661628e-05, + "loss": 0.0052, + "step": 367860 + }, + { + "epoch": 1.86, + "learning_rate": 2.1607277093602273e-05, + "loss": 0.0059, + "step": 367870 + }, + { + "epoch": 1.86, + "learning_rate": 2.1599709400588258e-05, + "loss": 0.006, + "step": 367880 + }, + { + "epoch": 1.86, + "learning_rate": 2.159214170757425e-05, + "loss": 0.0062, + "step": 367890 + }, + { + "epoch": 1.86, + "learning_rate": 2.1584574014560238e-05, + "loss": 0.0046, + "step": 367900 + }, + { + "epoch": 1.86, + "learning_rate": 2.157700632154623e-05, + "loss": 0.0047, + "step": 367910 + }, + { + "epoch": 1.86, + "learning_rate": 2.1569438628532218e-05, + "loss": 0.0072, + "step": 367920 + }, + { + "epoch": 1.86, + "learning_rate": 2.156187093551821e-05, + "loss": 0.0063, + "step": 367930 + }, + { + "epoch": 1.86, + "learning_rate": 2.1554303242504197e-05, + "loss": 0.0066, + "step": 367940 + }, + { + "epoch": 1.86, + "learning_rate": 2.154673554949019e-05, + "loss": 0.0046, + "step": 367950 + }, + { + "epoch": 1.86, + "learning_rate": 2.1539167856476177e-05, + "loss": 0.0076, + "step": 367960 + }, + { + "epoch": 1.86, + "learning_rate": 2.153160016346217e-05, + "loss": 0.0077, + "step": 367970 + }, + { + "epoch": 1.86, + "learning_rate": 2.1524032470448157e-05, + "loss": 0.0058, + "step": 367980 + }, + { + "epoch": 1.86, + "learning_rate": 2.151646477743415e-05, + "loss": 0.0042, + "step": 367990 + }, + { + "epoch": 1.86, + "learning_rate": 2.1508897084420137e-05, + "loss": 0.0072, + "step": 368000 + }, + { + "epoch": 1.86, + "eval_cer": 0.9144285288697699, + "eval_loss": 0.004368205089122057, + "eval_runtime": 116.793, + "eval_samples_per_second": 17.124, + "eval_steps_per_second": 4.281, + "step": 368000 + }, + { + "epoch": 1.86, + "learning_rate": 2.150132939140613e-05, + "loss": 0.0076, + "step": 368010 + }, + { + "epoch": 1.86, + "learning_rate": 2.1493761698392117e-05, + "loss": 0.0044, + "step": 368020 + }, + { + "epoch": 1.86, + "learning_rate": 2.1486194005378108e-05, + "loss": 0.0057, + "step": 368030 + }, + { + "epoch": 1.86, + "learning_rate": 2.1478626312364093e-05, + "loss": 0.0048, + "step": 368040 + }, + { + "epoch": 1.86, + "learning_rate": 2.1471058619350085e-05, + "loss": 0.0039, + "step": 368050 + }, + { + "epoch": 1.86, + "learning_rate": 2.1463490926336073e-05, + "loss": 0.0054, + "step": 368060 + }, + { + "epoch": 1.86, + "learning_rate": 2.1455923233322065e-05, + "loss": 0.0038, + "step": 368070 + }, + { + "epoch": 1.86, + "learning_rate": 2.1448355540308053e-05, + "loss": 0.0057, + "step": 368080 + }, + { + "epoch": 1.86, + "learning_rate": 2.1440787847294044e-05, + "loss": 0.0068, + "step": 368090 + }, + { + "epoch": 1.86, + "learning_rate": 2.1433220154280033e-05, + "loss": 0.0078, + "step": 368100 + }, + { + "epoch": 1.86, + "learning_rate": 2.1425652461266024e-05, + "loss": 0.0053, + "step": 368110 + }, + { + "epoch": 1.86, + "learning_rate": 2.1418084768252012e-05, + "loss": 0.0062, + "step": 368120 + }, + { + "epoch": 1.86, + "learning_rate": 2.1410517075238004e-05, + "loss": 0.0109, + "step": 368130 + }, + { + "epoch": 1.86, + "learning_rate": 2.1402949382223992e-05, + "loss": 0.0045, + "step": 368140 + }, + { + "epoch": 1.86, + "learning_rate": 2.1395381689209984e-05, + "loss": 0.0061, + "step": 368150 + }, + { + "epoch": 1.86, + "learning_rate": 2.1387813996195972e-05, + "loss": 0.006, + "step": 368160 + }, + { + "epoch": 1.86, + "learning_rate": 2.1380246303181964e-05, + "loss": 0.0053, + "step": 368170 + }, + { + "epoch": 1.86, + "learning_rate": 2.1372678610167952e-05, + "loss": 0.0046, + "step": 368180 + }, + { + "epoch": 1.86, + "learning_rate": 2.1365110917153937e-05, + "loss": 0.0041, + "step": 368190 + }, + { + "epoch": 1.86, + "learning_rate": 2.135754322413993e-05, + "loss": 0.0054, + "step": 368200 + }, + { + "epoch": 1.86, + "learning_rate": 2.1349975531125917e-05, + "loss": 0.005, + "step": 368210 + }, + { + "epoch": 1.86, + "learning_rate": 2.1342407838111908e-05, + "loss": 0.0082, + "step": 368220 + }, + { + "epoch": 1.86, + "learning_rate": 2.1334840145097896e-05, + "loss": 0.0054, + "step": 368230 + }, + { + "epoch": 1.86, + "learning_rate": 2.1327272452083888e-05, + "loss": 0.0047, + "step": 368240 + }, + { + "epoch": 1.86, + "learning_rate": 2.1319704759069876e-05, + "loss": 0.0059, + "step": 368250 + }, + { + "epoch": 1.86, + "learning_rate": 2.1312137066055868e-05, + "loss": 0.0063, + "step": 368260 + }, + { + "epoch": 1.86, + "learning_rate": 2.1304569373041856e-05, + "loss": 0.0102, + "step": 368270 + }, + { + "epoch": 1.86, + "learning_rate": 2.1297001680027848e-05, + "loss": 0.0049, + "step": 368280 + }, + { + "epoch": 1.86, + "learning_rate": 2.1289433987013836e-05, + "loss": 0.0054, + "step": 368290 + }, + { + "epoch": 1.86, + "learning_rate": 2.1281866293999827e-05, + "loss": 0.0052, + "step": 368300 + }, + { + "epoch": 1.86, + "learning_rate": 2.127429860098582e-05, + "loss": 0.0069, + "step": 368310 + }, + { + "epoch": 1.86, + "learning_rate": 2.1266730907971807e-05, + "loss": 0.0042, + "step": 368320 + }, + { + "epoch": 1.86, + "learning_rate": 2.12591632149578e-05, + "loss": 0.0044, + "step": 368330 + }, + { + "epoch": 1.86, + "learning_rate": 2.1251595521943787e-05, + "loss": 0.0074, + "step": 368340 + }, + { + "epoch": 1.86, + "learning_rate": 2.1244027828929772e-05, + "loss": 0.0058, + "step": 368350 + }, + { + "epoch": 1.86, + "learning_rate": 2.1236460135915764e-05, + "loss": 0.0065, + "step": 368360 + }, + { + "epoch": 1.86, + "learning_rate": 2.1228892442901752e-05, + "loss": 0.0042, + "step": 368370 + }, + { + "epoch": 1.86, + "learning_rate": 2.1221324749887743e-05, + "loss": 0.0044, + "step": 368380 + }, + { + "epoch": 1.86, + "learning_rate": 2.121375705687373e-05, + "loss": 0.0063, + "step": 368390 + }, + { + "epoch": 1.86, + "learning_rate": 2.1206189363859723e-05, + "loss": 0.0054, + "step": 368400 + }, + { + "epoch": 1.86, + "learning_rate": 2.119862167084571e-05, + "loss": 0.0068, + "step": 368410 + }, + { + "epoch": 1.86, + "learning_rate": 2.1191053977831703e-05, + "loss": 0.008, + "step": 368420 + }, + { + "epoch": 1.86, + "learning_rate": 2.118348628481769e-05, + "loss": 0.0068, + "step": 368430 + }, + { + "epoch": 1.86, + "learning_rate": 2.1175918591803683e-05, + "loss": 0.0058, + "step": 368440 + }, + { + "epoch": 1.86, + "learning_rate": 2.116835089878967e-05, + "loss": 0.0059, + "step": 368450 + }, + { + "epoch": 1.86, + "learning_rate": 2.1160783205775663e-05, + "loss": 0.0046, + "step": 368460 + }, + { + "epoch": 1.86, + "learning_rate": 2.115321551276165e-05, + "loss": 0.0037, + "step": 368470 + }, + { + "epoch": 1.86, + "learning_rate": 2.1145647819747642e-05, + "loss": 0.0074, + "step": 368480 + }, + { + "epoch": 1.86, + "learning_rate": 2.113808012673363e-05, + "loss": 0.0065, + "step": 368490 + }, + { + "epoch": 1.86, + "learning_rate": 2.1130512433719622e-05, + "loss": 0.0057, + "step": 368500 + }, + { + "epoch": 1.86, + "learning_rate": 2.1122944740705607e-05, + "loss": 0.0054, + "step": 368510 + }, + { + "epoch": 1.86, + "learning_rate": 2.11153770476916e-05, + "loss": 0.0053, + "step": 368520 + }, + { + "epoch": 1.86, + "learning_rate": 2.1107809354677587e-05, + "loss": 0.0057, + "step": 368530 + }, + { + "epoch": 1.86, + "learning_rate": 2.110024166166358e-05, + "loss": 0.0053, + "step": 368540 + }, + { + "epoch": 1.86, + "learning_rate": 2.1092673968649567e-05, + "loss": 0.0069, + "step": 368550 + }, + { + "epoch": 1.86, + "learning_rate": 2.108510627563556e-05, + "loss": 0.005, + "step": 368560 + }, + { + "epoch": 1.86, + "learning_rate": 2.1077538582621547e-05, + "loss": 0.0062, + "step": 368570 + }, + { + "epoch": 1.86, + "learning_rate": 2.1069970889607538e-05, + "loss": 0.0071, + "step": 368580 + }, + { + "epoch": 1.86, + "learning_rate": 2.1062403196593526e-05, + "loss": 0.0073, + "step": 368590 + }, + { + "epoch": 1.86, + "learning_rate": 2.1054835503579518e-05, + "loss": 0.0055, + "step": 368600 + }, + { + "epoch": 1.86, + "learning_rate": 2.1047267810565506e-05, + "loss": 0.0046, + "step": 368610 + }, + { + "epoch": 1.86, + "learning_rate": 2.1039700117551498e-05, + "loss": 0.0074, + "step": 368620 + }, + { + "epoch": 1.86, + "learning_rate": 2.1032132424537486e-05, + "loss": 0.0064, + "step": 368630 + }, + { + "epoch": 1.86, + "learning_rate": 2.1024564731523478e-05, + "loss": 0.0052, + "step": 368640 + }, + { + "epoch": 1.86, + "learning_rate": 2.1016997038509466e-05, + "loss": 0.0062, + "step": 368650 + }, + { + "epoch": 1.86, + "learning_rate": 2.1009429345495458e-05, + "loss": 0.0063, + "step": 368660 + }, + { + "epoch": 1.86, + "learning_rate": 2.1001861652481442e-05, + "loss": 0.0049, + "step": 368670 + }, + { + "epoch": 1.86, + "learning_rate": 2.0994293959467434e-05, + "loss": 0.005, + "step": 368680 + }, + { + "epoch": 1.86, + "learning_rate": 2.0986726266453422e-05, + "loss": 0.0046, + "step": 368690 + }, + { + "epoch": 1.86, + "learning_rate": 2.0979158573439414e-05, + "loss": 0.0067, + "step": 368700 + }, + { + "epoch": 1.86, + "learning_rate": 2.0971590880425402e-05, + "loss": 0.0067, + "step": 368710 + }, + { + "epoch": 1.86, + "learning_rate": 2.0964023187411394e-05, + "loss": 0.0053, + "step": 368720 + }, + { + "epoch": 1.86, + "learning_rate": 2.0956455494397382e-05, + "loss": 0.005, + "step": 368730 + }, + { + "epoch": 1.86, + "learning_rate": 2.0948887801383373e-05, + "loss": 0.0048, + "step": 368740 + }, + { + "epoch": 1.86, + "learning_rate": 2.094132010836936e-05, + "loss": 0.0051, + "step": 368750 + }, + { + "epoch": 1.86, + "learning_rate": 2.0933752415355353e-05, + "loss": 0.0065, + "step": 368760 + }, + { + "epoch": 1.86, + "learning_rate": 2.092618472234134e-05, + "loss": 0.0068, + "step": 368770 + }, + { + "epoch": 1.86, + "learning_rate": 2.0918617029327333e-05, + "loss": 0.0065, + "step": 368780 + }, + { + "epoch": 1.86, + "learning_rate": 2.091104933631332e-05, + "loss": 0.0066, + "step": 368790 + }, + { + "epoch": 1.86, + "learning_rate": 2.0903481643299313e-05, + "loss": 0.0049, + "step": 368800 + }, + { + "epoch": 1.86, + "learning_rate": 2.08959139502853e-05, + "loss": 0.0052, + "step": 368810 + }, + { + "epoch": 1.86, + "learning_rate": 2.088834625727129e-05, + "loss": 0.0043, + "step": 368820 + }, + { + "epoch": 1.86, + "learning_rate": 2.0880778564257278e-05, + "loss": 0.0056, + "step": 368830 + }, + { + "epoch": 1.86, + "learning_rate": 2.087321087124327e-05, + "loss": 0.0045, + "step": 368840 + }, + { + "epoch": 1.86, + "learning_rate": 2.0865643178229257e-05, + "loss": 0.0057, + "step": 368850 + }, + { + "epoch": 1.86, + "learning_rate": 2.085807548521525e-05, + "loss": 0.0052, + "step": 368860 + }, + { + "epoch": 1.86, + "learning_rate": 2.0850507792201237e-05, + "loss": 0.0077, + "step": 368870 + }, + { + "epoch": 1.86, + "learning_rate": 2.084294009918723e-05, + "loss": 0.0053, + "step": 368880 + }, + { + "epoch": 1.86, + "learning_rate": 2.0835372406173217e-05, + "loss": 0.007, + "step": 368890 + }, + { + "epoch": 1.86, + "learning_rate": 2.082780471315921e-05, + "loss": 0.0057, + "step": 368900 + }, + { + "epoch": 1.86, + "learning_rate": 2.0820237020145197e-05, + "loss": 0.0061, + "step": 368910 + }, + { + "epoch": 1.86, + "learning_rate": 2.081266932713119e-05, + "loss": 0.0074, + "step": 368920 + }, + { + "epoch": 1.86, + "learning_rate": 2.0805101634117177e-05, + "loss": 0.0055, + "step": 368930 + }, + { + "epoch": 1.86, + "learning_rate": 2.079753394110317e-05, + "loss": 0.0057, + "step": 368940 + }, + { + "epoch": 1.86, + "learning_rate": 2.0789966248089157e-05, + "loss": 0.0044, + "step": 368950 + }, + { + "epoch": 1.86, + "learning_rate": 2.0782398555075148e-05, + "loss": 0.0061, + "step": 368960 + }, + { + "epoch": 1.86, + "learning_rate": 2.0774830862061136e-05, + "loss": 0.0043, + "step": 368970 + }, + { + "epoch": 1.86, + "learning_rate": 2.076726316904712e-05, + "loss": 0.0084, + "step": 368980 + }, + { + "epoch": 1.86, + "learning_rate": 2.0759695476033113e-05, + "loss": 0.0047, + "step": 368990 + }, + { + "epoch": 1.86, + "learning_rate": 2.07521277830191e-05, + "loss": 0.008, + "step": 369000 + }, + { + "epoch": 1.86, + "eval_cer": 0.9144450256039017, + "eval_loss": 0.0044240448623895645, + "eval_runtime": 116.7122, + "eval_samples_per_second": 17.136, + "eval_steps_per_second": 4.284, + "step": 369000 + }, + { + "epoch": 1.86, + "learning_rate": 2.0744560090005093e-05, + "loss": 0.0053, + "step": 369010 + }, + { + "epoch": 1.86, + "learning_rate": 2.0736992396991084e-05, + "loss": 0.0047, + "step": 369020 + }, + { + "epoch": 1.86, + "learning_rate": 2.0729424703977072e-05, + "loss": 0.0054, + "step": 369030 + }, + { + "epoch": 1.86, + "learning_rate": 2.0721857010963064e-05, + "loss": 0.0058, + "step": 369040 + }, + { + "epoch": 1.86, + "learning_rate": 2.0714289317949052e-05, + "loss": 0.0055, + "step": 369050 + }, + { + "epoch": 1.86, + "learning_rate": 2.0706721624935044e-05, + "loss": 0.0067, + "step": 369060 + }, + { + "epoch": 1.86, + "learning_rate": 2.0699153931921032e-05, + "loss": 0.0061, + "step": 369070 + }, + { + "epoch": 1.86, + "learning_rate": 2.0691586238907024e-05, + "loss": 0.0068, + "step": 369080 + }, + { + "epoch": 1.86, + "learning_rate": 2.0684018545893012e-05, + "loss": 0.0059, + "step": 369090 + }, + { + "epoch": 1.86, + "learning_rate": 2.0676450852879004e-05, + "loss": 0.0069, + "step": 369100 + }, + { + "epoch": 1.86, + "learning_rate": 2.0668883159864992e-05, + "loss": 0.006, + "step": 369110 + }, + { + "epoch": 1.86, + "learning_rate": 2.0661315466850983e-05, + "loss": 0.0063, + "step": 369120 + }, + { + "epoch": 1.86, + "learning_rate": 2.065374777383697e-05, + "loss": 0.0104, + "step": 369130 + }, + { + "epoch": 1.86, + "learning_rate": 2.0646180080822956e-05, + "loss": 0.0061, + "step": 369140 + }, + { + "epoch": 1.86, + "learning_rate": 2.0638612387808948e-05, + "loss": 0.0047, + "step": 369150 + }, + { + "epoch": 1.86, + "learning_rate": 2.0631044694794936e-05, + "loss": 0.0112, + "step": 369160 + }, + { + "epoch": 1.86, + "learning_rate": 2.0623477001780928e-05, + "loss": 0.0056, + "step": 369170 + }, + { + "epoch": 1.86, + "learning_rate": 2.0615909308766916e-05, + "loss": 0.0059, + "step": 369180 + }, + { + "epoch": 1.86, + "learning_rate": 2.0608341615752908e-05, + "loss": 0.005, + "step": 369190 + }, + { + "epoch": 1.86, + "learning_rate": 2.0600773922738896e-05, + "loss": 0.0068, + "step": 369200 + }, + { + "epoch": 1.86, + "learning_rate": 2.0593206229724887e-05, + "loss": 0.0113, + "step": 369210 + }, + { + "epoch": 1.86, + "learning_rate": 2.0585638536710876e-05, + "loss": 0.0063, + "step": 369220 + }, + { + "epoch": 1.86, + "learning_rate": 2.0578070843696867e-05, + "loss": 0.0059, + "step": 369230 + }, + { + "epoch": 1.86, + "learning_rate": 2.0570503150682856e-05, + "loss": 0.0064, + "step": 369240 + }, + { + "epoch": 1.86, + "learning_rate": 2.0562935457668847e-05, + "loss": 0.0059, + "step": 369250 + }, + { + "epoch": 1.86, + "learning_rate": 2.0555367764654835e-05, + "loss": 0.0045, + "step": 369260 + }, + { + "epoch": 1.86, + "learning_rate": 2.0547800071640827e-05, + "loss": 0.0057, + "step": 369270 + }, + { + "epoch": 1.86, + "learning_rate": 2.054023237862682e-05, + "loss": 0.0059, + "step": 369280 + }, + { + "epoch": 1.86, + "learning_rate": 2.0532664685612803e-05, + "loss": 0.006, + "step": 369290 + }, + { + "epoch": 1.86, + "learning_rate": 2.052509699259879e-05, + "loss": 0.0066, + "step": 369300 + }, + { + "epoch": 1.86, + "learning_rate": 2.0517529299584783e-05, + "loss": 0.0061, + "step": 369310 + }, + { + "epoch": 1.86, + "learning_rate": 2.050996160657077e-05, + "loss": 0.0063, + "step": 369320 + }, + { + "epoch": 1.86, + "learning_rate": 2.0502393913556763e-05, + "loss": 0.0086, + "step": 369330 + }, + { + "epoch": 1.86, + "learning_rate": 2.049482622054275e-05, + "loss": 0.0049, + "step": 369340 + }, + { + "epoch": 1.86, + "learning_rate": 2.0487258527528743e-05, + "loss": 0.0045, + "step": 369350 + }, + { + "epoch": 1.86, + "learning_rate": 2.047969083451473e-05, + "loss": 0.0048, + "step": 369360 + }, + { + "epoch": 1.86, + "learning_rate": 2.0472123141500723e-05, + "loss": 0.0133, + "step": 369370 + }, + { + "epoch": 1.86, + "learning_rate": 2.046455544848671e-05, + "loss": 0.006, + "step": 369380 + }, + { + "epoch": 1.86, + "learning_rate": 2.0456987755472703e-05, + "loss": 0.0063, + "step": 369390 + }, + { + "epoch": 1.86, + "learning_rate": 2.044942006245869e-05, + "loss": 0.008, + "step": 369400 + }, + { + "epoch": 1.86, + "learning_rate": 2.0441852369444682e-05, + "loss": 0.0049, + "step": 369410 + }, + { + "epoch": 1.86, + "learning_rate": 2.043428467643067e-05, + "loss": 0.0055, + "step": 369420 + }, + { + "epoch": 1.86, + "learning_rate": 2.0426716983416662e-05, + "loss": 0.0044, + "step": 369430 + }, + { + "epoch": 1.86, + "learning_rate": 2.041914929040265e-05, + "loss": 0.005, + "step": 369440 + }, + { + "epoch": 1.86, + "learning_rate": 2.041158159738864e-05, + "loss": 0.0033, + "step": 369450 + }, + { + "epoch": 1.86, + "learning_rate": 2.0404013904374627e-05, + "loss": 0.0059, + "step": 369460 + }, + { + "epoch": 1.86, + "learning_rate": 2.039644621136062e-05, + "loss": 0.0047, + "step": 369470 + }, + { + "epoch": 1.86, + "learning_rate": 2.0388878518346607e-05, + "loss": 0.0069, + "step": 369480 + }, + { + "epoch": 1.86, + "learning_rate": 2.0381310825332598e-05, + "loss": 0.0075, + "step": 369490 + }, + { + "epoch": 1.86, + "learning_rate": 2.0373743132318586e-05, + "loss": 0.0051, + "step": 369500 + }, + { + "epoch": 1.86, + "learning_rate": 2.0366175439304578e-05, + "loss": 0.0049, + "step": 369510 + }, + { + "epoch": 1.86, + "learning_rate": 2.0358607746290566e-05, + "loss": 0.007, + "step": 369520 + }, + { + "epoch": 1.86, + "learning_rate": 2.0351040053276558e-05, + "loss": 0.0048, + "step": 369530 + }, + { + "epoch": 1.86, + "learning_rate": 2.0343472360262546e-05, + "loss": 0.0064, + "step": 369540 + }, + { + "epoch": 1.86, + "learning_rate": 2.0335904667248538e-05, + "loss": 0.0065, + "step": 369550 + }, + { + "epoch": 1.86, + "learning_rate": 2.0328336974234526e-05, + "loss": 0.0068, + "step": 369560 + }, + { + "epoch": 1.86, + "learning_rate": 2.0320769281220518e-05, + "loss": 0.0053, + "step": 369570 + }, + { + "epoch": 1.86, + "learning_rate": 2.0313201588206506e-05, + "loss": 0.006, + "step": 369580 + }, + { + "epoch": 1.86, + "learning_rate": 2.0305633895192497e-05, + "loss": 0.0044, + "step": 369590 + }, + { + "epoch": 1.86, + "learning_rate": 2.0298066202178486e-05, + "loss": 0.0049, + "step": 369600 + }, + { + "epoch": 1.86, + "learning_rate": 2.0290498509164474e-05, + "loss": 0.0043, + "step": 369610 + }, + { + "epoch": 1.86, + "learning_rate": 2.0282930816150462e-05, + "loss": 0.0067, + "step": 369620 + }, + { + "epoch": 1.86, + "learning_rate": 2.0275363123136454e-05, + "loss": 0.0068, + "step": 369630 + }, + { + "epoch": 1.86, + "learning_rate": 2.0267795430122442e-05, + "loss": 0.0067, + "step": 369640 + }, + { + "epoch": 1.86, + "learning_rate": 2.0260227737108433e-05, + "loss": 0.0059, + "step": 369650 + }, + { + "epoch": 1.86, + "learning_rate": 2.0252660044094422e-05, + "loss": 0.0065, + "step": 369660 + }, + { + "epoch": 1.87, + "learning_rate": 2.0245092351080413e-05, + "loss": 0.0085, + "step": 369670 + }, + { + "epoch": 1.87, + "learning_rate": 2.02375246580664e-05, + "loss": 0.0072, + "step": 369680 + }, + { + "epoch": 1.87, + "learning_rate": 2.0229956965052393e-05, + "loss": 0.0045, + "step": 369690 + }, + { + "epoch": 1.87, + "learning_rate": 2.022238927203838e-05, + "loss": 0.0046, + "step": 369700 + }, + { + "epoch": 1.87, + "learning_rate": 2.0214821579024373e-05, + "loss": 0.0068, + "step": 369710 + }, + { + "epoch": 1.87, + "learning_rate": 2.020725388601036e-05, + "loss": 0.0068, + "step": 369720 + }, + { + "epoch": 1.87, + "learning_rate": 2.0199686192996353e-05, + "loss": 0.0054, + "step": 369730 + }, + { + "epoch": 1.87, + "learning_rate": 2.019211849998234e-05, + "loss": 0.0056, + "step": 369740 + }, + { + "epoch": 1.87, + "learning_rate": 2.0184550806968333e-05, + "loss": 0.0053, + "step": 369750 + }, + { + "epoch": 1.87, + "learning_rate": 2.017698311395432e-05, + "loss": 0.0069, + "step": 369760 + }, + { + "epoch": 1.87, + "learning_rate": 2.016941542094031e-05, + "loss": 0.0059, + "step": 369770 + }, + { + "epoch": 1.87, + "learning_rate": 2.0161847727926297e-05, + "loss": 0.0049, + "step": 369780 + }, + { + "epoch": 1.87, + "learning_rate": 2.015428003491229e-05, + "loss": 0.006, + "step": 369790 + }, + { + "epoch": 1.87, + "learning_rate": 2.0146712341898277e-05, + "loss": 0.0046, + "step": 369800 + }, + { + "epoch": 1.87, + "learning_rate": 2.013914464888427e-05, + "loss": 0.0059, + "step": 369810 + }, + { + "epoch": 1.87, + "learning_rate": 2.0131576955870257e-05, + "loss": 0.007, + "step": 369820 + }, + { + "epoch": 1.87, + "learning_rate": 2.012400926285625e-05, + "loss": 0.0055, + "step": 369830 + }, + { + "epoch": 1.87, + "learning_rate": 2.0116441569842237e-05, + "loss": 0.0064, + "step": 369840 + }, + { + "epoch": 1.87, + "learning_rate": 2.010887387682823e-05, + "loss": 0.0043, + "step": 369850 + }, + { + "epoch": 1.87, + "learning_rate": 2.0101306183814217e-05, + "loss": 0.005, + "step": 369860 + }, + { + "epoch": 1.87, + "learning_rate": 2.0093738490800208e-05, + "loss": 0.0058, + "step": 369870 + }, + { + "epoch": 1.87, + "learning_rate": 2.0086170797786196e-05, + "loss": 0.0063, + "step": 369880 + }, + { + "epoch": 1.87, + "learning_rate": 2.0078603104772188e-05, + "loss": 0.007, + "step": 369890 + }, + { + "epoch": 1.87, + "learning_rate": 2.0071035411758176e-05, + "loss": 0.0058, + "step": 369900 + }, + { + "epoch": 1.87, + "learning_rate": 2.0063467718744168e-05, + "loss": 0.0045, + "step": 369910 + }, + { + "epoch": 1.87, + "learning_rate": 2.0055900025730153e-05, + "loss": 0.0061, + "step": 369920 + }, + { + "epoch": 1.87, + "learning_rate": 2.004833233271614e-05, + "loss": 0.0067, + "step": 369930 + }, + { + "epoch": 1.87, + "learning_rate": 2.0040764639702132e-05, + "loss": 0.005, + "step": 369940 + }, + { + "epoch": 1.87, + "learning_rate": 2.003319694668812e-05, + "loss": 0.0042, + "step": 369950 + }, + { + "epoch": 1.87, + "learning_rate": 2.0025629253674112e-05, + "loss": 0.0084, + "step": 369960 + }, + { + "epoch": 1.87, + "learning_rate": 2.00180615606601e-05, + "loss": 0.007, + "step": 369970 + }, + { + "epoch": 1.87, + "learning_rate": 2.0010493867646092e-05, + "loss": 0.0052, + "step": 369980 + }, + { + "epoch": 1.87, + "learning_rate": 2.0002926174632084e-05, + "loss": 0.0055, + "step": 369990 + }, + { + "epoch": 1.87, + "learning_rate": 1.9995358481618072e-05, + "loss": 0.0046, + "step": 370000 + }, + { + "epoch": 1.87, + "eval_cer": 0.9144246472852683, + "eval_loss": 0.004436591174453497, + "eval_runtime": 116.7427, + "eval_samples_per_second": 17.132, + "eval_steps_per_second": 4.283, + "step": 370000 + }, + { + "epoch": 1.87, + "learning_rate": 1.9987790788604064e-05, + "loss": 0.0047, + "step": 370010 + }, + { + "epoch": 1.87, + "learning_rate": 1.9980223095590052e-05, + "loss": 0.0077, + "step": 370020 + }, + { + "epoch": 1.87, + "learning_rate": 1.9972655402576043e-05, + "loss": 0.0039, + "step": 370030 + }, + { + "epoch": 1.87, + "learning_rate": 1.996508770956203e-05, + "loss": 0.0071, + "step": 370040 + }, + { + "epoch": 1.87, + "learning_rate": 1.9957520016548023e-05, + "loss": 0.0044, + "step": 370050 + }, + { + "epoch": 1.87, + "learning_rate": 1.994995232353401e-05, + "loss": 0.0049, + "step": 370060 + }, + { + "epoch": 1.87, + "learning_rate": 1.9942384630520003e-05, + "loss": 0.0055, + "step": 370070 + }, + { + "epoch": 1.87, + "learning_rate": 1.9934816937505988e-05, + "loss": 0.0046, + "step": 370080 + }, + { + "epoch": 1.87, + "learning_rate": 1.9927249244491976e-05, + "loss": 0.0043, + "step": 370090 + }, + { + "epoch": 1.87, + "learning_rate": 1.9919681551477968e-05, + "loss": 0.0069, + "step": 370100 + }, + { + "epoch": 1.87, + "learning_rate": 1.9912113858463956e-05, + "loss": 0.005, + "step": 370110 + }, + { + "epoch": 1.87, + "learning_rate": 1.9904546165449948e-05, + "loss": 0.007, + "step": 370120 + }, + { + "epoch": 1.87, + "learning_rate": 1.9896978472435936e-05, + "loss": 0.005, + "step": 370130 + }, + { + "epoch": 1.87, + "learning_rate": 1.9889410779421927e-05, + "loss": 0.0073, + "step": 370140 + }, + { + "epoch": 1.87, + "learning_rate": 1.9881843086407916e-05, + "loss": 0.0052, + "step": 370150 + }, + { + "epoch": 1.87, + "learning_rate": 1.9874275393393907e-05, + "loss": 0.0056, + "step": 370160 + }, + { + "epoch": 1.87, + "learning_rate": 1.9866707700379895e-05, + "loss": 0.006, + "step": 370170 + }, + { + "epoch": 1.87, + "learning_rate": 1.9859140007365887e-05, + "loss": 0.0049, + "step": 370180 + }, + { + "epoch": 1.87, + "learning_rate": 1.9851572314351875e-05, + "loss": 0.0052, + "step": 370190 + }, + { + "epoch": 1.87, + "learning_rate": 1.9844004621337867e-05, + "loss": 0.0072, + "step": 370200 + }, + { + "epoch": 1.87, + "learning_rate": 1.9836436928323855e-05, + "loss": 0.005, + "step": 370210 + }, + { + "epoch": 1.87, + "learning_rate": 1.9828869235309847e-05, + "loss": 0.0041, + "step": 370220 + }, + { + "epoch": 1.87, + "learning_rate": 1.9821301542295835e-05, + "loss": 0.0062, + "step": 370230 + }, + { + "epoch": 1.87, + "learning_rate": 1.9813733849281823e-05, + "loss": 0.0067, + "step": 370240 + }, + { + "epoch": 1.87, + "learning_rate": 1.980616615626781e-05, + "loss": 0.0079, + "step": 370250 + }, + { + "epoch": 1.87, + "learning_rate": 1.9798598463253803e-05, + "loss": 0.0051, + "step": 370260 + }, + { + "epoch": 1.87, + "learning_rate": 1.979103077023979e-05, + "loss": 0.0054, + "step": 370270 + }, + { + "epoch": 1.87, + "learning_rate": 1.9783463077225783e-05, + "loss": 0.0046, + "step": 370280 + }, + { + "epoch": 1.87, + "learning_rate": 1.977589538421177e-05, + "loss": 0.0056, + "step": 370290 + }, + { + "epoch": 1.87, + "learning_rate": 1.9768327691197763e-05, + "loss": 0.0058, + "step": 370300 + }, + { + "epoch": 1.87, + "learning_rate": 1.976075999818375e-05, + "loss": 0.0048, + "step": 370310 + }, + { + "epoch": 1.87, + "learning_rate": 1.9753192305169742e-05, + "loss": 0.0044, + "step": 370320 + }, + { + "epoch": 1.87, + "learning_rate": 1.974562461215573e-05, + "loss": 0.0067, + "step": 370330 + }, + { + "epoch": 1.87, + "learning_rate": 1.9738056919141722e-05, + "loss": 0.0066, + "step": 370340 + }, + { + "epoch": 1.87, + "learning_rate": 1.973048922612771e-05, + "loss": 0.0056, + "step": 370350 + }, + { + "epoch": 1.87, + "learning_rate": 1.9722921533113702e-05, + "loss": 0.0064, + "step": 370360 + }, + { + "epoch": 1.87, + "learning_rate": 1.971535384009969e-05, + "loss": 0.0044, + "step": 370370 + }, + { + "epoch": 1.87, + "learning_rate": 1.9707786147085682e-05, + "loss": 0.0058, + "step": 370380 + }, + { + "epoch": 1.87, + "learning_rate": 1.9700218454071667e-05, + "loss": 0.0077, + "step": 370390 + }, + { + "epoch": 1.87, + "learning_rate": 1.969265076105766e-05, + "loss": 0.0057, + "step": 370400 + }, + { + "epoch": 1.87, + "learning_rate": 1.9685083068043647e-05, + "loss": 0.006, + "step": 370410 + }, + { + "epoch": 1.87, + "learning_rate": 1.9677515375029638e-05, + "loss": 0.0039, + "step": 370420 + }, + { + "epoch": 1.87, + "learning_rate": 1.9669947682015626e-05, + "loss": 0.0059, + "step": 370430 + }, + { + "epoch": 1.87, + "learning_rate": 1.9662379989001618e-05, + "loss": 0.0069, + "step": 370440 + }, + { + "epoch": 1.87, + "learning_rate": 1.9654812295987606e-05, + "loss": 0.007, + "step": 370450 + }, + { + "epoch": 1.87, + "learning_rate": 1.9647244602973598e-05, + "loss": 0.0086, + "step": 370460 + }, + { + "epoch": 1.87, + "learning_rate": 1.9639676909959586e-05, + "loss": 0.0069, + "step": 370470 + }, + { + "epoch": 1.87, + "learning_rate": 1.9632109216945578e-05, + "loss": 0.0049, + "step": 370480 + }, + { + "epoch": 1.87, + "learning_rate": 1.9624541523931566e-05, + "loss": 0.0074, + "step": 370490 + }, + { + "epoch": 1.87, + "learning_rate": 1.9616973830917557e-05, + "loss": 0.0054, + "step": 370500 + }, + { + "epoch": 1.87, + "learning_rate": 1.9609406137903546e-05, + "loss": 0.0056, + "step": 370510 + }, + { + "epoch": 1.87, + "learning_rate": 1.9601838444889537e-05, + "loss": 0.0051, + "step": 370520 + }, + { + "epoch": 1.87, + "learning_rate": 1.9594270751875525e-05, + "loss": 0.0051, + "step": 370530 + }, + { + "epoch": 1.87, + "learning_rate": 1.9586703058861517e-05, + "loss": 0.0053, + "step": 370540 + }, + { + "epoch": 1.87, + "learning_rate": 1.9579135365847502e-05, + "loss": 0.0052, + "step": 370550 + }, + { + "epoch": 1.87, + "learning_rate": 1.9571567672833494e-05, + "loss": 0.0054, + "step": 370560 + }, + { + "epoch": 1.87, + "learning_rate": 1.9563999979819482e-05, + "loss": 0.0054, + "step": 370570 + }, + { + "epoch": 1.87, + "learning_rate": 1.9556432286805473e-05, + "loss": 0.006, + "step": 370580 + }, + { + "epoch": 1.87, + "learning_rate": 1.954886459379146e-05, + "loss": 0.0061, + "step": 370590 + }, + { + "epoch": 1.87, + "learning_rate": 1.9541296900777453e-05, + "loss": 0.0066, + "step": 370600 + }, + { + "epoch": 1.87, + "learning_rate": 1.953372920776344e-05, + "loss": 0.0068, + "step": 370610 + }, + { + "epoch": 1.87, + "learning_rate": 1.9526161514749433e-05, + "loss": 0.004, + "step": 370620 + }, + { + "epoch": 1.87, + "learning_rate": 1.951859382173542e-05, + "loss": 0.0069, + "step": 370630 + }, + { + "epoch": 1.87, + "learning_rate": 1.9511026128721413e-05, + "loss": 0.0063, + "step": 370640 + }, + { + "epoch": 1.87, + "learning_rate": 1.95034584357074e-05, + "loss": 0.0071, + "step": 370650 + }, + { + "epoch": 1.87, + "learning_rate": 1.9495890742693393e-05, + "loss": 0.0065, + "step": 370660 + }, + { + "epoch": 1.87, + "learning_rate": 1.948832304967938e-05, + "loss": 0.0064, + "step": 370670 + }, + { + "epoch": 1.87, + "learning_rate": 1.9480755356665372e-05, + "loss": 0.0063, + "step": 370680 + }, + { + "epoch": 1.87, + "learning_rate": 1.947318766365136e-05, + "loss": 0.0066, + "step": 370690 + }, + { + "epoch": 1.87, + "learning_rate": 1.9465619970637352e-05, + "loss": 0.0071, + "step": 370700 + }, + { + "epoch": 1.87, + "learning_rate": 1.9458052277623337e-05, + "loss": 0.0045, + "step": 370710 + }, + { + "epoch": 1.87, + "learning_rate": 1.945048458460933e-05, + "loss": 0.0067, + "step": 370720 + }, + { + "epoch": 1.87, + "learning_rate": 1.9442916891595317e-05, + "loss": 0.0051, + "step": 370730 + }, + { + "epoch": 1.87, + "learning_rate": 1.943534919858131e-05, + "loss": 0.0063, + "step": 370740 + }, + { + "epoch": 1.87, + "learning_rate": 1.9427781505567297e-05, + "loss": 0.0051, + "step": 370750 + }, + { + "epoch": 1.87, + "learning_rate": 1.942021381255329e-05, + "loss": 0.0067, + "step": 370760 + }, + { + "epoch": 1.87, + "learning_rate": 1.9412646119539277e-05, + "loss": 0.0039, + "step": 370770 + }, + { + "epoch": 1.87, + "learning_rate": 1.9405078426525268e-05, + "loss": 0.0065, + "step": 370780 + }, + { + "epoch": 1.87, + "learning_rate": 1.9397510733511256e-05, + "loss": 0.0055, + "step": 370790 + }, + { + "epoch": 1.87, + "learning_rate": 1.9389943040497248e-05, + "loss": 0.0066, + "step": 370800 + }, + { + "epoch": 1.87, + "learning_rate": 1.9382375347483236e-05, + "loss": 0.0062, + "step": 370810 + }, + { + "epoch": 1.87, + "learning_rate": 1.9374807654469228e-05, + "loss": 0.0048, + "step": 370820 + }, + { + "epoch": 1.87, + "learning_rate": 1.9367239961455216e-05, + "loss": 0.0055, + "step": 370830 + }, + { + "epoch": 1.87, + "learning_rate": 1.9359672268441208e-05, + "loss": 0.0062, + "step": 370840 + }, + { + "epoch": 1.87, + "learning_rate": 1.9352104575427196e-05, + "loss": 0.0074, + "step": 370850 + }, + { + "epoch": 1.87, + "learning_rate": 1.9344536882413188e-05, + "loss": 0.0052, + "step": 370860 + }, + { + "epoch": 1.87, + "learning_rate": 1.9336969189399172e-05, + "loss": 0.0056, + "step": 370870 + }, + { + "epoch": 1.87, + "learning_rate": 1.932940149638516e-05, + "loss": 0.0074, + "step": 370880 + }, + { + "epoch": 1.87, + "learning_rate": 1.9321833803371152e-05, + "loss": 0.0064, + "step": 370890 + }, + { + "epoch": 1.87, + "learning_rate": 1.931426611035714e-05, + "loss": 0.0054, + "step": 370900 + }, + { + "epoch": 1.87, + "learning_rate": 1.9306698417343132e-05, + "loss": 0.0053, + "step": 370910 + }, + { + "epoch": 1.87, + "learning_rate": 1.929913072432912e-05, + "loss": 0.005, + "step": 370920 + }, + { + "epoch": 1.87, + "learning_rate": 1.9291563031315112e-05, + "loss": 0.0099, + "step": 370930 + }, + { + "epoch": 1.87, + "learning_rate": 1.92839953383011e-05, + "loss": 0.0077, + "step": 370940 + }, + { + "epoch": 1.87, + "learning_rate": 1.927642764528709e-05, + "loss": 0.0049, + "step": 370950 + }, + { + "epoch": 1.87, + "learning_rate": 1.9268859952273083e-05, + "loss": 0.0057, + "step": 370960 + }, + { + "epoch": 1.87, + "learning_rate": 1.926129225925907e-05, + "loss": 0.0056, + "step": 370970 + }, + { + "epoch": 1.87, + "learning_rate": 1.9253724566245063e-05, + "loss": 0.0049, + "step": 370980 + }, + { + "epoch": 1.87, + "learning_rate": 1.924615687323105e-05, + "loss": 0.0048, + "step": 370990 + }, + { + "epoch": 1.87, + "learning_rate": 1.9238589180217043e-05, + "loss": 0.0069, + "step": 371000 + }, + { + "epoch": 1.87, + "eval_cer": 0.9144450256039017, + "eval_loss": 0.004348627291619778, + "eval_runtime": 116.6791, + "eval_samples_per_second": 17.141, + "eval_steps_per_second": 4.285, + "step": 371000 + }, + { + "epoch": 1.87, + "learning_rate": 1.923102148720303e-05, + "loss": 0.0046, + "step": 371010 + }, + { + "epoch": 1.87, + "learning_rate": 1.9223453794189016e-05, + "loss": 0.0054, + "step": 371020 + }, + { + "epoch": 1.87, + "learning_rate": 1.9215886101175008e-05, + "loss": 0.0062, + "step": 371030 + }, + { + "epoch": 1.87, + "learning_rate": 1.9208318408160996e-05, + "loss": 0.0049, + "step": 371040 + }, + { + "epoch": 1.87, + "learning_rate": 1.9200750715146987e-05, + "loss": 0.0048, + "step": 371050 + }, + { + "epoch": 1.87, + "learning_rate": 1.9193183022132976e-05, + "loss": 0.0059, + "step": 371060 + }, + { + "epoch": 1.87, + "learning_rate": 1.9185615329118967e-05, + "loss": 0.0032, + "step": 371070 + }, + { + "epoch": 1.87, + "learning_rate": 1.9178047636104955e-05, + "loss": 0.0069, + "step": 371080 + }, + { + "epoch": 1.87, + "learning_rate": 1.9170479943090947e-05, + "loss": 0.0071, + "step": 371090 + }, + { + "epoch": 1.87, + "learning_rate": 1.9162912250076935e-05, + "loss": 0.0053, + "step": 371100 + }, + { + "epoch": 1.87, + "learning_rate": 1.9155344557062927e-05, + "loss": 0.0069, + "step": 371110 + }, + { + "epoch": 1.87, + "learning_rate": 1.9147776864048915e-05, + "loss": 0.0068, + "step": 371120 + }, + { + "epoch": 1.87, + "learning_rate": 1.9140209171034907e-05, + "loss": 0.0045, + "step": 371130 + }, + { + "epoch": 1.87, + "learning_rate": 1.9132641478020895e-05, + "loss": 0.007, + "step": 371140 + }, + { + "epoch": 1.87, + "learning_rate": 1.9125073785006887e-05, + "loss": 0.0056, + "step": 371150 + }, + { + "epoch": 1.87, + "learning_rate": 1.9117506091992875e-05, + "loss": 0.0048, + "step": 371160 + }, + { + "epoch": 1.87, + "learning_rate": 1.9109938398978866e-05, + "loss": 0.0057, + "step": 371170 + }, + { + "epoch": 1.87, + "learning_rate": 1.910237070596485e-05, + "loss": 0.0044, + "step": 371180 + }, + { + "epoch": 1.87, + "learning_rate": 1.9094803012950843e-05, + "loss": 0.0068, + "step": 371190 + }, + { + "epoch": 1.87, + "learning_rate": 1.908723531993683e-05, + "loss": 0.0061, + "step": 371200 + }, + { + "epoch": 1.87, + "learning_rate": 1.9079667626922823e-05, + "loss": 0.007, + "step": 371210 + }, + { + "epoch": 1.87, + "learning_rate": 1.907209993390881e-05, + "loss": 0.0048, + "step": 371220 + }, + { + "epoch": 1.87, + "learning_rate": 1.9064532240894802e-05, + "loss": 0.0073, + "step": 371230 + }, + { + "epoch": 1.87, + "learning_rate": 1.905696454788079e-05, + "loss": 0.0074, + "step": 371240 + }, + { + "epoch": 1.87, + "learning_rate": 1.9049396854866782e-05, + "loss": 0.0087, + "step": 371250 + }, + { + "epoch": 1.87, + "learning_rate": 1.904182916185277e-05, + "loss": 0.0052, + "step": 371260 + }, + { + "epoch": 1.87, + "learning_rate": 1.9034261468838762e-05, + "loss": 0.0068, + "step": 371270 + }, + { + "epoch": 1.87, + "learning_rate": 1.902669377582475e-05, + "loss": 0.0055, + "step": 371280 + }, + { + "epoch": 1.87, + "learning_rate": 1.9019126082810742e-05, + "loss": 0.0033, + "step": 371290 + }, + { + "epoch": 1.87, + "learning_rate": 1.901155838979673e-05, + "loss": 0.0047, + "step": 371300 + }, + { + "epoch": 1.87, + "learning_rate": 1.9003990696782722e-05, + "loss": 0.0054, + "step": 371310 + }, + { + "epoch": 1.87, + "learning_rate": 1.899642300376871e-05, + "loss": 0.0065, + "step": 371320 + }, + { + "epoch": 1.87, + "learning_rate": 1.89888553107547e-05, + "loss": 0.0046, + "step": 371330 + }, + { + "epoch": 1.87, + "learning_rate": 1.8981287617740686e-05, + "loss": 0.0058, + "step": 371340 + }, + { + "epoch": 1.87, + "learning_rate": 1.8973719924726678e-05, + "loss": 0.0055, + "step": 371350 + }, + { + "epoch": 1.87, + "learning_rate": 1.8966152231712666e-05, + "loss": 0.0062, + "step": 371360 + }, + { + "epoch": 1.87, + "learning_rate": 1.8958584538698658e-05, + "loss": 0.0058, + "step": 371370 + }, + { + "epoch": 1.87, + "learning_rate": 1.8951016845684646e-05, + "loss": 0.0064, + "step": 371380 + }, + { + "epoch": 1.87, + "learning_rate": 1.8943449152670638e-05, + "loss": 0.0063, + "step": 371390 + }, + { + "epoch": 1.87, + "learning_rate": 1.8935881459656626e-05, + "loss": 0.0049, + "step": 371400 + }, + { + "epoch": 1.87, + "learning_rate": 1.8928313766642617e-05, + "loss": 0.0054, + "step": 371410 + }, + { + "epoch": 1.87, + "learning_rate": 1.8920746073628606e-05, + "loss": 0.0066, + "step": 371420 + }, + { + "epoch": 1.87, + "learning_rate": 1.8913178380614597e-05, + "loss": 0.0055, + "step": 371430 + }, + { + "epoch": 1.87, + "learning_rate": 1.8905610687600586e-05, + "loss": 0.0062, + "step": 371440 + }, + { + "epoch": 1.87, + "learning_rate": 1.8898042994586577e-05, + "loss": 0.0049, + "step": 371450 + }, + { + "epoch": 1.87, + "learning_rate": 1.8890475301572565e-05, + "loss": 0.0058, + "step": 371460 + }, + { + "epoch": 1.87, + "learning_rate": 1.8882907608558557e-05, + "loss": 0.0056, + "step": 371470 + }, + { + "epoch": 1.87, + "learning_rate": 1.8875339915544545e-05, + "loss": 0.005, + "step": 371480 + }, + { + "epoch": 1.87, + "learning_rate": 1.8867772222530533e-05, + "loss": 0.0057, + "step": 371490 + }, + { + "epoch": 1.87, + "learning_rate": 1.886020452951652e-05, + "loss": 0.0094, + "step": 371500 + }, + { + "epoch": 1.87, + "learning_rate": 1.8852636836502513e-05, + "loss": 0.0107, + "step": 371510 + }, + { + "epoch": 1.87, + "learning_rate": 1.88450691434885e-05, + "loss": 0.0045, + "step": 371520 + }, + { + "epoch": 1.87, + "learning_rate": 1.8837501450474493e-05, + "loss": 0.006, + "step": 371530 + }, + { + "epoch": 1.87, + "learning_rate": 1.882993375746048e-05, + "loss": 0.0068, + "step": 371540 + }, + { + "epoch": 1.87, + "learning_rate": 1.8822366064446473e-05, + "loss": 0.0079, + "step": 371550 + }, + { + "epoch": 1.87, + "learning_rate": 1.881479837143246e-05, + "loss": 0.0045, + "step": 371560 + }, + { + "epoch": 1.87, + "learning_rate": 1.8807230678418453e-05, + "loss": 0.0041, + "step": 371570 + }, + { + "epoch": 1.87, + "learning_rate": 1.879966298540444e-05, + "loss": 0.0059, + "step": 371580 + }, + { + "epoch": 1.87, + "learning_rate": 1.8792095292390433e-05, + "loss": 0.0046, + "step": 371590 + }, + { + "epoch": 1.87, + "learning_rate": 1.878452759937642e-05, + "loss": 0.0053, + "step": 371600 + }, + { + "epoch": 1.87, + "learning_rate": 1.8776959906362412e-05, + "loss": 0.0045, + "step": 371610 + }, + { + "epoch": 1.87, + "learning_rate": 1.87693922133484e-05, + "loss": 0.0053, + "step": 371620 + }, + { + "epoch": 1.87, + "learning_rate": 1.8761824520334392e-05, + "loss": 0.0049, + "step": 371630 + }, + { + "epoch": 1.87, + "learning_rate": 1.875425682732038e-05, + "loss": 0.0071, + "step": 371640 + }, + { + "epoch": 1.88, + "learning_rate": 1.874668913430637e-05, + "loss": 0.0051, + "step": 371650 + }, + { + "epoch": 1.88, + "learning_rate": 1.873912144129236e-05, + "loss": 0.004, + "step": 371660 + }, + { + "epoch": 1.88, + "learning_rate": 1.873155374827835e-05, + "loss": 0.0063, + "step": 371670 + }, + { + "epoch": 1.88, + "learning_rate": 1.872398605526434e-05, + "loss": 0.0059, + "step": 371680 + }, + { + "epoch": 1.88, + "learning_rate": 1.8716418362250328e-05, + "loss": 0.0069, + "step": 371690 + }, + { + "epoch": 1.88, + "learning_rate": 1.8708850669236316e-05, + "loss": 0.0046, + "step": 371700 + }, + { + "epoch": 1.88, + "learning_rate": 1.8701282976222308e-05, + "loss": 0.0056, + "step": 371710 + }, + { + "epoch": 1.88, + "learning_rate": 1.8693715283208296e-05, + "loss": 0.0068, + "step": 371720 + }, + { + "epoch": 1.88, + "learning_rate": 1.8686147590194288e-05, + "loss": 0.0055, + "step": 371730 + }, + { + "epoch": 1.88, + "learning_rate": 1.8678579897180276e-05, + "loss": 0.0061, + "step": 371740 + }, + { + "epoch": 1.88, + "learning_rate": 1.8671012204166268e-05, + "loss": 0.0054, + "step": 371750 + }, + { + "epoch": 1.88, + "learning_rate": 1.8663444511152256e-05, + "loss": 0.0063, + "step": 371760 + }, + { + "epoch": 1.88, + "learning_rate": 1.8655876818138244e-05, + "loss": 0.0044, + "step": 371770 + }, + { + "epoch": 1.88, + "learning_rate": 1.8648309125124232e-05, + "loss": 0.009, + "step": 371780 + }, + { + "epoch": 1.88, + "learning_rate": 1.8640741432110224e-05, + "loss": 0.0083, + "step": 371790 + }, + { + "epoch": 1.88, + "learning_rate": 1.8633173739096216e-05, + "loss": 0.0165, + "step": 371800 + }, + { + "epoch": 1.88, + "learning_rate": 1.8625606046082204e-05, + "loss": 0.004, + "step": 371810 + }, + { + "epoch": 1.88, + "learning_rate": 1.8618038353068195e-05, + "loss": 0.0045, + "step": 371820 + }, + { + "epoch": 1.88, + "learning_rate": 1.8610470660054184e-05, + "loss": 0.0055, + "step": 371830 + }, + { + "epoch": 1.88, + "learning_rate": 1.8602902967040175e-05, + "loss": 0.0069, + "step": 371840 + }, + { + "epoch": 1.88, + "learning_rate": 1.859533527402616e-05, + "loss": 0.0052, + "step": 371850 + }, + { + "epoch": 1.88, + "learning_rate": 1.8587767581012152e-05, + "loss": 0.0053, + "step": 371860 + }, + { + "epoch": 1.88, + "learning_rate": 1.858019988799814e-05, + "loss": 0.0058, + "step": 371870 + }, + { + "epoch": 1.88, + "learning_rate": 1.857263219498413e-05, + "loss": 0.0056, + "step": 371880 + }, + { + "epoch": 1.88, + "learning_rate": 1.856506450197012e-05, + "loss": 0.0041, + "step": 371890 + }, + { + "epoch": 1.88, + "learning_rate": 1.855749680895611e-05, + "loss": 0.0062, + "step": 371900 + }, + { + "epoch": 1.88, + "learning_rate": 1.85499291159421e-05, + "loss": 0.0091, + "step": 371910 + }, + { + "epoch": 1.88, + "learning_rate": 1.854236142292809e-05, + "loss": 0.0052, + "step": 371920 + }, + { + "epoch": 1.88, + "learning_rate": 1.853479372991408e-05, + "loss": 0.0055, + "step": 371930 + }, + { + "epoch": 1.88, + "learning_rate": 1.8527226036900068e-05, + "loss": 0.007, + "step": 371940 + }, + { + "epoch": 1.88, + "learning_rate": 1.851965834388606e-05, + "loss": 0.0053, + "step": 371950 + }, + { + "epoch": 1.88, + "learning_rate": 1.8512090650872047e-05, + "loss": 0.0066, + "step": 371960 + }, + { + "epoch": 1.88, + "learning_rate": 1.850452295785804e-05, + "loss": 0.0068, + "step": 371970 + }, + { + "epoch": 1.88, + "learning_rate": 1.8496955264844027e-05, + "loss": 0.0047, + "step": 371980 + }, + { + "epoch": 1.88, + "learning_rate": 1.848938757183002e-05, + "loss": 0.006, + "step": 371990 + }, + { + "epoch": 1.88, + "learning_rate": 1.8481819878816007e-05, + "loss": 0.0052, + "step": 372000 + }, + { + "epoch": 1.88, + "eval_cer": 0.914423676889143, + "eval_loss": 0.004319104366004467, + "eval_runtime": 116.6762, + "eval_samples_per_second": 17.141, + "eval_steps_per_second": 4.285, + "step": 372000 + }, + { + "epoch": 1.88, + "learning_rate": 1.8474252185801995e-05, + "loss": 0.0082, + "step": 372010 + }, + { + "epoch": 1.88, + "learning_rate": 1.8466684492787987e-05, + "loss": 0.0047, + "step": 372020 + }, + { + "epoch": 1.88, + "learning_rate": 1.8459116799773975e-05, + "loss": 0.0046, + "step": 372030 + }, + { + "epoch": 1.88, + "learning_rate": 1.8451549106759967e-05, + "loss": 0.0052, + "step": 372040 + }, + { + "epoch": 1.88, + "learning_rate": 1.8443981413745955e-05, + "loss": 0.005, + "step": 372050 + }, + { + "epoch": 1.88, + "learning_rate": 1.8436413720731947e-05, + "loss": 0.0072, + "step": 372060 + }, + { + "epoch": 1.88, + "learning_rate": 1.8428846027717935e-05, + "loss": 0.0044, + "step": 372070 + }, + { + "epoch": 1.88, + "learning_rate": 1.8421278334703923e-05, + "loss": 0.0104, + "step": 372080 + }, + { + "epoch": 1.88, + "learning_rate": 1.8413710641689915e-05, + "loss": 0.0045, + "step": 372090 + }, + { + "epoch": 1.88, + "learning_rate": 1.8406142948675903e-05, + "loss": 0.0161, + "step": 372100 + }, + { + "epoch": 1.88, + "learning_rate": 1.8398575255661894e-05, + "loss": 0.0056, + "step": 372110 + }, + { + "epoch": 1.88, + "learning_rate": 1.8391007562647883e-05, + "loss": 0.0065, + "step": 372120 + }, + { + "epoch": 1.88, + "learning_rate": 1.8383439869633874e-05, + "loss": 0.0052, + "step": 372130 + }, + { + "epoch": 1.88, + "learning_rate": 1.8375872176619862e-05, + "loss": 0.0055, + "step": 372140 + }, + { + "epoch": 1.88, + "learning_rate": 1.8368304483605854e-05, + "loss": 0.0057, + "step": 372150 + }, + { + "epoch": 1.88, + "learning_rate": 1.8360736790591842e-05, + "loss": 0.0057, + "step": 372160 + }, + { + "epoch": 1.88, + "learning_rate": 1.835316909757783e-05, + "loss": 0.0046, + "step": 372170 + }, + { + "epoch": 1.88, + "learning_rate": 1.8345601404563822e-05, + "loss": 0.006, + "step": 372180 + }, + { + "epoch": 1.88, + "learning_rate": 1.833803371154981e-05, + "loss": 0.0073, + "step": 372190 + }, + { + "epoch": 1.88, + "learning_rate": 1.8330466018535802e-05, + "loss": 0.0065, + "step": 372200 + }, + { + "epoch": 1.88, + "learning_rate": 1.832289832552179e-05, + "loss": 0.0045, + "step": 372210 + }, + { + "epoch": 1.88, + "learning_rate": 1.8315330632507782e-05, + "loss": 0.0055, + "step": 372220 + }, + { + "epoch": 1.88, + "learning_rate": 1.830776293949377e-05, + "loss": 0.0057, + "step": 372230 + }, + { + "epoch": 1.88, + "learning_rate": 1.8300195246479758e-05, + "loss": 0.0072, + "step": 372240 + }, + { + "epoch": 1.88, + "learning_rate": 1.829262755346575e-05, + "loss": 0.0058, + "step": 372250 + }, + { + "epoch": 1.88, + "learning_rate": 1.8285059860451738e-05, + "loss": 0.0052, + "step": 372260 + }, + { + "epoch": 1.88, + "learning_rate": 1.827749216743773e-05, + "loss": 0.0062, + "step": 372270 + }, + { + "epoch": 1.88, + "learning_rate": 1.8269924474423718e-05, + "loss": 0.0049, + "step": 372280 + }, + { + "epoch": 1.88, + "learning_rate": 1.826235678140971e-05, + "loss": 0.0054, + "step": 372290 + }, + { + "epoch": 1.88, + "learning_rate": 1.8254789088395698e-05, + "loss": 0.0044, + "step": 372300 + }, + { + "epoch": 1.88, + "learning_rate": 1.824722139538169e-05, + "loss": 0.0048, + "step": 372310 + }, + { + "epoch": 1.88, + "learning_rate": 1.8239653702367678e-05, + "loss": 0.007, + "step": 372320 + }, + { + "epoch": 1.88, + "learning_rate": 1.8232086009353666e-05, + "loss": 0.0065, + "step": 372330 + }, + { + "epoch": 1.88, + "learning_rate": 1.8224518316339657e-05, + "loss": 0.0048, + "step": 372340 + }, + { + "epoch": 1.88, + "learning_rate": 1.8216950623325646e-05, + "loss": 0.0063, + "step": 372350 + }, + { + "epoch": 1.88, + "learning_rate": 1.8209382930311637e-05, + "loss": 0.0089, + "step": 372360 + }, + { + "epoch": 1.88, + "learning_rate": 1.8201815237297625e-05, + "loss": 0.0054, + "step": 372370 + }, + { + "epoch": 1.88, + "learning_rate": 1.8194247544283617e-05, + "loss": 0.0057, + "step": 372380 + }, + { + "epoch": 1.88, + "learning_rate": 1.8186679851269605e-05, + "loss": 0.0048, + "step": 372390 + }, + { + "epoch": 1.88, + "learning_rate": 1.8179112158255593e-05, + "loss": 0.0066, + "step": 372400 + }, + { + "epoch": 1.88, + "learning_rate": 1.8171544465241585e-05, + "loss": 0.0072, + "step": 372410 + }, + { + "epoch": 1.88, + "learning_rate": 1.8163976772227573e-05, + "loss": 0.0058, + "step": 372420 + }, + { + "epoch": 1.88, + "learning_rate": 1.8156409079213565e-05, + "loss": 0.0051, + "step": 372430 + }, + { + "epoch": 1.88, + "learning_rate": 1.8148841386199553e-05, + "loss": 0.0044, + "step": 372440 + }, + { + "epoch": 1.88, + "learning_rate": 1.8141273693185545e-05, + "loss": 0.0075, + "step": 372450 + }, + { + "epoch": 1.88, + "learning_rate": 1.8133706000171533e-05, + "loss": 0.0039, + "step": 372460 + }, + { + "epoch": 1.88, + "learning_rate": 1.8126138307157525e-05, + "loss": 0.0068, + "step": 372470 + }, + { + "epoch": 1.88, + "learning_rate": 1.8118570614143513e-05, + "loss": 0.0055, + "step": 372480 + }, + { + "epoch": 1.88, + "learning_rate": 1.81110029211295e-05, + "loss": 0.0045, + "step": 372490 + }, + { + "epoch": 1.88, + "learning_rate": 1.8103435228115493e-05, + "loss": 0.0053, + "step": 372500 + }, + { + "epoch": 1.88, + "learning_rate": 1.809586753510148e-05, + "loss": 0.0059, + "step": 372510 + }, + { + "epoch": 1.88, + "learning_rate": 1.8088299842087472e-05, + "loss": 0.0071, + "step": 372520 + }, + { + "epoch": 1.88, + "learning_rate": 1.808073214907346e-05, + "loss": 0.0056, + "step": 372530 + }, + { + "epoch": 1.88, + "learning_rate": 1.8073164456059452e-05, + "loss": 0.0044, + "step": 372540 + }, + { + "epoch": 1.88, + "learning_rate": 1.806559676304544e-05, + "loss": 0.0078, + "step": 372550 + }, + { + "epoch": 1.88, + "learning_rate": 1.805802907003143e-05, + "loss": 0.0081, + "step": 372560 + }, + { + "epoch": 1.88, + "learning_rate": 1.805046137701742e-05, + "loss": 0.0048, + "step": 372570 + }, + { + "epoch": 1.88, + "learning_rate": 1.804289368400341e-05, + "loss": 0.0059, + "step": 372580 + }, + { + "epoch": 1.88, + "learning_rate": 1.80353259909894e-05, + "loss": 0.0039, + "step": 372590 + }, + { + "epoch": 1.88, + "learning_rate": 1.802775829797539e-05, + "loss": 0.005, + "step": 372600 + }, + { + "epoch": 1.88, + "learning_rate": 1.802019060496138e-05, + "loss": 0.0049, + "step": 372610 + }, + { + "epoch": 1.88, + "learning_rate": 1.8012622911947368e-05, + "loss": 0.0064, + "step": 372620 + }, + { + "epoch": 1.88, + "learning_rate": 1.8005055218933356e-05, + "loss": 0.0047, + "step": 372630 + }, + { + "epoch": 1.88, + "learning_rate": 1.7997487525919348e-05, + "loss": 0.0055, + "step": 372640 + }, + { + "epoch": 1.88, + "learning_rate": 1.7989919832905336e-05, + "loss": 0.0057, + "step": 372650 + }, + { + "epoch": 1.88, + "learning_rate": 1.7982352139891328e-05, + "loss": 0.0072, + "step": 372660 + }, + { + "epoch": 1.88, + "learning_rate": 1.7974784446877316e-05, + "loss": 0.0048, + "step": 372670 + }, + { + "epoch": 1.88, + "learning_rate": 1.7967216753863308e-05, + "loss": 0.0052, + "step": 372680 + }, + { + "epoch": 1.88, + "learning_rate": 1.7959649060849296e-05, + "loss": 0.0037, + "step": 372690 + }, + { + "epoch": 1.88, + "learning_rate": 1.7952081367835287e-05, + "loss": 0.0057, + "step": 372700 + }, + { + "epoch": 1.88, + "learning_rate": 1.7944513674821272e-05, + "loss": 0.004, + "step": 372710 + }, + { + "epoch": 1.88, + "learning_rate": 1.7936945981807264e-05, + "loss": 0.0043, + "step": 372720 + }, + { + "epoch": 1.88, + "learning_rate": 1.7929378288793252e-05, + "loss": 0.0063, + "step": 372730 + }, + { + "epoch": 1.88, + "learning_rate": 1.7921810595779244e-05, + "loss": 0.0068, + "step": 372740 + }, + { + "epoch": 1.88, + "learning_rate": 1.7914242902765232e-05, + "loss": 0.0064, + "step": 372750 + }, + { + "epoch": 1.88, + "learning_rate": 1.7906675209751224e-05, + "loss": 0.0071, + "step": 372760 + }, + { + "epoch": 1.88, + "learning_rate": 1.7899107516737215e-05, + "loss": 0.0064, + "step": 372770 + }, + { + "epoch": 1.88, + "learning_rate": 1.7891539823723203e-05, + "loss": 0.0056, + "step": 372780 + }, + { + "epoch": 1.88, + "learning_rate": 1.788397213070919e-05, + "loss": 0.0047, + "step": 372790 + }, + { + "epoch": 1.88, + "learning_rate": 1.787640443769518e-05, + "loss": 0.0042, + "step": 372800 + }, + { + "epoch": 1.88, + "learning_rate": 1.786883674468117e-05, + "loss": 0.0075, + "step": 372810 + }, + { + "epoch": 1.88, + "learning_rate": 1.786126905166716e-05, + "loss": 0.004, + "step": 372820 + }, + { + "epoch": 1.88, + "learning_rate": 1.785370135865315e-05, + "loss": 0.0065, + "step": 372830 + }, + { + "epoch": 1.88, + "learning_rate": 1.784613366563914e-05, + "loss": 0.0063, + "step": 372840 + }, + { + "epoch": 1.88, + "learning_rate": 1.783856597262513e-05, + "loss": 0.006, + "step": 372850 + }, + { + "epoch": 1.88, + "learning_rate": 1.783099827961112e-05, + "loss": 0.0049, + "step": 372860 + }, + { + "epoch": 1.88, + "learning_rate": 1.7823430586597108e-05, + "loss": 0.0045, + "step": 372870 + }, + { + "epoch": 1.88, + "learning_rate": 1.78158628935831e-05, + "loss": 0.0057, + "step": 372880 + }, + { + "epoch": 1.88, + "learning_rate": 1.7808295200569087e-05, + "loss": 0.0073, + "step": 372890 + }, + { + "epoch": 1.88, + "learning_rate": 1.780072750755508e-05, + "loss": 0.0043, + "step": 372900 + }, + { + "epoch": 1.88, + "learning_rate": 1.7793159814541067e-05, + "loss": 0.0058, + "step": 372910 + }, + { + "epoch": 1.88, + "learning_rate": 1.778559212152706e-05, + "loss": 0.0074, + "step": 372920 + }, + { + "epoch": 1.88, + "learning_rate": 1.7778024428513047e-05, + "loss": 0.0053, + "step": 372930 + }, + { + "epoch": 1.88, + "learning_rate": 1.777045673549904e-05, + "loss": 0.0078, + "step": 372940 + }, + { + "epoch": 1.88, + "learning_rate": 1.7762889042485027e-05, + "loss": 0.005, + "step": 372950 + }, + { + "epoch": 1.88, + "learning_rate": 1.7755321349471015e-05, + "loss": 0.0051, + "step": 372960 + }, + { + "epoch": 1.88, + "learning_rate": 1.7747753656457007e-05, + "loss": 0.0078, + "step": 372970 + }, + { + "epoch": 1.88, + "learning_rate": 1.7740185963442995e-05, + "loss": 0.006, + "step": 372980 + }, + { + "epoch": 1.88, + "learning_rate": 1.7732618270428986e-05, + "loss": 0.0034, + "step": 372990 + }, + { + "epoch": 1.88, + "learning_rate": 1.7725050577414975e-05, + "loss": 0.0082, + "step": 373000 + }, + { + "epoch": 1.88, + "eval_cer": 0.9144353216426477, + "eval_loss": 0.00432598264887929, + "eval_runtime": 116.7735, + "eval_samples_per_second": 17.127, + "eval_steps_per_second": 4.282, + "step": 373000 + }, + { + "epoch": 1.88, + "learning_rate": 1.7717482884400966e-05, + "loss": 0.009, + "step": 373010 + }, + { + "epoch": 1.88, + "learning_rate": 1.7709915191386954e-05, + "loss": 0.0066, + "step": 373020 + }, + { + "epoch": 1.88, + "learning_rate": 1.7702347498372943e-05, + "loss": 0.0064, + "step": 373030 + }, + { + "epoch": 1.88, + "learning_rate": 1.7694779805358934e-05, + "loss": 0.0052, + "step": 373040 + }, + { + "epoch": 1.88, + "learning_rate": 1.7687212112344923e-05, + "loss": 0.01, + "step": 373050 + }, + { + "epoch": 1.88, + "learning_rate": 1.7679644419330914e-05, + "loss": 0.0044, + "step": 373060 + }, + { + "epoch": 1.88, + "learning_rate": 1.7672076726316902e-05, + "loss": 0.0077, + "step": 373070 + }, + { + "epoch": 1.88, + "learning_rate": 1.7664509033302894e-05, + "loss": 0.0049, + "step": 373080 + }, + { + "epoch": 1.88, + "learning_rate": 1.7656941340288882e-05, + "loss": 0.007, + "step": 373090 + }, + { + "epoch": 1.88, + "learning_rate": 1.764937364727487e-05, + "loss": 0.006, + "step": 373100 + }, + { + "epoch": 1.88, + "learning_rate": 1.7641805954260862e-05, + "loss": 0.0057, + "step": 373110 + }, + { + "epoch": 1.88, + "learning_rate": 1.763423826124685e-05, + "loss": 0.0048, + "step": 373120 + }, + { + "epoch": 1.88, + "learning_rate": 1.7626670568232842e-05, + "loss": 0.0064, + "step": 373130 + }, + { + "epoch": 1.88, + "learning_rate": 1.761910287521883e-05, + "loss": 0.0047, + "step": 373140 + }, + { + "epoch": 1.88, + "learning_rate": 1.761153518220482e-05, + "loss": 0.0072, + "step": 373150 + }, + { + "epoch": 1.88, + "learning_rate": 1.760396748919081e-05, + "loss": 0.0076, + "step": 373160 + }, + { + "epoch": 1.88, + "learning_rate": 1.75963997961768e-05, + "loss": 0.0067, + "step": 373170 + }, + { + "epoch": 1.88, + "learning_rate": 1.758883210316279e-05, + "loss": 0.0056, + "step": 373180 + }, + { + "epoch": 1.88, + "learning_rate": 1.7581264410148778e-05, + "loss": 0.0055, + "step": 373190 + }, + { + "epoch": 1.88, + "learning_rate": 1.757369671713477e-05, + "loss": 0.0044, + "step": 373200 + }, + { + "epoch": 1.88, + "learning_rate": 1.7566129024120758e-05, + "loss": 0.006, + "step": 373210 + }, + { + "epoch": 1.88, + "learning_rate": 1.755856133110675e-05, + "loss": 0.0072, + "step": 373220 + }, + { + "epoch": 1.88, + "learning_rate": 1.7550993638092738e-05, + "loss": 0.0051, + "step": 373230 + }, + { + "epoch": 1.88, + "learning_rate": 1.754342594507873e-05, + "loss": 0.0062, + "step": 373240 + }, + { + "epoch": 1.88, + "learning_rate": 1.7535858252064717e-05, + "loss": 0.0054, + "step": 373250 + }, + { + "epoch": 1.88, + "learning_rate": 1.7528290559050706e-05, + "loss": 0.0049, + "step": 373260 + }, + { + "epoch": 1.88, + "learning_rate": 1.7520722866036697e-05, + "loss": 0.0063, + "step": 373270 + }, + { + "epoch": 1.88, + "learning_rate": 1.7513155173022685e-05, + "loss": 0.007, + "step": 373280 + }, + { + "epoch": 1.88, + "learning_rate": 1.7505587480008677e-05, + "loss": 0.0078, + "step": 373290 + }, + { + "epoch": 1.88, + "learning_rate": 1.7498019786994665e-05, + "loss": 0.0065, + "step": 373300 + }, + { + "epoch": 1.88, + "learning_rate": 1.7490452093980657e-05, + "loss": 0.0074, + "step": 373310 + }, + { + "epoch": 1.88, + "learning_rate": 1.7482884400966645e-05, + "loss": 0.0038, + "step": 373320 + }, + { + "epoch": 1.88, + "learning_rate": 1.7475316707952637e-05, + "loss": 0.0068, + "step": 373330 + }, + { + "epoch": 1.88, + "learning_rate": 1.7467749014938625e-05, + "loss": 0.0052, + "step": 373340 + }, + { + "epoch": 1.88, + "learning_rate": 1.7460181321924613e-05, + "loss": 0.0068, + "step": 373350 + }, + { + "epoch": 1.88, + "learning_rate": 1.7452613628910605e-05, + "loss": 0.0049, + "step": 373360 + }, + { + "epoch": 1.88, + "learning_rate": 1.7445045935896593e-05, + "loss": 0.0066, + "step": 373370 + }, + { + "epoch": 1.88, + "learning_rate": 1.7437478242882585e-05, + "loss": 0.0049, + "step": 373380 + }, + { + "epoch": 1.88, + "learning_rate": 1.7429910549868573e-05, + "loss": 0.0058, + "step": 373390 + }, + { + "epoch": 1.88, + "learning_rate": 1.7422342856854564e-05, + "loss": 0.0051, + "step": 373400 + }, + { + "epoch": 1.88, + "learning_rate": 1.7414775163840553e-05, + "loss": 0.0069, + "step": 373410 + }, + { + "epoch": 1.88, + "learning_rate": 1.740720747082654e-05, + "loss": 0.0064, + "step": 373420 + }, + { + "epoch": 1.88, + "learning_rate": 1.7399639777812532e-05, + "loss": 0.0065, + "step": 373430 + }, + { + "epoch": 1.88, + "learning_rate": 1.739207208479852e-05, + "loss": 0.0067, + "step": 373440 + }, + { + "epoch": 1.88, + "learning_rate": 1.7384504391784512e-05, + "loss": 0.0053, + "step": 373450 + }, + { + "epoch": 1.88, + "learning_rate": 1.73769366987705e-05, + "loss": 0.0046, + "step": 373460 + }, + { + "epoch": 1.88, + "learning_rate": 1.7369369005756492e-05, + "loss": 0.0067, + "step": 373470 + }, + { + "epoch": 1.88, + "learning_rate": 1.736180131274248e-05, + "loss": 0.0057, + "step": 373480 + }, + { + "epoch": 1.88, + "learning_rate": 1.7354233619728472e-05, + "loss": 0.006, + "step": 373490 + }, + { + "epoch": 1.88, + "learning_rate": 1.734666592671446e-05, + "loss": 0.0041, + "step": 373500 + }, + { + "epoch": 1.88, + "learning_rate": 1.733909823370045e-05, + "loss": 0.0062, + "step": 373510 + }, + { + "epoch": 1.88, + "learning_rate": 1.733153054068644e-05, + "loss": 0.0064, + "step": 373520 + }, + { + "epoch": 1.88, + "learning_rate": 1.7323962847672428e-05, + "loss": 0.006, + "step": 373530 + }, + { + "epoch": 1.88, + "learning_rate": 1.731639515465842e-05, + "loss": 0.0067, + "step": 373540 + }, + { + "epoch": 1.88, + "learning_rate": 1.7308827461644408e-05, + "loss": 0.0062, + "step": 373550 + }, + { + "epoch": 1.88, + "learning_rate": 1.73012597686304e-05, + "loss": 0.0057, + "step": 373560 + }, + { + "epoch": 1.88, + "learning_rate": 1.7293692075616388e-05, + "loss": 0.0058, + "step": 373570 + }, + { + "epoch": 1.88, + "learning_rate": 1.7286124382602376e-05, + "loss": 0.0061, + "step": 373580 + }, + { + "epoch": 1.88, + "learning_rate": 1.7278556689588364e-05, + "loss": 0.005, + "step": 373590 + }, + { + "epoch": 1.88, + "learning_rate": 1.7270988996574356e-05, + "loss": 0.0078, + "step": 373600 + }, + { + "epoch": 1.88, + "learning_rate": 1.7263421303560347e-05, + "loss": 0.0081, + "step": 373610 + }, + { + "epoch": 1.88, + "learning_rate": 1.7255853610546336e-05, + "loss": 0.006, + "step": 373620 + }, + { + "epoch": 1.89, + "learning_rate": 1.7248285917532327e-05, + "loss": 0.0054, + "step": 373630 + }, + { + "epoch": 1.89, + "learning_rate": 1.7240718224518316e-05, + "loss": 0.0055, + "step": 373640 + }, + { + "epoch": 1.89, + "learning_rate": 1.7233150531504304e-05, + "loss": 0.0077, + "step": 373650 + }, + { + "epoch": 1.89, + "learning_rate": 1.7225582838490292e-05, + "loss": 0.0061, + "step": 373660 + }, + { + "epoch": 1.89, + "learning_rate": 1.7218015145476284e-05, + "loss": 0.0067, + "step": 373670 + }, + { + "epoch": 1.89, + "learning_rate": 1.7210447452462272e-05, + "loss": 0.0044, + "step": 373680 + }, + { + "epoch": 1.89, + "learning_rate": 1.7202879759448263e-05, + "loss": 0.0076, + "step": 373690 + }, + { + "epoch": 1.89, + "learning_rate": 1.719531206643425e-05, + "loss": 0.004, + "step": 373700 + }, + { + "epoch": 1.89, + "learning_rate": 1.7187744373420243e-05, + "loss": 0.0059, + "step": 373710 + }, + { + "epoch": 1.89, + "learning_rate": 1.718017668040623e-05, + "loss": 0.0082, + "step": 373720 + }, + { + "epoch": 1.89, + "learning_rate": 1.717260898739222e-05, + "loss": 0.0071, + "step": 373730 + }, + { + "epoch": 1.89, + "learning_rate": 1.716504129437821e-05, + "loss": 0.0061, + "step": 373740 + }, + { + "epoch": 1.89, + "learning_rate": 1.71574736013642e-05, + "loss": 0.0046, + "step": 373750 + }, + { + "epoch": 1.89, + "learning_rate": 1.714990590835019e-05, + "loss": 0.0051, + "step": 373760 + }, + { + "epoch": 1.89, + "learning_rate": 1.714233821533618e-05, + "loss": 0.005, + "step": 373770 + }, + { + "epoch": 1.89, + "learning_rate": 1.713477052232217e-05, + "loss": 0.0053, + "step": 373780 + }, + { + "epoch": 1.89, + "learning_rate": 1.712720282930816e-05, + "loss": 0.0062, + "step": 373790 + }, + { + "epoch": 1.89, + "learning_rate": 1.711963513629415e-05, + "loss": 0.0068, + "step": 373800 + }, + { + "epoch": 1.89, + "learning_rate": 1.711206744328014e-05, + "loss": 0.0082, + "step": 373810 + }, + { + "epoch": 1.89, + "learning_rate": 1.7104499750266127e-05, + "loss": 0.0077, + "step": 373820 + }, + { + "epoch": 1.89, + "learning_rate": 1.709693205725212e-05, + "loss": 0.0064, + "step": 373830 + }, + { + "epoch": 1.89, + "learning_rate": 1.7089364364238107e-05, + "loss": 0.0068, + "step": 373840 + }, + { + "epoch": 1.89, + "learning_rate": 1.70817966712241e-05, + "loss": 0.0057, + "step": 373850 + }, + { + "epoch": 1.89, + "learning_rate": 1.7074228978210087e-05, + "loss": 0.0046, + "step": 373860 + }, + { + "epoch": 1.89, + "learning_rate": 1.706666128519608e-05, + "loss": 0.0052, + "step": 373870 + }, + { + "epoch": 1.89, + "learning_rate": 1.7059093592182067e-05, + "loss": 0.0073, + "step": 373880 + }, + { + "epoch": 1.89, + "learning_rate": 1.7051525899168055e-05, + "loss": 0.005, + "step": 373890 + }, + { + "epoch": 1.89, + "learning_rate": 1.7043958206154047e-05, + "loss": 0.0065, + "step": 373900 + }, + { + "epoch": 1.89, + "learning_rate": 1.7036390513140035e-05, + "loss": 0.0049, + "step": 373910 + }, + { + "epoch": 1.89, + "learning_rate": 1.7028822820126026e-05, + "loss": 0.0044, + "step": 373920 + }, + { + "epoch": 1.89, + "learning_rate": 1.7021255127112015e-05, + "loss": 0.005, + "step": 373930 + }, + { + "epoch": 1.89, + "learning_rate": 1.7013687434098006e-05, + "loss": 0.0069, + "step": 373940 + }, + { + "epoch": 1.89, + "learning_rate": 1.7006119741083994e-05, + "loss": 0.0076, + "step": 373950 + }, + { + "epoch": 1.89, + "learning_rate": 1.6998552048069986e-05, + "loss": 0.0046, + "step": 373960 + }, + { + "epoch": 1.89, + "learning_rate": 1.6990984355055974e-05, + "loss": 0.0064, + "step": 373970 + }, + { + "epoch": 1.89, + "learning_rate": 1.6983416662041962e-05, + "loss": 0.0059, + "step": 373980 + }, + { + "epoch": 1.89, + "learning_rate": 1.6975848969027954e-05, + "loss": 0.0058, + "step": 373990 + }, + { + "epoch": 1.89, + "learning_rate": 1.6968281276013942e-05, + "loss": 0.005, + "step": 374000 + }, + { + "epoch": 1.89, + "eval_cer": 0.9144294992658953, + "eval_loss": 0.004294942133128643, + "eval_runtime": 116.742, + "eval_samples_per_second": 17.132, + "eval_steps_per_second": 4.283, + "step": 374000 + }, + { + "epoch": 1.89, + "learning_rate": 1.6960713582999934e-05, + "loss": 0.0042, + "step": 374010 + }, + { + "epoch": 1.89, + "learning_rate": 1.6953145889985922e-05, + "loss": 0.0059, + "step": 374020 + }, + { + "epoch": 1.89, + "learning_rate": 1.6945578196971914e-05, + "loss": 0.0079, + "step": 374030 + }, + { + "epoch": 1.89, + "learning_rate": 1.6938010503957902e-05, + "loss": 0.0031, + "step": 374040 + }, + { + "epoch": 1.89, + "learning_rate": 1.693044281094389e-05, + "loss": 0.0058, + "step": 374050 + }, + { + "epoch": 1.89, + "learning_rate": 1.6922875117929882e-05, + "loss": 0.0061, + "step": 374060 + }, + { + "epoch": 1.89, + "learning_rate": 1.691530742491587e-05, + "loss": 0.0053, + "step": 374070 + }, + { + "epoch": 1.89, + "learning_rate": 1.690773973190186e-05, + "loss": 0.0054, + "step": 374080 + }, + { + "epoch": 1.89, + "learning_rate": 1.690017203888785e-05, + "loss": 0.0043, + "step": 374090 + }, + { + "epoch": 1.89, + "learning_rate": 1.689260434587384e-05, + "loss": 0.0077, + "step": 374100 + }, + { + "epoch": 1.89, + "learning_rate": 1.688503665285983e-05, + "loss": 0.0062, + "step": 374110 + }, + { + "epoch": 1.89, + "learning_rate": 1.687746895984582e-05, + "loss": 0.0052, + "step": 374120 + }, + { + "epoch": 1.89, + "learning_rate": 1.686990126683181e-05, + "loss": 0.0058, + "step": 374130 + }, + { + "epoch": 1.89, + "learning_rate": 1.6862333573817798e-05, + "loss": 0.0059, + "step": 374140 + }, + { + "epoch": 1.89, + "learning_rate": 1.685476588080379e-05, + "loss": 0.0068, + "step": 374150 + }, + { + "epoch": 1.89, + "learning_rate": 1.6847198187789777e-05, + "loss": 0.0053, + "step": 374160 + }, + { + "epoch": 1.89, + "learning_rate": 1.683963049477577e-05, + "loss": 0.005, + "step": 374170 + }, + { + "epoch": 1.89, + "learning_rate": 1.6832062801761757e-05, + "loss": 0.0045, + "step": 374180 + }, + { + "epoch": 1.89, + "learning_rate": 1.682449510874775e-05, + "loss": 0.0035, + "step": 374190 + }, + { + "epoch": 1.89, + "learning_rate": 1.6816927415733737e-05, + "loss": 0.0072, + "step": 374200 + }, + { + "epoch": 1.89, + "learning_rate": 1.6809359722719725e-05, + "loss": 0.0059, + "step": 374210 + }, + { + "epoch": 1.89, + "learning_rate": 1.6801792029705717e-05, + "loss": 0.0056, + "step": 374220 + }, + { + "epoch": 1.89, + "learning_rate": 1.6794224336691705e-05, + "loss": 0.0065, + "step": 374230 + }, + { + "epoch": 1.89, + "learning_rate": 1.6786656643677697e-05, + "loss": 0.0052, + "step": 374240 + }, + { + "epoch": 1.89, + "learning_rate": 1.6779088950663685e-05, + "loss": 0.0047, + "step": 374250 + }, + { + "epoch": 1.89, + "learning_rate": 1.6771521257649677e-05, + "loss": 0.0054, + "step": 374260 + }, + { + "epoch": 1.89, + "learning_rate": 1.6763953564635665e-05, + "loss": 0.006, + "step": 374270 + }, + { + "epoch": 1.89, + "learning_rate": 1.6756385871621653e-05, + "loss": 0.0059, + "step": 374280 + }, + { + "epoch": 1.89, + "learning_rate": 1.6748818178607645e-05, + "loss": 0.0045, + "step": 374290 + }, + { + "epoch": 1.89, + "learning_rate": 1.6741250485593633e-05, + "loss": 0.0076, + "step": 374300 + }, + { + "epoch": 1.89, + "learning_rate": 1.6733682792579624e-05, + "loss": 0.0044, + "step": 374310 + }, + { + "epoch": 1.89, + "learning_rate": 1.6726115099565613e-05, + "loss": 0.0056, + "step": 374320 + }, + { + "epoch": 1.89, + "learning_rate": 1.6718547406551604e-05, + "loss": 0.0053, + "step": 374330 + }, + { + "epoch": 1.89, + "learning_rate": 1.6710979713537593e-05, + "loss": 0.0071, + "step": 374340 + }, + { + "epoch": 1.89, + "learning_rate": 1.6703412020523584e-05, + "loss": 0.0051, + "step": 374350 + }, + { + "epoch": 1.89, + "learning_rate": 1.6695844327509572e-05, + "loss": 0.0064, + "step": 374360 + }, + { + "epoch": 1.89, + "learning_rate": 1.668827663449556e-05, + "loss": 0.006, + "step": 374370 + }, + { + "epoch": 1.89, + "learning_rate": 1.6680708941481552e-05, + "loss": 0.0049, + "step": 374380 + }, + { + "epoch": 1.89, + "learning_rate": 1.667314124846754e-05, + "loss": 0.0083, + "step": 374390 + }, + { + "epoch": 1.89, + "learning_rate": 1.6665573555453532e-05, + "loss": 0.004, + "step": 374400 + }, + { + "epoch": 1.89, + "learning_rate": 1.665800586243952e-05, + "loss": 0.0063, + "step": 374410 + }, + { + "epoch": 1.89, + "learning_rate": 1.6650438169425512e-05, + "loss": 0.0058, + "step": 374420 + }, + { + "epoch": 1.89, + "learning_rate": 1.66428704764115e-05, + "loss": 0.0054, + "step": 374430 + }, + { + "epoch": 1.89, + "learning_rate": 1.6635302783397488e-05, + "loss": 0.006, + "step": 374440 + }, + { + "epoch": 1.89, + "learning_rate": 1.6627735090383476e-05, + "loss": 0.0062, + "step": 374450 + }, + { + "epoch": 1.89, + "learning_rate": 1.6620167397369468e-05, + "loss": 0.0064, + "step": 374460 + }, + { + "epoch": 1.89, + "learning_rate": 1.661259970435546e-05, + "loss": 0.007, + "step": 374470 + }, + { + "epoch": 1.89, + "learning_rate": 1.6605032011341448e-05, + "loss": 0.0066, + "step": 374480 + }, + { + "epoch": 1.89, + "learning_rate": 1.659746431832744e-05, + "loss": 0.0079, + "step": 374490 + }, + { + "epoch": 1.89, + "learning_rate": 1.6589896625313428e-05, + "loss": 0.0062, + "step": 374500 + }, + { + "epoch": 1.89, + "learning_rate": 1.658232893229942e-05, + "loss": 0.0062, + "step": 374510 + }, + { + "epoch": 1.89, + "learning_rate": 1.6574761239285404e-05, + "loss": 0.0063, + "step": 374520 + }, + { + "epoch": 1.89, + "learning_rate": 1.6567193546271396e-05, + "loss": 0.0057, + "step": 374530 + }, + { + "epoch": 1.89, + "learning_rate": 1.6559625853257384e-05, + "loss": 0.0049, + "step": 374540 + }, + { + "epoch": 1.89, + "learning_rate": 1.6552058160243376e-05, + "loss": 0.0063, + "step": 374550 + }, + { + "epoch": 1.89, + "learning_rate": 1.6544490467229364e-05, + "loss": 0.0048, + "step": 374560 + }, + { + "epoch": 1.89, + "learning_rate": 1.6536922774215355e-05, + "loss": 0.0062, + "step": 374570 + }, + { + "epoch": 1.89, + "learning_rate": 1.6529355081201347e-05, + "loss": 0.0056, + "step": 374580 + }, + { + "epoch": 1.89, + "learning_rate": 1.6521787388187335e-05, + "loss": 0.0056, + "step": 374590 + }, + { + "epoch": 1.89, + "learning_rate": 1.6514219695173323e-05, + "loss": 0.0063, + "step": 374600 + }, + { + "epoch": 1.89, + "learning_rate": 1.650665200215931e-05, + "loss": 0.0079, + "step": 374610 + }, + { + "epoch": 1.89, + "learning_rate": 1.6499084309145303e-05, + "loss": 0.0066, + "step": 374620 + }, + { + "epoch": 1.89, + "learning_rate": 1.649151661613129e-05, + "loss": 0.0052, + "step": 374630 + }, + { + "epoch": 1.89, + "learning_rate": 1.6483948923117283e-05, + "loss": 0.0071, + "step": 374640 + }, + { + "epoch": 1.89, + "learning_rate": 1.647638123010327e-05, + "loss": 0.0079, + "step": 374650 + }, + { + "epoch": 1.89, + "learning_rate": 1.6468813537089263e-05, + "loss": 0.0065, + "step": 374660 + }, + { + "epoch": 1.89, + "learning_rate": 1.646124584407525e-05, + "loss": 0.0049, + "step": 374670 + }, + { + "epoch": 1.89, + "learning_rate": 1.645367815106124e-05, + "loss": 0.0061, + "step": 374680 + }, + { + "epoch": 1.89, + "learning_rate": 1.644611045804723e-05, + "loss": 0.005, + "step": 374690 + }, + { + "epoch": 1.89, + "learning_rate": 1.643854276503322e-05, + "loss": 0.0061, + "step": 374700 + }, + { + "epoch": 1.89, + "learning_rate": 1.643097507201921e-05, + "loss": 0.0047, + "step": 374710 + }, + { + "epoch": 1.89, + "learning_rate": 1.64234073790052e-05, + "loss": 0.0055, + "step": 374720 + }, + { + "epoch": 1.89, + "learning_rate": 1.641583968599119e-05, + "loss": 0.0053, + "step": 374730 + }, + { + "epoch": 1.89, + "learning_rate": 1.640827199297718e-05, + "loss": 0.0048, + "step": 374740 + }, + { + "epoch": 1.89, + "learning_rate": 1.6400704299963167e-05, + "loss": 0.0046, + "step": 374750 + }, + { + "epoch": 1.89, + "learning_rate": 1.639313660694916e-05, + "loss": 0.0041, + "step": 374760 + }, + { + "epoch": 1.89, + "learning_rate": 1.6385568913935147e-05, + "loss": 0.0056, + "step": 374770 + }, + { + "epoch": 1.89, + "learning_rate": 1.637800122092114e-05, + "loss": 0.0044, + "step": 374780 + }, + { + "epoch": 1.89, + "learning_rate": 1.6370433527907127e-05, + "loss": 0.0046, + "step": 374790 + }, + { + "epoch": 1.89, + "learning_rate": 1.636286583489312e-05, + "loss": 0.0075, + "step": 374800 + }, + { + "epoch": 1.89, + "learning_rate": 1.6355298141879107e-05, + "loss": 0.006, + "step": 374810 + }, + { + "epoch": 1.89, + "learning_rate": 1.6347730448865098e-05, + "loss": 0.0051, + "step": 374820 + }, + { + "epoch": 1.89, + "learning_rate": 1.6340162755851086e-05, + "loss": 0.0054, + "step": 374830 + }, + { + "epoch": 1.89, + "learning_rate": 1.6332595062837075e-05, + "loss": 0.0064, + "step": 374840 + }, + { + "epoch": 1.89, + "learning_rate": 1.6325027369823066e-05, + "loss": 0.0064, + "step": 374850 + }, + { + "epoch": 1.89, + "learning_rate": 1.6317459676809054e-05, + "loss": 0.007, + "step": 374860 + }, + { + "epoch": 1.89, + "learning_rate": 1.6309891983795046e-05, + "loss": 0.0051, + "step": 374870 + }, + { + "epoch": 1.89, + "learning_rate": 1.6302324290781034e-05, + "loss": 0.005, + "step": 374880 + }, + { + "epoch": 1.89, + "learning_rate": 1.6294756597767026e-05, + "loss": 0.0071, + "step": 374890 + }, + { + "epoch": 1.89, + "learning_rate": 1.6287188904753014e-05, + "loss": 0.0054, + "step": 374900 + }, + { + "epoch": 1.89, + "learning_rate": 1.6279621211739002e-05, + "loss": 0.0075, + "step": 374910 + }, + { + "epoch": 1.89, + "learning_rate": 1.6272053518724994e-05, + "loss": 0.0051, + "step": 374920 + }, + { + "epoch": 1.89, + "learning_rate": 1.6264485825710982e-05, + "loss": 0.0049, + "step": 374930 + }, + { + "epoch": 1.89, + "learning_rate": 1.6256918132696974e-05, + "loss": 0.0071, + "step": 374940 + }, + { + "epoch": 1.89, + "learning_rate": 1.6249350439682962e-05, + "loss": 0.0059, + "step": 374950 + }, + { + "epoch": 1.89, + "learning_rate": 1.6241782746668954e-05, + "loss": 0.005, + "step": 374960 + }, + { + "epoch": 1.89, + "learning_rate": 1.6234215053654942e-05, + "loss": 0.0062, + "step": 374970 + }, + { + "epoch": 1.89, + "learning_rate": 1.6226647360640933e-05, + "loss": 0.0058, + "step": 374980 + }, + { + "epoch": 1.89, + "learning_rate": 1.621907966762692e-05, + "loss": 0.0066, + "step": 374990 + }, + { + "epoch": 1.89, + "learning_rate": 1.621151197461291e-05, + "loss": 0.0035, + "step": 375000 + }, + { + "epoch": 1.89, + "eval_cer": 0.9144246472852683, + "eval_loss": 0.004302851855754852, + "eval_runtime": 116.6099, + "eval_samples_per_second": 17.151, + "eval_steps_per_second": 4.288, + "step": 375000 + }, + { + "epoch": 1.89, + "learning_rate": 1.62039442815989e-05, + "loss": 0.0051, + "step": 375010 + }, + { + "epoch": 1.89, + "learning_rate": 1.619637658858489e-05, + "loss": 0.0057, + "step": 375020 + }, + { + "epoch": 1.89, + "learning_rate": 1.618880889557088e-05, + "loss": 0.0052, + "step": 375030 + }, + { + "epoch": 1.89, + "learning_rate": 1.618124120255687e-05, + "loss": 0.0053, + "step": 375040 + }, + { + "epoch": 1.89, + "learning_rate": 1.617367350954286e-05, + "loss": 0.0054, + "step": 375050 + }, + { + "epoch": 1.89, + "learning_rate": 1.616610581652885e-05, + "loss": 0.0044, + "step": 375060 + }, + { + "epoch": 1.89, + "learning_rate": 1.6158538123514838e-05, + "loss": 0.0039, + "step": 375070 + }, + { + "epoch": 1.89, + "learning_rate": 1.615097043050083e-05, + "loss": 0.0069, + "step": 375080 + }, + { + "epoch": 1.89, + "learning_rate": 1.6143402737486817e-05, + "loss": 0.0047, + "step": 375090 + }, + { + "epoch": 1.89, + "learning_rate": 1.613583504447281e-05, + "loss": 0.0051, + "step": 375100 + }, + { + "epoch": 1.89, + "learning_rate": 1.6128267351458797e-05, + "loss": 0.0064, + "step": 375110 + }, + { + "epoch": 1.89, + "learning_rate": 1.612069965844479e-05, + "loss": 0.0064, + "step": 375120 + }, + { + "epoch": 1.89, + "learning_rate": 1.6113131965430777e-05, + "loss": 0.0069, + "step": 375130 + }, + { + "epoch": 1.89, + "learning_rate": 1.610556427241677e-05, + "loss": 0.0057, + "step": 375140 + }, + { + "epoch": 1.89, + "learning_rate": 1.6097996579402757e-05, + "loss": 0.0064, + "step": 375150 + }, + { + "epoch": 1.89, + "learning_rate": 1.6090428886388745e-05, + "loss": 0.0045, + "step": 375160 + }, + { + "epoch": 1.89, + "learning_rate": 1.6082861193374737e-05, + "loss": 0.0057, + "step": 375170 + }, + { + "epoch": 1.89, + "learning_rate": 1.6075293500360725e-05, + "loss": 0.0056, + "step": 375180 + }, + { + "epoch": 1.89, + "learning_rate": 1.6067725807346716e-05, + "loss": 0.0059, + "step": 375190 + }, + { + "epoch": 1.89, + "learning_rate": 1.6060158114332705e-05, + "loss": 0.004, + "step": 375200 + }, + { + "epoch": 1.89, + "learning_rate": 1.6052590421318696e-05, + "loss": 0.0067, + "step": 375210 + }, + { + "epoch": 1.89, + "learning_rate": 1.6045022728304685e-05, + "loss": 0.0041, + "step": 375220 + }, + { + "epoch": 1.89, + "learning_rate": 1.6037455035290673e-05, + "loss": 0.0059, + "step": 375230 + }, + { + "epoch": 1.89, + "learning_rate": 1.6029887342276664e-05, + "loss": 0.0071, + "step": 375240 + }, + { + "epoch": 1.89, + "learning_rate": 1.6022319649262653e-05, + "loss": 0.0047, + "step": 375250 + }, + { + "epoch": 1.89, + "learning_rate": 1.6014751956248644e-05, + "loss": 0.0063, + "step": 375260 + }, + { + "epoch": 1.89, + "learning_rate": 1.6007184263234632e-05, + "loss": 0.0051, + "step": 375270 + }, + { + "epoch": 1.89, + "learning_rate": 1.5999616570220624e-05, + "loss": 0.0044, + "step": 375280 + }, + { + "epoch": 1.89, + "learning_rate": 1.5992048877206612e-05, + "loss": 0.0046, + "step": 375290 + }, + { + "epoch": 1.89, + "learning_rate": 1.59844811841926e-05, + "loss": 0.0056, + "step": 375300 + }, + { + "epoch": 1.89, + "learning_rate": 1.5976913491178592e-05, + "loss": 0.0068, + "step": 375310 + }, + { + "epoch": 1.89, + "learning_rate": 1.596934579816458e-05, + "loss": 0.0062, + "step": 375320 + }, + { + "epoch": 1.89, + "learning_rate": 1.5961778105150572e-05, + "loss": 0.006, + "step": 375330 + }, + { + "epoch": 1.89, + "learning_rate": 1.595421041213656e-05, + "loss": 0.0062, + "step": 375340 + }, + { + "epoch": 1.89, + "learning_rate": 1.594664271912255e-05, + "loss": 0.0052, + "step": 375350 + }, + { + "epoch": 1.89, + "learning_rate": 1.593907502610854e-05, + "loss": 0.0079, + "step": 375360 + }, + { + "epoch": 1.89, + "learning_rate": 1.593150733309453e-05, + "loss": 0.0071, + "step": 375370 + }, + { + "epoch": 1.89, + "learning_rate": 1.5923939640080516e-05, + "loss": 0.0059, + "step": 375380 + }, + { + "epoch": 1.89, + "learning_rate": 1.5916371947066508e-05, + "loss": 0.0042, + "step": 375390 + }, + { + "epoch": 1.89, + "learning_rate": 1.5908804254052496e-05, + "loss": 0.0058, + "step": 375400 + }, + { + "epoch": 1.89, + "learning_rate": 1.5901236561038488e-05, + "loss": 0.0061, + "step": 375410 + }, + { + "epoch": 1.89, + "learning_rate": 1.5893668868024476e-05, + "loss": 0.0058, + "step": 375420 + }, + { + "epoch": 1.89, + "learning_rate": 1.5886101175010468e-05, + "loss": 0.0049, + "step": 375430 + }, + { + "epoch": 1.89, + "learning_rate": 1.587853348199646e-05, + "loss": 0.0052, + "step": 375440 + }, + { + "epoch": 1.89, + "learning_rate": 1.5870965788982447e-05, + "loss": 0.0041, + "step": 375450 + }, + { + "epoch": 1.89, + "learning_rate": 1.5863398095968436e-05, + "loss": 0.0063, + "step": 375460 + }, + { + "epoch": 1.89, + "learning_rate": 1.5855830402954424e-05, + "loss": 0.005, + "step": 375470 + }, + { + "epoch": 1.89, + "learning_rate": 1.5848262709940415e-05, + "loss": 0.0061, + "step": 375480 + }, + { + "epoch": 1.89, + "learning_rate": 1.5840695016926404e-05, + "loss": 0.0067, + "step": 375490 + }, + { + "epoch": 1.89, + "learning_rate": 1.5833127323912395e-05, + "loss": 0.0048, + "step": 375500 + }, + { + "epoch": 1.89, + "learning_rate": 1.5825559630898384e-05, + "loss": 0.0054, + "step": 375510 + }, + { + "epoch": 1.89, + "learning_rate": 1.5817991937884375e-05, + "loss": 0.0052, + "step": 375520 + }, + { + "epoch": 1.89, + "learning_rate": 1.5810424244870363e-05, + "loss": 0.0053, + "step": 375530 + }, + { + "epoch": 1.89, + "learning_rate": 1.580285655185635e-05, + "loss": 0.0062, + "step": 375540 + }, + { + "epoch": 1.89, + "learning_rate": 1.5795288858842343e-05, + "loss": 0.0054, + "step": 375550 + }, + { + "epoch": 1.89, + "learning_rate": 1.578772116582833e-05, + "loss": 0.0073, + "step": 375560 + }, + { + "epoch": 1.89, + "learning_rate": 1.5780153472814323e-05, + "loss": 0.0057, + "step": 375570 + }, + { + "epoch": 1.89, + "learning_rate": 1.577258577980031e-05, + "loss": 0.0052, + "step": 375580 + }, + { + "epoch": 1.89, + "learning_rate": 1.5765018086786303e-05, + "loss": 0.004, + "step": 375590 + }, + { + "epoch": 1.89, + "learning_rate": 1.575745039377229e-05, + "loss": 0.0067, + "step": 375600 + }, + { + "epoch": 1.89, + "learning_rate": 1.5749882700758283e-05, + "loss": 0.0062, + "step": 375610 + }, + { + "epoch": 1.9, + "learning_rate": 1.574231500774427e-05, + "loss": 0.0053, + "step": 375620 + }, + { + "epoch": 1.9, + "learning_rate": 1.573474731473026e-05, + "loss": 0.0049, + "step": 375630 + }, + { + "epoch": 1.9, + "learning_rate": 1.572717962171625e-05, + "loss": 0.0058, + "step": 375640 + }, + { + "epoch": 1.9, + "learning_rate": 1.571961192870224e-05, + "loss": 0.005, + "step": 375650 + }, + { + "epoch": 1.9, + "learning_rate": 1.571204423568823e-05, + "loss": 0.0058, + "step": 375660 + }, + { + "epoch": 1.9, + "learning_rate": 1.570447654267422e-05, + "loss": 0.0064, + "step": 375670 + }, + { + "epoch": 1.9, + "learning_rate": 1.569690884966021e-05, + "loss": 0.0066, + "step": 375680 + }, + { + "epoch": 1.9, + "learning_rate": 1.56893411566462e-05, + "loss": 0.0049, + "step": 375690 + }, + { + "epoch": 1.9, + "learning_rate": 1.5681773463632187e-05, + "loss": 0.0051, + "step": 375700 + }, + { + "epoch": 1.9, + "learning_rate": 1.567420577061818e-05, + "loss": 0.0056, + "step": 375710 + }, + { + "epoch": 1.9, + "learning_rate": 1.5666638077604167e-05, + "loss": 0.0035, + "step": 375720 + }, + { + "epoch": 1.9, + "learning_rate": 1.5659070384590158e-05, + "loss": 0.0052, + "step": 375730 + }, + { + "epoch": 1.9, + "learning_rate": 1.5651502691576146e-05, + "loss": 0.0059, + "step": 375740 + }, + { + "epoch": 1.9, + "learning_rate": 1.5643934998562138e-05, + "loss": 0.0076, + "step": 375750 + }, + { + "epoch": 1.9, + "learning_rate": 1.5636367305548126e-05, + "loss": 0.0041, + "step": 375760 + }, + { + "epoch": 1.9, + "learning_rate": 1.5628799612534114e-05, + "loss": 0.0043, + "step": 375770 + }, + { + "epoch": 1.9, + "learning_rate": 1.5621231919520106e-05, + "loss": 0.0064, + "step": 375780 + }, + { + "epoch": 1.9, + "learning_rate": 1.5613664226506094e-05, + "loss": 0.0046, + "step": 375790 + }, + { + "epoch": 1.9, + "learning_rate": 1.5606096533492086e-05, + "loss": 0.0054, + "step": 375800 + }, + { + "epoch": 1.9, + "learning_rate": 1.5598528840478074e-05, + "loss": 0.0068, + "step": 375810 + }, + { + "epoch": 1.9, + "learning_rate": 1.5590961147464066e-05, + "loss": 0.0063, + "step": 375820 + }, + { + "epoch": 1.9, + "learning_rate": 1.5583393454450054e-05, + "loss": 0.0072, + "step": 375830 + }, + { + "epoch": 1.9, + "learning_rate": 1.5575825761436046e-05, + "loss": 0.0037, + "step": 375840 + }, + { + "epoch": 1.9, + "learning_rate": 1.5568258068422034e-05, + "loss": 0.0055, + "step": 375850 + }, + { + "epoch": 1.9, + "learning_rate": 1.5560690375408022e-05, + "loss": 0.0044, + "step": 375860 + }, + { + "epoch": 1.9, + "learning_rate": 1.5553122682394014e-05, + "loss": 0.0048, + "step": 375870 + }, + { + "epoch": 1.9, + "learning_rate": 1.5545554989380002e-05, + "loss": 0.0044, + "step": 375880 + }, + { + "epoch": 1.9, + "learning_rate": 1.5537987296365993e-05, + "loss": 0.0063, + "step": 375890 + }, + { + "epoch": 1.9, + "learning_rate": 1.553041960335198e-05, + "loss": 0.0047, + "step": 375900 + }, + { + "epoch": 1.9, + "learning_rate": 1.5522851910337973e-05, + "loss": 0.0063, + "step": 375910 + }, + { + "epoch": 1.9, + "learning_rate": 1.551528421732396e-05, + "loss": 0.0056, + "step": 375920 + }, + { + "epoch": 1.9, + "learning_rate": 1.550771652430995e-05, + "loss": 0.0064, + "step": 375930 + }, + { + "epoch": 1.9, + "learning_rate": 1.550014883129594e-05, + "loss": 0.0052, + "step": 375940 + }, + { + "epoch": 1.9, + "learning_rate": 1.549258113828193e-05, + "loss": 0.0049, + "step": 375950 + }, + { + "epoch": 1.9, + "learning_rate": 1.548501344526792e-05, + "loss": 0.005, + "step": 375960 + }, + { + "epoch": 1.9, + "learning_rate": 1.547744575225391e-05, + "loss": 0.0057, + "step": 375970 + }, + { + "epoch": 1.9, + "learning_rate": 1.54698780592399e-05, + "loss": 0.0068, + "step": 375980 + }, + { + "epoch": 1.9, + "learning_rate": 1.546231036622589e-05, + "loss": 0.0051, + "step": 375990 + }, + { + "epoch": 1.9, + "learning_rate": 1.545474267321188e-05, + "loss": 0.007, + "step": 376000 + }, + { + "epoch": 1.9, + "eval_cer": 0.9144372624348985, + "eval_loss": 0.00426588486880064, + "eval_runtime": 116.7025, + "eval_samples_per_second": 17.138, + "eval_steps_per_second": 4.284, + "step": 376000 + }, + { + "epoch": 1.9, + "learning_rate": 1.544717498019787e-05, + "loss": 0.0051, + "step": 376010 + }, + { + "epoch": 1.9, + "learning_rate": 1.5439607287183857e-05, + "loss": 0.0062, + "step": 376020 + }, + { + "epoch": 1.9, + "learning_rate": 1.543203959416985e-05, + "loss": 0.007, + "step": 376030 + }, + { + "epoch": 1.9, + "learning_rate": 1.5424471901155837e-05, + "loss": 0.0059, + "step": 376040 + }, + { + "epoch": 1.9, + "learning_rate": 1.541690420814183e-05, + "loss": 0.0052, + "step": 376050 + }, + { + "epoch": 1.9, + "learning_rate": 1.5409336515127817e-05, + "loss": 0.0059, + "step": 376060 + }, + { + "epoch": 1.9, + "learning_rate": 1.540176882211381e-05, + "loss": 0.0059, + "step": 376070 + }, + { + "epoch": 1.9, + "learning_rate": 1.5394201129099797e-05, + "loss": 0.0055, + "step": 376080 + }, + { + "epoch": 1.9, + "learning_rate": 1.5386633436085785e-05, + "loss": 0.0061, + "step": 376090 + }, + { + "epoch": 1.9, + "learning_rate": 1.5379065743071777e-05, + "loss": 0.0052, + "step": 376100 + }, + { + "epoch": 1.9, + "learning_rate": 1.5371498050057765e-05, + "loss": 0.0053, + "step": 376110 + }, + { + "epoch": 1.9, + "learning_rate": 1.5363930357043756e-05, + "loss": 0.0046, + "step": 376120 + }, + { + "epoch": 1.9, + "learning_rate": 1.5356362664029745e-05, + "loss": 0.0064, + "step": 376130 + }, + { + "epoch": 1.9, + "learning_rate": 1.5348794971015736e-05, + "loss": 0.0044, + "step": 376140 + }, + { + "epoch": 1.9, + "learning_rate": 1.5341227278001724e-05, + "loss": 0.0044, + "step": 376150 + }, + { + "epoch": 1.9, + "learning_rate": 1.5333659584987716e-05, + "loss": 0.0042, + "step": 376160 + }, + { + "epoch": 1.9, + "learning_rate": 1.5326091891973704e-05, + "loss": 0.0039, + "step": 376170 + }, + { + "epoch": 1.9, + "learning_rate": 1.5318524198959692e-05, + "loss": 0.0047, + "step": 376180 + }, + { + "epoch": 1.9, + "learning_rate": 1.5310956505945684e-05, + "loss": 0.0049, + "step": 376190 + }, + { + "epoch": 1.9, + "learning_rate": 1.5303388812931672e-05, + "loss": 0.0053, + "step": 376200 + }, + { + "epoch": 1.9, + "learning_rate": 1.5295821119917664e-05, + "loss": 0.0056, + "step": 376210 + }, + { + "epoch": 1.9, + "learning_rate": 1.5288253426903652e-05, + "loss": 0.0061, + "step": 376220 + }, + { + "epoch": 1.9, + "learning_rate": 1.5280685733889644e-05, + "loss": 0.0065, + "step": 376230 + }, + { + "epoch": 1.9, + "learning_rate": 1.5273118040875632e-05, + "loss": 0.0102, + "step": 376240 + }, + { + "epoch": 1.9, + "learning_rate": 1.526555034786162e-05, + "loss": 0.0057, + "step": 376250 + }, + { + "epoch": 1.9, + "learning_rate": 1.525798265484761e-05, + "loss": 0.0055, + "step": 376260 + }, + { + "epoch": 1.9, + "learning_rate": 1.52504149618336e-05, + "loss": 0.005, + "step": 376270 + }, + { + "epoch": 1.9, + "learning_rate": 1.524284726881959e-05, + "loss": 0.0069, + "step": 376280 + }, + { + "epoch": 1.9, + "learning_rate": 1.523527957580558e-05, + "loss": 0.0043, + "step": 376290 + }, + { + "epoch": 1.9, + "learning_rate": 1.522771188279157e-05, + "loss": 0.0059, + "step": 376300 + }, + { + "epoch": 1.9, + "learning_rate": 1.522014418977756e-05, + "loss": 0.0059, + "step": 376310 + }, + { + "epoch": 1.9, + "learning_rate": 1.5212576496763548e-05, + "loss": 0.0053, + "step": 376320 + }, + { + "epoch": 1.9, + "learning_rate": 1.5205008803749538e-05, + "loss": 0.0053, + "step": 376330 + }, + { + "epoch": 1.9, + "learning_rate": 1.5197441110735528e-05, + "loss": 0.0055, + "step": 376340 + }, + { + "epoch": 1.9, + "learning_rate": 1.5189873417721518e-05, + "loss": 0.0096, + "step": 376350 + }, + { + "epoch": 1.9, + "learning_rate": 1.5182305724707507e-05, + "loss": 0.0047, + "step": 376360 + }, + { + "epoch": 1.9, + "learning_rate": 1.5174738031693497e-05, + "loss": 0.0077, + "step": 376370 + }, + { + "epoch": 1.9, + "learning_rate": 1.5167170338679487e-05, + "loss": 0.0059, + "step": 376380 + }, + { + "epoch": 1.9, + "learning_rate": 1.5159602645665477e-05, + "loss": 0.0048, + "step": 376390 + }, + { + "epoch": 1.9, + "learning_rate": 1.5152034952651465e-05, + "loss": 0.0047, + "step": 376400 + }, + { + "epoch": 1.9, + "learning_rate": 1.5144467259637455e-05, + "loss": 0.0052, + "step": 376410 + }, + { + "epoch": 1.9, + "learning_rate": 1.5136899566623445e-05, + "loss": 0.0065, + "step": 376420 + }, + { + "epoch": 1.9, + "learning_rate": 1.5129331873609435e-05, + "loss": 0.0057, + "step": 376430 + }, + { + "epoch": 1.9, + "learning_rate": 1.5121764180595425e-05, + "loss": 0.0065, + "step": 376440 + }, + { + "epoch": 1.9, + "learning_rate": 1.5114196487581415e-05, + "loss": 0.0052, + "step": 376450 + }, + { + "epoch": 1.9, + "learning_rate": 1.5106628794567405e-05, + "loss": 0.0064, + "step": 376460 + }, + { + "epoch": 1.9, + "learning_rate": 1.5099061101553395e-05, + "loss": 0.0043, + "step": 376470 + }, + { + "epoch": 1.9, + "learning_rate": 1.5091493408539383e-05, + "loss": 0.0062, + "step": 376480 + }, + { + "epoch": 1.9, + "learning_rate": 1.5083925715525373e-05, + "loss": 0.0058, + "step": 376490 + }, + { + "epoch": 1.9, + "learning_rate": 1.5076358022511363e-05, + "loss": 0.0042, + "step": 376500 + }, + { + "epoch": 1.9, + "learning_rate": 1.5068790329497353e-05, + "loss": 0.0052, + "step": 376510 + }, + { + "epoch": 1.9, + "learning_rate": 1.5061222636483343e-05, + "loss": 0.0057, + "step": 376520 + }, + { + "epoch": 1.9, + "learning_rate": 1.5053654943469333e-05, + "loss": 0.0062, + "step": 376530 + }, + { + "epoch": 1.9, + "learning_rate": 1.5046087250455323e-05, + "loss": 0.0065, + "step": 376540 + }, + { + "epoch": 1.9, + "learning_rate": 1.5038519557441312e-05, + "loss": 0.0051, + "step": 376550 + }, + { + "epoch": 1.9, + "learning_rate": 1.50309518644273e-05, + "loss": 0.005, + "step": 376560 + }, + { + "epoch": 1.9, + "learning_rate": 1.502338417141329e-05, + "loss": 0.0055, + "step": 376570 + }, + { + "epoch": 1.9, + "learning_rate": 1.501581647839928e-05, + "loss": 0.0056, + "step": 376580 + }, + { + "epoch": 1.9, + "learning_rate": 1.500824878538527e-05, + "loss": 0.004, + "step": 376590 + }, + { + "epoch": 1.9, + "learning_rate": 1.500068109237126e-05, + "loss": 0.0054, + "step": 376600 + }, + { + "epoch": 1.9, + "learning_rate": 1.499311339935725e-05, + "loss": 0.0044, + "step": 376610 + }, + { + "epoch": 1.9, + "learning_rate": 1.498554570634324e-05, + "loss": 0.0058, + "step": 376620 + }, + { + "epoch": 1.9, + "learning_rate": 1.497797801332923e-05, + "loss": 0.0052, + "step": 376630 + }, + { + "epoch": 1.9, + "learning_rate": 1.4970410320315218e-05, + "loss": 0.0049, + "step": 376640 + }, + { + "epoch": 1.9, + "learning_rate": 1.4962842627301208e-05, + "loss": 0.0058, + "step": 376650 + }, + { + "epoch": 1.9, + "learning_rate": 1.4955274934287198e-05, + "loss": 0.0054, + "step": 376660 + }, + { + "epoch": 1.9, + "learning_rate": 1.4947707241273188e-05, + "loss": 0.0058, + "step": 376670 + }, + { + "epoch": 1.9, + "learning_rate": 1.4940139548259178e-05, + "loss": 0.0055, + "step": 376680 + }, + { + "epoch": 1.9, + "learning_rate": 1.4932571855245168e-05, + "loss": 0.0069, + "step": 376690 + }, + { + "epoch": 1.9, + "learning_rate": 1.4925004162231158e-05, + "loss": 0.0054, + "step": 376700 + }, + { + "epoch": 1.9, + "learning_rate": 1.4917436469217148e-05, + "loss": 0.0048, + "step": 376710 + }, + { + "epoch": 1.9, + "learning_rate": 1.4909868776203134e-05, + "loss": 0.0048, + "step": 376720 + }, + { + "epoch": 1.9, + "learning_rate": 1.4902301083189124e-05, + "loss": 0.0055, + "step": 376730 + }, + { + "epoch": 1.9, + "learning_rate": 1.4894733390175114e-05, + "loss": 0.0057, + "step": 376740 + }, + { + "epoch": 1.9, + "learning_rate": 1.4887165697161104e-05, + "loss": 0.005, + "step": 376750 + }, + { + "epoch": 1.9, + "learning_rate": 1.4879598004147096e-05, + "loss": 0.0063, + "step": 376760 + }, + { + "epoch": 1.9, + "learning_rate": 1.4872030311133085e-05, + "loss": 0.0076, + "step": 376770 + }, + { + "epoch": 1.9, + "learning_rate": 1.4864462618119075e-05, + "loss": 0.0053, + "step": 376780 + }, + { + "epoch": 1.9, + "learning_rate": 1.4856894925105065e-05, + "loss": 0.0055, + "step": 376790 + }, + { + "epoch": 1.9, + "learning_rate": 1.4849327232091052e-05, + "loss": 0.0052, + "step": 376800 + }, + { + "epoch": 1.9, + "learning_rate": 1.4841759539077042e-05, + "loss": 0.0058, + "step": 376810 + }, + { + "epoch": 1.9, + "learning_rate": 1.4834191846063032e-05, + "loss": 0.005, + "step": 376820 + }, + { + "epoch": 1.9, + "learning_rate": 1.4826624153049022e-05, + "loss": 0.008, + "step": 376830 + }, + { + "epoch": 1.9, + "learning_rate": 1.4819056460035011e-05, + "loss": 0.0047, + "step": 376840 + }, + { + "epoch": 1.9, + "learning_rate": 1.4811488767021001e-05, + "loss": 0.0055, + "step": 376850 + }, + { + "epoch": 1.9, + "learning_rate": 1.4803921074006991e-05, + "loss": 0.0083, + "step": 376860 + }, + { + "epoch": 1.9, + "learning_rate": 1.479635338099298e-05, + "loss": 0.0069, + "step": 376870 + }, + { + "epoch": 1.9, + "learning_rate": 1.478878568797897e-05, + "loss": 0.0048, + "step": 376880 + }, + { + "epoch": 1.9, + "learning_rate": 1.478121799496496e-05, + "loss": 0.006, + "step": 376890 + }, + { + "epoch": 1.9, + "learning_rate": 1.477365030195095e-05, + "loss": 0.0044, + "step": 376900 + }, + { + "epoch": 1.9, + "learning_rate": 1.4766082608936939e-05, + "loss": 0.0079, + "step": 376910 + }, + { + "epoch": 1.9, + "learning_rate": 1.4758514915922929e-05, + "loss": 0.0053, + "step": 376920 + }, + { + "epoch": 1.9, + "learning_rate": 1.4750947222908919e-05, + "loss": 0.0064, + "step": 376930 + }, + { + "epoch": 1.9, + "learning_rate": 1.4743379529894909e-05, + "loss": 0.0052, + "step": 376940 + }, + { + "epoch": 1.9, + "learning_rate": 1.4735811836880897e-05, + "loss": 0.0055, + "step": 376950 + }, + { + "epoch": 1.9, + "learning_rate": 1.4728244143866887e-05, + "loss": 0.0059, + "step": 376960 + }, + { + "epoch": 1.9, + "learning_rate": 1.4720676450852877e-05, + "loss": 0.0049, + "step": 376970 + }, + { + "epoch": 1.9, + "learning_rate": 1.4713108757838867e-05, + "loss": 0.005, + "step": 376980 + }, + { + "epoch": 1.9, + "learning_rate": 1.4705541064824857e-05, + "loss": 0.0065, + "step": 376990 + }, + { + "epoch": 1.9, + "learning_rate": 1.4697973371810847e-05, + "loss": 0.0067, + "step": 377000 + }, + { + "epoch": 1.9, + "eval_cer": 0.914438232831024, + "eval_loss": 0.004278304520994425, + "eval_runtime": 116.1202, + "eval_samples_per_second": 17.224, + "eval_steps_per_second": 4.306, + "step": 377000 + }, + { + "epoch": 1.9, + "learning_rate": 1.4690405678796837e-05, + "loss": 0.0054, + "step": 377010 + }, + { + "epoch": 1.9, + "learning_rate": 1.4682837985782826e-05, + "loss": 0.0067, + "step": 377020 + }, + { + "epoch": 1.9, + "learning_rate": 1.4675270292768815e-05, + "loss": 0.0035, + "step": 377030 + }, + { + "epoch": 1.9, + "learning_rate": 1.4667702599754805e-05, + "loss": 0.0054, + "step": 377040 + }, + { + "epoch": 1.9, + "learning_rate": 1.4660134906740795e-05, + "loss": 0.0046, + "step": 377050 + }, + { + "epoch": 1.9, + "learning_rate": 1.4652567213726784e-05, + "loss": 0.0062, + "step": 377060 + }, + { + "epoch": 1.9, + "learning_rate": 1.4644999520712774e-05, + "loss": 0.0048, + "step": 377070 + }, + { + "epoch": 1.9, + "learning_rate": 1.4637431827698764e-05, + "loss": 0.0047, + "step": 377080 + }, + { + "epoch": 1.9, + "learning_rate": 1.4629864134684754e-05, + "loss": 0.0055, + "step": 377090 + }, + { + "epoch": 1.9, + "learning_rate": 1.4622296441670744e-05, + "loss": 0.0066, + "step": 377100 + }, + { + "epoch": 1.9, + "learning_rate": 1.4614728748656732e-05, + "loss": 0.005, + "step": 377110 + }, + { + "epoch": 1.9, + "learning_rate": 1.4607161055642722e-05, + "loss": 0.0054, + "step": 377120 + }, + { + "epoch": 1.9, + "learning_rate": 1.4599593362628712e-05, + "loss": 0.0084, + "step": 377130 + }, + { + "epoch": 1.9, + "learning_rate": 1.4592025669614702e-05, + "loss": 0.0059, + "step": 377140 + }, + { + "epoch": 1.9, + "learning_rate": 1.4584457976600692e-05, + "loss": 0.0052, + "step": 377150 + }, + { + "epoch": 1.9, + "learning_rate": 1.4576890283586682e-05, + "loss": 0.0065, + "step": 377160 + }, + { + "epoch": 1.9, + "learning_rate": 1.4569322590572672e-05, + "loss": 0.0059, + "step": 377170 + }, + { + "epoch": 1.9, + "learning_rate": 1.4561754897558662e-05, + "loss": 0.0045, + "step": 377180 + }, + { + "epoch": 1.9, + "learning_rate": 1.455418720454465e-05, + "loss": 0.0083, + "step": 377190 + }, + { + "epoch": 1.9, + "learning_rate": 1.454661951153064e-05, + "loss": 0.007, + "step": 377200 + }, + { + "epoch": 1.9, + "learning_rate": 1.453905181851663e-05, + "loss": 0.0055, + "step": 377210 + }, + { + "epoch": 1.9, + "learning_rate": 1.453148412550262e-05, + "loss": 0.0081, + "step": 377220 + }, + { + "epoch": 1.9, + "learning_rate": 1.452391643248861e-05, + "loss": 0.0065, + "step": 377230 + }, + { + "epoch": 1.9, + "learning_rate": 1.45163487394746e-05, + "loss": 0.0076, + "step": 377240 + }, + { + "epoch": 1.9, + "learning_rate": 1.450878104646059e-05, + "loss": 0.0056, + "step": 377250 + }, + { + "epoch": 1.9, + "learning_rate": 1.450121335344658e-05, + "loss": 0.0068, + "step": 377260 + }, + { + "epoch": 1.9, + "learning_rate": 1.4493645660432568e-05, + "loss": 0.0073, + "step": 377270 + }, + { + "epoch": 1.9, + "learning_rate": 1.4486077967418557e-05, + "loss": 0.0083, + "step": 377280 + }, + { + "epoch": 1.9, + "learning_rate": 1.4478510274404547e-05, + "loss": 0.0058, + "step": 377290 + }, + { + "epoch": 1.9, + "learning_rate": 1.4470942581390537e-05, + "loss": 0.0064, + "step": 377300 + }, + { + "epoch": 1.9, + "learning_rate": 1.4463374888376527e-05, + "loss": 0.0052, + "step": 377310 + }, + { + "epoch": 1.9, + "learning_rate": 1.4455807195362517e-05, + "loss": 0.006, + "step": 377320 + }, + { + "epoch": 1.9, + "learning_rate": 1.4448239502348507e-05, + "loss": 0.0077, + "step": 377330 + }, + { + "epoch": 1.9, + "learning_rate": 1.4440671809334497e-05, + "loss": 0.0063, + "step": 377340 + }, + { + "epoch": 1.9, + "learning_rate": 1.4433104116320485e-05, + "loss": 0.0042, + "step": 377350 + }, + { + "epoch": 1.9, + "learning_rate": 1.4425536423306475e-05, + "loss": 0.0047, + "step": 377360 + }, + { + "epoch": 1.9, + "learning_rate": 1.4417968730292465e-05, + "loss": 0.0038, + "step": 377370 + }, + { + "epoch": 1.9, + "learning_rate": 1.4410401037278455e-05, + "loss": 0.0051, + "step": 377380 + }, + { + "epoch": 1.9, + "learning_rate": 1.4402833344264445e-05, + "loss": 0.0039, + "step": 377390 + }, + { + "epoch": 1.9, + "learning_rate": 1.4395265651250435e-05, + "loss": 0.0038, + "step": 377400 + }, + { + "epoch": 1.9, + "learning_rate": 1.4387697958236425e-05, + "loss": 0.0047, + "step": 377410 + }, + { + "epoch": 1.9, + "learning_rate": 1.4380130265222413e-05, + "loss": 0.006, + "step": 377420 + }, + { + "epoch": 1.9, + "learning_rate": 1.4372562572208403e-05, + "loss": 0.0039, + "step": 377430 + }, + { + "epoch": 1.9, + "learning_rate": 1.4364994879194393e-05, + "loss": 0.0058, + "step": 377440 + }, + { + "epoch": 1.9, + "learning_rate": 1.4357427186180383e-05, + "loss": 0.0046, + "step": 377450 + }, + { + "epoch": 1.9, + "learning_rate": 1.4349859493166372e-05, + "loss": 0.0064, + "step": 377460 + }, + { + "epoch": 1.9, + "learning_rate": 1.4342291800152362e-05, + "loss": 0.0051, + "step": 377470 + }, + { + "epoch": 1.9, + "learning_rate": 1.4334724107138352e-05, + "loss": 0.0056, + "step": 377480 + }, + { + "epoch": 1.9, + "learning_rate": 1.4327156414124342e-05, + "loss": 0.0068, + "step": 377490 + }, + { + "epoch": 1.9, + "learning_rate": 1.431958872111033e-05, + "loss": 0.0058, + "step": 377500 + }, + { + "epoch": 1.9, + "learning_rate": 1.431202102809632e-05, + "loss": 0.0063, + "step": 377510 + }, + { + "epoch": 1.9, + "learning_rate": 1.430445333508231e-05, + "loss": 0.0049, + "step": 377520 + }, + { + "epoch": 1.9, + "learning_rate": 1.42968856420683e-05, + "loss": 0.0058, + "step": 377530 + }, + { + "epoch": 1.9, + "learning_rate": 1.428931794905429e-05, + "loss": 0.0053, + "step": 377540 + }, + { + "epoch": 1.9, + "learning_rate": 1.428175025604028e-05, + "loss": 0.0036, + "step": 377550 + }, + { + "epoch": 1.9, + "learning_rate": 1.427418256302627e-05, + "loss": 0.006, + "step": 377560 + }, + { + "epoch": 1.9, + "learning_rate": 1.426661487001226e-05, + "loss": 0.007, + "step": 377570 + }, + { + "epoch": 1.9, + "learning_rate": 1.4259047176998246e-05, + "loss": 0.0068, + "step": 377580 + }, + { + "epoch": 1.9, + "learning_rate": 1.4251479483984236e-05, + "loss": 0.0052, + "step": 377590 + }, + { + "epoch": 1.91, + "learning_rate": 1.4243911790970228e-05, + "loss": 0.0048, + "step": 377600 + }, + { + "epoch": 1.91, + "learning_rate": 1.4236344097956218e-05, + "loss": 0.0057, + "step": 377610 + }, + { + "epoch": 1.91, + "learning_rate": 1.4228776404942208e-05, + "loss": 0.0043, + "step": 377620 + }, + { + "epoch": 1.91, + "learning_rate": 1.4221208711928198e-05, + "loss": 0.0073, + "step": 377630 + }, + { + "epoch": 1.91, + "learning_rate": 1.4213641018914188e-05, + "loss": 0.0061, + "step": 377640 + }, + { + "epoch": 1.91, + "learning_rate": 1.4206073325900177e-05, + "loss": 0.0057, + "step": 377650 + }, + { + "epoch": 1.91, + "learning_rate": 1.4198505632886164e-05, + "loss": 0.005, + "step": 377660 + }, + { + "epoch": 1.91, + "learning_rate": 1.4190937939872154e-05, + "loss": 0.0076, + "step": 377670 + }, + { + "epoch": 1.91, + "learning_rate": 1.4183370246858144e-05, + "loss": 0.0052, + "step": 377680 + }, + { + "epoch": 1.91, + "learning_rate": 1.4175802553844134e-05, + "loss": 0.0049, + "step": 377690 + }, + { + "epoch": 1.91, + "learning_rate": 1.4168234860830124e-05, + "loss": 0.0046, + "step": 377700 + }, + { + "epoch": 1.91, + "learning_rate": 1.4160667167816114e-05, + "loss": 0.0049, + "step": 377710 + }, + { + "epoch": 1.91, + "learning_rate": 1.4153099474802103e-05, + "loss": 0.0055, + "step": 377720 + }, + { + "epoch": 1.91, + "learning_rate": 1.4145531781788095e-05, + "loss": 0.0061, + "step": 377730 + }, + { + "epoch": 1.91, + "learning_rate": 1.4137964088774082e-05, + "loss": 0.0067, + "step": 377740 + }, + { + "epoch": 1.91, + "learning_rate": 1.4130396395760071e-05, + "loss": 0.0042, + "step": 377750 + }, + { + "epoch": 1.91, + "learning_rate": 1.4122828702746061e-05, + "loss": 0.0064, + "step": 377760 + }, + { + "epoch": 1.91, + "learning_rate": 1.4115261009732051e-05, + "loss": 0.0064, + "step": 377770 + }, + { + "epoch": 1.91, + "learning_rate": 1.4107693316718041e-05, + "loss": 0.0043, + "step": 377780 + }, + { + "epoch": 1.91, + "learning_rate": 1.4100125623704031e-05, + "loss": 0.0062, + "step": 377790 + }, + { + "epoch": 1.91, + "learning_rate": 1.4092557930690021e-05, + "loss": 0.0046, + "step": 377800 + }, + { + "epoch": 1.91, + "learning_rate": 1.4084990237676011e-05, + "loss": 0.0038, + "step": 377810 + }, + { + "epoch": 1.91, + "learning_rate": 1.4077422544662e-05, + "loss": 0.0044, + "step": 377820 + }, + { + "epoch": 1.91, + "learning_rate": 1.4069854851647989e-05, + "loss": 0.0046, + "step": 377830 + }, + { + "epoch": 1.91, + "learning_rate": 1.4062287158633979e-05, + "loss": 0.0045, + "step": 377840 + }, + { + "epoch": 1.91, + "learning_rate": 1.4054719465619969e-05, + "loss": 0.0054, + "step": 377850 + }, + { + "epoch": 1.91, + "learning_rate": 1.4047151772605959e-05, + "loss": 0.0057, + "step": 377860 + }, + { + "epoch": 1.91, + "learning_rate": 1.4039584079591949e-05, + "loss": 0.0057, + "step": 377870 + }, + { + "epoch": 1.91, + "learning_rate": 1.4032016386577939e-05, + "loss": 0.0059, + "step": 377880 + }, + { + "epoch": 1.91, + "learning_rate": 1.4024448693563929e-05, + "loss": 0.0071, + "step": 377890 + }, + { + "epoch": 1.91, + "learning_rate": 1.4016881000549917e-05, + "loss": 0.0063, + "step": 377900 + }, + { + "epoch": 1.91, + "learning_rate": 1.4009313307535907e-05, + "loss": 0.006, + "step": 377910 + }, + { + "epoch": 1.91, + "learning_rate": 1.4001745614521897e-05, + "loss": 0.0038, + "step": 377920 + }, + { + "epoch": 1.91, + "learning_rate": 1.3994177921507887e-05, + "loss": 0.0055, + "step": 377930 + }, + { + "epoch": 1.91, + "learning_rate": 1.3986610228493876e-05, + "loss": 0.0048, + "step": 377940 + }, + { + "epoch": 1.91, + "learning_rate": 1.3979042535479866e-05, + "loss": 0.0058, + "step": 377950 + }, + { + "epoch": 1.91, + "learning_rate": 1.3971474842465856e-05, + "loss": 0.0068, + "step": 377960 + }, + { + "epoch": 1.91, + "learning_rate": 1.3963907149451844e-05, + "loss": 0.006, + "step": 377970 + }, + { + "epoch": 1.91, + "learning_rate": 1.3956339456437834e-05, + "loss": 0.0067, + "step": 377980 + }, + { + "epoch": 1.91, + "learning_rate": 1.3948771763423824e-05, + "loss": 0.0065, + "step": 377990 + }, + { + "epoch": 1.91, + "learning_rate": 1.3941204070409814e-05, + "loss": 0.0045, + "step": 378000 + }, + { + "epoch": 1.91, + "eval_cer": 0.9144217360968921, + "eval_loss": 0.004249492194503546, + "eval_runtime": 116.3497, + "eval_samples_per_second": 17.19, + "eval_steps_per_second": 4.297, + "step": 378000 + }, + { + "epoch": 1.91, + "learning_rate": 1.3933636377395804e-05, + "loss": 0.0053, + "step": 378010 + }, + { + "epoch": 1.91, + "learning_rate": 1.3926068684381794e-05, + "loss": 0.0053, + "step": 378020 + }, + { + "epoch": 1.91, + "learning_rate": 1.3918500991367784e-05, + "loss": 0.0052, + "step": 378030 + }, + { + "epoch": 1.91, + "learning_rate": 1.3910933298353774e-05, + "loss": 0.0063, + "step": 378040 + }, + { + "epoch": 1.91, + "learning_rate": 1.3903365605339762e-05, + "loss": 0.0061, + "step": 378050 + }, + { + "epoch": 1.91, + "learning_rate": 1.3895797912325752e-05, + "loss": 0.0051, + "step": 378060 + }, + { + "epoch": 1.91, + "learning_rate": 1.3888230219311742e-05, + "loss": 0.0091, + "step": 378070 + }, + { + "epoch": 1.91, + "learning_rate": 1.3880662526297732e-05, + "loss": 0.0054, + "step": 378080 + }, + { + "epoch": 1.91, + "learning_rate": 1.3873094833283722e-05, + "loss": 0.0048, + "step": 378090 + }, + { + "epoch": 1.91, + "learning_rate": 1.3865527140269712e-05, + "loss": 0.005, + "step": 378100 + }, + { + "epoch": 1.91, + "learning_rate": 1.3857959447255702e-05, + "loss": 0.007, + "step": 378110 + }, + { + "epoch": 1.91, + "learning_rate": 1.3850391754241691e-05, + "loss": 0.0059, + "step": 378120 + }, + { + "epoch": 1.91, + "learning_rate": 1.384282406122768e-05, + "loss": 0.0046, + "step": 378130 + }, + { + "epoch": 1.91, + "learning_rate": 1.383525636821367e-05, + "loss": 0.0055, + "step": 378140 + }, + { + "epoch": 1.91, + "learning_rate": 1.382768867519966e-05, + "loss": 0.0052, + "step": 378150 + }, + { + "epoch": 1.91, + "learning_rate": 1.382012098218565e-05, + "loss": 0.0064, + "step": 378160 + }, + { + "epoch": 1.91, + "learning_rate": 1.381255328917164e-05, + "loss": 0.0058, + "step": 378170 + }, + { + "epoch": 1.91, + "learning_rate": 1.380498559615763e-05, + "loss": 0.0061, + "step": 378180 + }, + { + "epoch": 1.91, + "learning_rate": 1.379741790314362e-05, + "loss": 0.0079, + "step": 378190 + }, + { + "epoch": 1.91, + "learning_rate": 1.3789850210129609e-05, + "loss": 0.0046, + "step": 378200 + }, + { + "epoch": 1.91, + "learning_rate": 1.3782282517115597e-05, + "loss": 0.0043, + "step": 378210 + }, + { + "epoch": 1.91, + "learning_rate": 1.3774714824101587e-05, + "loss": 0.0049, + "step": 378220 + }, + { + "epoch": 1.91, + "learning_rate": 1.3767147131087577e-05, + "loss": 0.0052, + "step": 378230 + }, + { + "epoch": 1.91, + "learning_rate": 1.3759579438073567e-05, + "loss": 0.0072, + "step": 378240 + }, + { + "epoch": 1.91, + "learning_rate": 1.3752011745059557e-05, + "loss": 0.0067, + "step": 378250 + }, + { + "epoch": 1.91, + "learning_rate": 1.3744444052045547e-05, + "loss": 0.0071, + "step": 378260 + }, + { + "epoch": 1.91, + "learning_rate": 1.3736876359031537e-05, + "loss": 0.0061, + "step": 378270 + }, + { + "epoch": 1.91, + "learning_rate": 1.3729308666017527e-05, + "loss": 0.0069, + "step": 378280 + }, + { + "epoch": 1.91, + "learning_rate": 1.3721740973003515e-05, + "loss": 0.0057, + "step": 378290 + }, + { + "epoch": 1.91, + "learning_rate": 1.3714173279989505e-05, + "loss": 0.0077, + "step": 378300 + }, + { + "epoch": 1.91, + "learning_rate": 1.3706605586975495e-05, + "loss": 0.0059, + "step": 378310 + }, + { + "epoch": 1.91, + "learning_rate": 1.3699037893961485e-05, + "loss": 0.0059, + "step": 378320 + }, + { + "epoch": 1.91, + "learning_rate": 1.3691470200947475e-05, + "loss": 0.0078, + "step": 378330 + }, + { + "epoch": 1.91, + "learning_rate": 1.3683902507933464e-05, + "loss": 0.0047, + "step": 378340 + }, + { + "epoch": 1.91, + "learning_rate": 1.3676334814919454e-05, + "loss": 0.0055, + "step": 378350 + }, + { + "epoch": 1.91, + "learning_rate": 1.3668767121905444e-05, + "loss": 0.005, + "step": 378360 + }, + { + "epoch": 1.91, + "learning_rate": 1.3661199428891433e-05, + "loss": 0.0049, + "step": 378370 + }, + { + "epoch": 1.91, + "learning_rate": 1.3653631735877422e-05, + "loss": 0.0061, + "step": 378380 + }, + { + "epoch": 1.91, + "learning_rate": 1.3646064042863412e-05, + "loss": 0.0061, + "step": 378390 + }, + { + "epoch": 1.91, + "learning_rate": 1.3638496349849402e-05, + "loss": 0.0057, + "step": 378400 + }, + { + "epoch": 1.91, + "learning_rate": 1.3630928656835392e-05, + "loss": 0.0059, + "step": 378410 + }, + { + "epoch": 1.91, + "learning_rate": 1.3623360963821382e-05, + "loss": 0.0053, + "step": 378420 + }, + { + "epoch": 1.91, + "learning_rate": 1.3615793270807372e-05, + "loss": 0.0063, + "step": 378430 + }, + { + "epoch": 1.91, + "learning_rate": 1.3608225577793362e-05, + "loss": 0.0048, + "step": 378440 + }, + { + "epoch": 1.91, + "learning_rate": 1.360065788477935e-05, + "loss": 0.0064, + "step": 378450 + }, + { + "epoch": 1.91, + "learning_rate": 1.359309019176534e-05, + "loss": 0.0049, + "step": 378460 + }, + { + "epoch": 1.91, + "learning_rate": 1.358552249875133e-05, + "loss": 0.0037, + "step": 378470 + }, + { + "epoch": 1.91, + "learning_rate": 1.357795480573732e-05, + "loss": 0.0048, + "step": 378480 + }, + { + "epoch": 1.91, + "learning_rate": 1.357038711272331e-05, + "loss": 0.007, + "step": 378490 + }, + { + "epoch": 1.91, + "learning_rate": 1.35628194197093e-05, + "loss": 0.0067, + "step": 378500 + }, + { + "epoch": 1.91, + "learning_rate": 1.355525172669529e-05, + "loss": 0.0047, + "step": 378510 + }, + { + "epoch": 1.91, + "learning_rate": 1.3547684033681276e-05, + "loss": 0.0065, + "step": 378520 + }, + { + "epoch": 1.91, + "learning_rate": 1.3540116340667266e-05, + "loss": 0.0059, + "step": 378530 + }, + { + "epoch": 1.91, + "learning_rate": 1.3532548647653256e-05, + "loss": 0.007, + "step": 378540 + }, + { + "epoch": 1.91, + "learning_rate": 1.3524980954639246e-05, + "loss": 0.0063, + "step": 378550 + }, + { + "epoch": 1.91, + "learning_rate": 1.3517413261625236e-05, + "loss": 0.0044, + "step": 378560 + }, + { + "epoch": 1.91, + "learning_rate": 1.3509845568611227e-05, + "loss": 0.006, + "step": 378570 + }, + { + "epoch": 1.91, + "learning_rate": 1.3502277875597217e-05, + "loss": 0.0049, + "step": 378580 + }, + { + "epoch": 1.91, + "learning_rate": 1.3494710182583207e-05, + "loss": 0.0052, + "step": 378590 + }, + { + "epoch": 1.91, + "learning_rate": 1.3487142489569194e-05, + "loss": 0.005, + "step": 378600 + }, + { + "epoch": 1.91, + "learning_rate": 1.3479574796555184e-05, + "loss": 0.0071, + "step": 378610 + }, + { + "epoch": 1.91, + "learning_rate": 1.3472007103541174e-05, + "loss": 0.0054, + "step": 378620 + }, + { + "epoch": 1.91, + "learning_rate": 1.3464439410527163e-05, + "loss": 0.0055, + "step": 378630 + }, + { + "epoch": 1.91, + "learning_rate": 1.3456871717513153e-05, + "loss": 0.0052, + "step": 378640 + }, + { + "epoch": 1.91, + "learning_rate": 1.3449304024499143e-05, + "loss": 0.0061, + "step": 378650 + }, + { + "epoch": 1.91, + "learning_rate": 1.3441736331485133e-05, + "loss": 0.0063, + "step": 378660 + }, + { + "epoch": 1.91, + "learning_rate": 1.3434168638471123e-05, + "loss": 0.0047, + "step": 378670 + }, + { + "epoch": 1.91, + "learning_rate": 1.3426600945457111e-05, + "loss": 0.0047, + "step": 378680 + }, + { + "epoch": 1.91, + "learning_rate": 1.3419033252443101e-05, + "loss": 0.008, + "step": 378690 + }, + { + "epoch": 1.91, + "learning_rate": 1.3411465559429091e-05, + "loss": 0.0057, + "step": 378700 + }, + { + "epoch": 1.91, + "learning_rate": 1.3403897866415081e-05, + "loss": 0.0062, + "step": 378710 + }, + { + "epoch": 1.91, + "learning_rate": 1.3396330173401071e-05, + "loss": 0.0079, + "step": 378720 + }, + { + "epoch": 1.91, + "learning_rate": 1.3388762480387061e-05, + "loss": 0.0066, + "step": 378730 + }, + { + "epoch": 1.91, + "learning_rate": 1.338119478737305e-05, + "loss": 0.0059, + "step": 378740 + }, + { + "epoch": 1.91, + "learning_rate": 1.337362709435904e-05, + "loss": 0.0065, + "step": 378750 + }, + { + "epoch": 1.91, + "learning_rate": 1.3366059401345029e-05, + "loss": 0.0071, + "step": 378760 + }, + { + "epoch": 1.91, + "learning_rate": 1.3358491708331019e-05, + "loss": 0.0051, + "step": 378770 + }, + { + "epoch": 1.91, + "learning_rate": 1.3350924015317009e-05, + "loss": 0.0043, + "step": 378780 + }, + { + "epoch": 1.91, + "learning_rate": 1.3343356322302999e-05, + "loss": 0.0058, + "step": 378790 + }, + { + "epoch": 1.91, + "learning_rate": 1.3335788629288989e-05, + "loss": 0.0055, + "step": 378800 + }, + { + "epoch": 1.91, + "learning_rate": 1.3328220936274979e-05, + "loss": 0.0047, + "step": 378810 + }, + { + "epoch": 1.91, + "learning_rate": 1.3320653243260968e-05, + "loss": 0.0063, + "step": 378820 + }, + { + "epoch": 1.91, + "learning_rate": 1.3313085550246958e-05, + "loss": 0.0051, + "step": 378830 + }, + { + "epoch": 1.91, + "learning_rate": 1.3305517857232947e-05, + "loss": 0.0048, + "step": 378840 + }, + { + "epoch": 1.91, + "learning_rate": 1.3297950164218936e-05, + "loss": 0.0058, + "step": 378850 + }, + { + "epoch": 1.91, + "learning_rate": 1.3290382471204926e-05, + "loss": 0.0037, + "step": 378860 + }, + { + "epoch": 1.91, + "learning_rate": 1.3282814778190916e-05, + "loss": 0.0055, + "step": 378870 + }, + { + "epoch": 1.91, + "learning_rate": 1.3275247085176906e-05, + "loss": 0.0085, + "step": 378880 + }, + { + "epoch": 1.91, + "learning_rate": 1.3267679392162896e-05, + "loss": 0.0065, + "step": 378890 + }, + { + "epoch": 1.91, + "learning_rate": 1.3260111699148886e-05, + "loss": 0.0074, + "step": 378900 + }, + { + "epoch": 1.91, + "learning_rate": 1.3252544006134876e-05, + "loss": 0.0061, + "step": 378910 + }, + { + "epoch": 1.91, + "learning_rate": 1.3244976313120864e-05, + "loss": 0.007, + "step": 378920 + }, + { + "epoch": 1.91, + "learning_rate": 1.3237408620106854e-05, + "loss": 0.0044, + "step": 378930 + }, + { + "epoch": 1.91, + "learning_rate": 1.3229840927092844e-05, + "loss": 0.0045, + "step": 378940 + }, + { + "epoch": 1.91, + "learning_rate": 1.3222273234078834e-05, + "loss": 0.0047, + "step": 378950 + }, + { + "epoch": 1.91, + "learning_rate": 1.3214705541064824e-05, + "loss": 0.0068, + "step": 378960 + }, + { + "epoch": 1.91, + "learning_rate": 1.3207137848050814e-05, + "loss": 0.005, + "step": 378970 + }, + { + "epoch": 1.91, + "learning_rate": 1.3199570155036804e-05, + "loss": 0.0047, + "step": 378980 + }, + { + "epoch": 1.91, + "learning_rate": 1.3192002462022794e-05, + "loss": 0.0045, + "step": 378990 + }, + { + "epoch": 1.91, + "learning_rate": 1.3184434769008782e-05, + "loss": 0.0051, + "step": 379000 + }, + { + "epoch": 1.91, + "eval_cer": 0.9144149433240143, + "eval_loss": 0.00423853425309062, + "eval_runtime": 116.3136, + "eval_samples_per_second": 17.195, + "eval_steps_per_second": 4.299, + "step": 379000 + }, + { + "epoch": 1.91, + "learning_rate": 1.3176867075994772e-05, + "loss": 0.0044, + "step": 379010 + }, + { + "epoch": 1.91, + "learning_rate": 1.3169299382980762e-05, + "loss": 0.0048, + "step": 379020 + }, + { + "epoch": 1.91, + "learning_rate": 1.3161731689966752e-05, + "loss": 0.0064, + "step": 379030 + }, + { + "epoch": 1.91, + "learning_rate": 1.3154163996952741e-05, + "loss": 0.0069, + "step": 379040 + }, + { + "epoch": 1.91, + "learning_rate": 1.3146596303938731e-05, + "loss": 0.0046, + "step": 379050 + }, + { + "epoch": 1.91, + "learning_rate": 1.3139028610924721e-05, + "loss": 0.0054, + "step": 379060 + }, + { + "epoch": 1.91, + "learning_rate": 1.313146091791071e-05, + "loss": 0.0038, + "step": 379070 + }, + { + "epoch": 1.91, + "learning_rate": 1.31238932248967e-05, + "loss": 0.0042, + "step": 379080 + }, + { + "epoch": 1.91, + "learning_rate": 1.311632553188269e-05, + "loss": 0.0056, + "step": 379090 + }, + { + "epoch": 1.91, + "learning_rate": 1.310875783886868e-05, + "loss": 0.0079, + "step": 379100 + }, + { + "epoch": 1.91, + "learning_rate": 1.3101190145854669e-05, + "loss": 0.0066, + "step": 379110 + }, + { + "epoch": 1.91, + "learning_rate": 1.3093622452840659e-05, + "loss": 0.0059, + "step": 379120 + }, + { + "epoch": 1.91, + "learning_rate": 1.3086054759826649e-05, + "loss": 0.0054, + "step": 379130 + }, + { + "epoch": 1.91, + "learning_rate": 1.3078487066812639e-05, + "loss": 0.0039, + "step": 379140 + }, + { + "epoch": 1.91, + "learning_rate": 1.3070919373798627e-05, + "loss": 0.0061, + "step": 379150 + }, + { + "epoch": 1.91, + "learning_rate": 1.3063351680784617e-05, + "loss": 0.0048, + "step": 379160 + }, + { + "epoch": 1.91, + "learning_rate": 1.3055783987770607e-05, + "loss": 0.0057, + "step": 379170 + }, + { + "epoch": 1.91, + "learning_rate": 1.3048216294756597e-05, + "loss": 0.0061, + "step": 379180 + }, + { + "epoch": 1.91, + "learning_rate": 1.3040648601742587e-05, + "loss": 0.0043, + "step": 379190 + }, + { + "epoch": 1.91, + "learning_rate": 1.3033080908728577e-05, + "loss": 0.0042, + "step": 379200 + }, + { + "epoch": 1.91, + "learning_rate": 1.3025513215714567e-05, + "loss": 0.0041, + "step": 379210 + }, + { + "epoch": 1.91, + "learning_rate": 1.3017945522700556e-05, + "loss": 0.0074, + "step": 379220 + }, + { + "epoch": 1.91, + "learning_rate": 1.3010377829686545e-05, + "loss": 0.0056, + "step": 379230 + }, + { + "epoch": 1.91, + "learning_rate": 1.3002810136672535e-05, + "loss": 0.0048, + "step": 379240 + }, + { + "epoch": 1.91, + "learning_rate": 1.2995242443658525e-05, + "loss": 0.0044, + "step": 379250 + }, + { + "epoch": 1.91, + "learning_rate": 1.2987674750644514e-05, + "loss": 0.0051, + "step": 379260 + }, + { + "epoch": 1.91, + "learning_rate": 1.2980107057630504e-05, + "loss": 0.0061, + "step": 379270 + }, + { + "epoch": 1.91, + "learning_rate": 1.2972539364616494e-05, + "loss": 0.0045, + "step": 379280 + }, + { + "epoch": 1.91, + "learning_rate": 1.2964971671602484e-05, + "loss": 0.0048, + "step": 379290 + }, + { + "epoch": 1.91, + "learning_rate": 1.2957403978588474e-05, + "loss": 0.0051, + "step": 379300 + }, + { + "epoch": 1.91, + "learning_rate": 1.2949836285574462e-05, + "loss": 0.0049, + "step": 379310 + }, + { + "epoch": 1.91, + "learning_rate": 1.2942268592560452e-05, + "loss": 0.0056, + "step": 379320 + }, + { + "epoch": 1.91, + "learning_rate": 1.2934700899546442e-05, + "loss": 0.0067, + "step": 379330 + }, + { + "epoch": 1.91, + "learning_rate": 1.2927133206532432e-05, + "loss": 0.0064, + "step": 379340 + }, + { + "epoch": 1.91, + "learning_rate": 1.2919565513518422e-05, + "loss": 0.0048, + "step": 379350 + }, + { + "epoch": 1.91, + "learning_rate": 1.2911997820504412e-05, + "loss": 0.0061, + "step": 379360 + }, + { + "epoch": 1.91, + "learning_rate": 1.2904430127490402e-05, + "loss": 0.0046, + "step": 379370 + }, + { + "epoch": 1.91, + "learning_rate": 1.2896862434476392e-05, + "loss": 0.0062, + "step": 379380 + }, + { + "epoch": 1.91, + "learning_rate": 1.2889294741462378e-05, + "loss": 0.0053, + "step": 379390 + }, + { + "epoch": 1.91, + "learning_rate": 1.2881727048448368e-05, + "loss": 0.0068, + "step": 379400 + }, + { + "epoch": 1.91, + "learning_rate": 1.287415935543436e-05, + "loss": 0.008, + "step": 379410 + }, + { + "epoch": 1.91, + "learning_rate": 1.286659166242035e-05, + "loss": 0.0054, + "step": 379420 + }, + { + "epoch": 1.91, + "learning_rate": 1.285902396940634e-05, + "loss": 0.0045, + "step": 379430 + }, + { + "epoch": 1.91, + "learning_rate": 1.285145627639233e-05, + "loss": 0.0052, + "step": 379440 + }, + { + "epoch": 1.91, + "learning_rate": 1.284388858337832e-05, + "loss": 0.0047, + "step": 379450 + }, + { + "epoch": 1.91, + "learning_rate": 1.283632089036431e-05, + "loss": 0.0058, + "step": 379460 + }, + { + "epoch": 1.91, + "learning_rate": 1.2828753197350296e-05, + "loss": 0.0049, + "step": 379470 + }, + { + "epoch": 1.91, + "learning_rate": 1.2821185504336286e-05, + "loss": 0.0052, + "step": 379480 + }, + { + "epoch": 1.91, + "learning_rate": 1.2813617811322276e-05, + "loss": 0.0056, + "step": 379490 + }, + { + "epoch": 1.91, + "learning_rate": 1.2806050118308266e-05, + "loss": 0.0062, + "step": 379500 + }, + { + "epoch": 1.91, + "learning_rate": 1.2798482425294255e-05, + "loss": 0.0061, + "step": 379510 + }, + { + "epoch": 1.91, + "learning_rate": 1.2790914732280245e-05, + "loss": 0.0061, + "step": 379520 + }, + { + "epoch": 1.91, + "learning_rate": 1.2783347039266235e-05, + "loss": 0.005, + "step": 379530 + }, + { + "epoch": 1.91, + "learning_rate": 1.2775779346252227e-05, + "loss": 0.0083, + "step": 379540 + }, + { + "epoch": 1.91, + "learning_rate": 1.2768211653238213e-05, + "loss": 0.0064, + "step": 379550 + }, + { + "epoch": 1.91, + "learning_rate": 1.2760643960224203e-05, + "loss": 0.0057, + "step": 379560 + }, + { + "epoch": 1.91, + "learning_rate": 1.2753076267210193e-05, + "loss": 0.0053, + "step": 379570 + }, + { + "epoch": 1.92, + "learning_rate": 1.2745508574196183e-05, + "loss": 0.0066, + "step": 379580 + }, + { + "epoch": 1.92, + "learning_rate": 1.2737940881182173e-05, + "loss": 0.0065, + "step": 379590 + }, + { + "epoch": 1.92, + "learning_rate": 1.2730373188168163e-05, + "loss": 0.0053, + "step": 379600 + }, + { + "epoch": 1.92, + "learning_rate": 1.2722805495154153e-05, + "loss": 0.0049, + "step": 379610 + }, + { + "epoch": 1.92, + "learning_rate": 1.2715237802140141e-05, + "loss": 0.0047, + "step": 379620 + }, + { + "epoch": 1.92, + "learning_rate": 1.2707670109126131e-05, + "loss": 0.0066, + "step": 379630 + }, + { + "epoch": 1.92, + "learning_rate": 1.2700102416112121e-05, + "loss": 0.0059, + "step": 379640 + }, + { + "epoch": 1.92, + "learning_rate": 1.2692534723098111e-05, + "loss": 0.0046, + "step": 379650 + }, + { + "epoch": 1.92, + "learning_rate": 1.26849670300841e-05, + "loss": 0.004, + "step": 379660 + }, + { + "epoch": 1.92, + "learning_rate": 1.267739933707009e-05, + "loss": 0.0048, + "step": 379670 + }, + { + "epoch": 1.92, + "learning_rate": 1.266983164405608e-05, + "loss": 0.0051, + "step": 379680 + }, + { + "epoch": 1.92, + "learning_rate": 1.266226395104207e-05, + "loss": 0.0054, + "step": 379690 + }, + { + "epoch": 1.92, + "learning_rate": 1.2654696258028059e-05, + "loss": 0.0077, + "step": 379700 + }, + { + "epoch": 1.92, + "learning_rate": 1.2647128565014049e-05, + "loss": 0.0076, + "step": 379710 + }, + { + "epoch": 1.92, + "learning_rate": 1.2639560872000039e-05, + "loss": 0.0045, + "step": 379720 + }, + { + "epoch": 1.92, + "learning_rate": 1.2631993178986028e-05, + "loss": 0.0058, + "step": 379730 + }, + { + "epoch": 1.92, + "learning_rate": 1.2624425485972018e-05, + "loss": 0.006, + "step": 379740 + }, + { + "epoch": 1.92, + "learning_rate": 1.2616857792958008e-05, + "loss": 0.0077, + "step": 379750 + }, + { + "epoch": 1.92, + "learning_rate": 1.2609290099943998e-05, + "loss": 0.0067, + "step": 379760 + }, + { + "epoch": 1.92, + "learning_rate": 1.2601722406929988e-05, + "loss": 0.0066, + "step": 379770 + }, + { + "epoch": 1.92, + "learning_rate": 1.2594154713915976e-05, + "loss": 0.0063, + "step": 379780 + }, + { + "epoch": 1.92, + "learning_rate": 1.2586587020901966e-05, + "loss": 0.0049, + "step": 379790 + }, + { + "epoch": 1.92, + "learning_rate": 1.2579019327887956e-05, + "loss": 0.0064, + "step": 379800 + }, + { + "epoch": 1.92, + "learning_rate": 1.2571451634873946e-05, + "loss": 0.0052, + "step": 379810 + }, + { + "epoch": 1.92, + "learning_rate": 1.2563883941859936e-05, + "loss": 0.0072, + "step": 379820 + }, + { + "epoch": 1.92, + "learning_rate": 1.2556316248845926e-05, + "loss": 0.0061, + "step": 379830 + }, + { + "epoch": 1.92, + "learning_rate": 1.2548748555831916e-05, + "loss": 0.0057, + "step": 379840 + }, + { + "epoch": 1.92, + "learning_rate": 1.2541180862817906e-05, + "loss": 0.0062, + "step": 379850 + }, + { + "epoch": 1.92, + "learning_rate": 1.2533613169803894e-05, + "loss": 0.0075, + "step": 379860 + }, + { + "epoch": 1.92, + "learning_rate": 1.2526045476789884e-05, + "loss": 0.0047, + "step": 379870 + }, + { + "epoch": 1.92, + "learning_rate": 1.2518477783775874e-05, + "loss": 0.0049, + "step": 379880 + }, + { + "epoch": 1.92, + "learning_rate": 1.2510910090761864e-05, + "loss": 0.0059, + "step": 379890 + }, + { + "epoch": 1.92, + "learning_rate": 1.2503342397747854e-05, + "loss": 0.0085, + "step": 379900 + }, + { + "epoch": 1.92, + "learning_rate": 1.2495774704733844e-05, + "loss": 0.0054, + "step": 379910 + }, + { + "epoch": 1.92, + "learning_rate": 1.2488207011719833e-05, + "loss": 0.0053, + "step": 379920 + }, + { + "epoch": 1.92, + "learning_rate": 1.2480639318705823e-05, + "loss": 0.0058, + "step": 379930 + }, + { + "epoch": 1.92, + "learning_rate": 1.2473071625691812e-05, + "loss": 0.0087, + "step": 379940 + }, + { + "epoch": 1.92, + "learning_rate": 1.2465503932677801e-05, + "loss": 0.0052, + "step": 379950 + }, + { + "epoch": 1.92, + "learning_rate": 1.2457936239663791e-05, + "loss": 0.0074, + "step": 379960 + }, + { + "epoch": 1.92, + "learning_rate": 1.2450368546649781e-05, + "loss": 0.0063, + "step": 379970 + }, + { + "epoch": 1.92, + "learning_rate": 1.2442800853635771e-05, + "loss": 0.0072, + "step": 379980 + }, + { + "epoch": 1.92, + "learning_rate": 1.2435233160621761e-05, + "loss": 0.0043, + "step": 379990 + }, + { + "epoch": 1.92, + "learning_rate": 1.2427665467607751e-05, + "loss": 0.0057, + "step": 380000 + }, + { + "epoch": 1.92, + "eval_cer": 0.9144217360968921, + "eval_loss": 0.004196519032120705, + "eval_runtime": 116.3652, + "eval_samples_per_second": 17.187, + "eval_steps_per_second": 4.297, + "step": 380000 + }, + { + "epoch": 1.92, + "learning_rate": 1.2420097774593741e-05, + "loss": 0.0058, + "step": 380010 + }, + { + "epoch": 1.92, + "learning_rate": 1.241253008157973e-05, + "loss": 0.0044, + "step": 380020 + }, + { + "epoch": 1.92, + "learning_rate": 1.2404962388565719e-05, + "loss": 0.0079, + "step": 380030 + }, + { + "epoch": 1.92, + "learning_rate": 1.2397394695551709e-05, + "loss": 0.0054, + "step": 380040 + }, + { + "epoch": 1.92, + "learning_rate": 1.2389827002537699e-05, + "loss": 0.0058, + "step": 380050 + }, + { + "epoch": 1.92, + "learning_rate": 1.2382259309523689e-05, + "loss": 0.0062, + "step": 380060 + }, + { + "epoch": 1.92, + "learning_rate": 1.2374691616509679e-05, + "loss": 0.0038, + "step": 380070 + }, + { + "epoch": 1.92, + "learning_rate": 1.2367123923495669e-05, + "loss": 0.0052, + "step": 380080 + }, + { + "epoch": 1.92, + "learning_rate": 1.2359556230481659e-05, + "loss": 0.0056, + "step": 380090 + }, + { + "epoch": 1.92, + "learning_rate": 1.2351988537467647e-05, + "loss": 0.006, + "step": 380100 + }, + { + "epoch": 1.92, + "learning_rate": 1.2344420844453637e-05, + "loss": 0.006, + "step": 380110 + }, + { + "epoch": 1.92, + "learning_rate": 1.2336853151439627e-05, + "loss": 0.0061, + "step": 380120 + }, + { + "epoch": 1.92, + "learning_rate": 1.2329285458425617e-05, + "loss": 0.0059, + "step": 380130 + }, + { + "epoch": 1.92, + "learning_rate": 1.2321717765411606e-05, + "loss": 0.0051, + "step": 380140 + }, + { + "epoch": 1.92, + "learning_rate": 1.2314150072397596e-05, + "loss": 0.0056, + "step": 380150 + }, + { + "epoch": 1.92, + "learning_rate": 1.2306582379383586e-05, + "loss": 0.0065, + "step": 380160 + }, + { + "epoch": 1.92, + "learning_rate": 1.2299014686369574e-05, + "loss": 0.005, + "step": 380170 + }, + { + "epoch": 1.92, + "learning_rate": 1.2291446993355564e-05, + "loss": 0.007, + "step": 380180 + }, + { + "epoch": 1.92, + "learning_rate": 1.2283879300341554e-05, + "loss": 0.0051, + "step": 380190 + }, + { + "epoch": 1.92, + "learning_rate": 1.2276311607327544e-05, + "loss": 0.0032, + "step": 380200 + }, + { + "epoch": 1.92, + "learning_rate": 1.2268743914313534e-05, + "loss": 0.0054, + "step": 380210 + }, + { + "epoch": 1.92, + "learning_rate": 1.2261176221299524e-05, + "loss": 0.0054, + "step": 380220 + }, + { + "epoch": 1.92, + "learning_rate": 1.2253608528285514e-05, + "loss": 0.0063, + "step": 380230 + }, + { + "epoch": 1.92, + "learning_rate": 1.2246040835271504e-05, + "loss": 0.0052, + "step": 380240 + }, + { + "epoch": 1.92, + "learning_rate": 1.223847314225749e-05, + "loss": 0.0054, + "step": 380250 + }, + { + "epoch": 1.92, + "learning_rate": 1.2230905449243482e-05, + "loss": 0.0061, + "step": 380260 + }, + { + "epoch": 1.92, + "learning_rate": 1.2223337756229472e-05, + "loss": 0.0068, + "step": 380270 + }, + { + "epoch": 1.92, + "learning_rate": 1.2215770063215462e-05, + "loss": 0.0058, + "step": 380280 + }, + { + "epoch": 1.92, + "learning_rate": 1.2208202370201452e-05, + "loss": 0.0066, + "step": 380290 + }, + { + "epoch": 1.92, + "learning_rate": 1.2200634677187442e-05, + "loss": 0.0049, + "step": 380300 + }, + { + "epoch": 1.92, + "learning_rate": 1.2193066984173432e-05, + "loss": 0.0045, + "step": 380310 + }, + { + "epoch": 1.92, + "learning_rate": 1.2185499291159421e-05, + "loss": 0.0056, + "step": 380320 + }, + { + "epoch": 1.92, + "learning_rate": 1.2177931598145408e-05, + "loss": 0.0054, + "step": 380330 + }, + { + "epoch": 1.92, + "learning_rate": 1.2170363905131398e-05, + "loss": 0.0053, + "step": 380340 + }, + { + "epoch": 1.92, + "learning_rate": 1.2162796212117388e-05, + "loss": 0.0082, + "step": 380350 + }, + { + "epoch": 1.92, + "learning_rate": 1.2155228519103378e-05, + "loss": 0.0056, + "step": 380360 + }, + { + "epoch": 1.92, + "learning_rate": 1.2147660826089368e-05, + "loss": 0.0053, + "step": 380370 + }, + { + "epoch": 1.92, + "learning_rate": 1.214009313307536e-05, + "loss": 0.0053, + "step": 380380 + }, + { + "epoch": 1.92, + "learning_rate": 1.213252544006135e-05, + "loss": 0.0072, + "step": 380390 + }, + { + "epoch": 1.92, + "learning_rate": 1.2124957747047339e-05, + "loss": 0.0092, + "step": 380400 + }, + { + "epoch": 1.92, + "learning_rate": 1.2117390054033326e-05, + "loss": 0.0049, + "step": 380410 + }, + { + "epoch": 1.92, + "learning_rate": 1.2109822361019316e-05, + "loss": 0.0046, + "step": 380420 + }, + { + "epoch": 1.92, + "learning_rate": 1.2102254668005305e-05, + "loss": 0.0075, + "step": 380430 + }, + { + "epoch": 1.92, + "learning_rate": 1.2094686974991295e-05, + "loss": 0.0057, + "step": 380440 + }, + { + "epoch": 1.92, + "learning_rate": 1.2087119281977285e-05, + "loss": 0.0052, + "step": 380450 + }, + { + "epoch": 1.92, + "learning_rate": 1.2079551588963275e-05, + "loss": 0.0064, + "step": 380460 + }, + { + "epoch": 1.92, + "learning_rate": 1.2071983895949265e-05, + "loss": 0.0042, + "step": 380470 + }, + { + "epoch": 1.92, + "learning_rate": 1.2064416202935255e-05, + "loss": 0.0061, + "step": 380480 + }, + { + "epoch": 1.92, + "learning_rate": 1.2056848509921243e-05, + "loss": 0.0066, + "step": 380490 + }, + { + "epoch": 1.92, + "learning_rate": 1.2049280816907233e-05, + "loss": 0.0046, + "step": 380500 + }, + { + "epoch": 1.92, + "learning_rate": 1.2041713123893223e-05, + "loss": 0.005, + "step": 380510 + }, + { + "epoch": 1.92, + "learning_rate": 1.2034145430879213e-05, + "loss": 0.0042, + "step": 380520 + }, + { + "epoch": 1.92, + "learning_rate": 1.2026577737865203e-05, + "loss": 0.0079, + "step": 380530 + }, + { + "epoch": 1.92, + "learning_rate": 1.2019010044851193e-05, + "loss": 0.006, + "step": 380540 + }, + { + "epoch": 1.92, + "learning_rate": 1.2011442351837183e-05, + "loss": 0.0095, + "step": 380550 + }, + { + "epoch": 1.92, + "learning_rate": 1.2003874658823173e-05, + "loss": 0.0063, + "step": 380560 + }, + { + "epoch": 1.92, + "learning_rate": 1.199630696580916e-05, + "loss": 0.0052, + "step": 380570 + }, + { + "epoch": 1.92, + "learning_rate": 1.198873927279515e-05, + "loss": 0.0061, + "step": 380580 + }, + { + "epoch": 1.92, + "learning_rate": 1.198117157978114e-05, + "loss": 0.0056, + "step": 380590 + }, + { + "epoch": 1.92, + "learning_rate": 1.197360388676713e-05, + "loss": 0.0058, + "step": 380600 + }, + { + "epoch": 1.92, + "learning_rate": 1.196603619375312e-05, + "loss": 0.0042, + "step": 380610 + }, + { + "epoch": 1.92, + "learning_rate": 1.195846850073911e-05, + "loss": 0.0054, + "step": 380620 + }, + { + "epoch": 1.92, + "learning_rate": 1.19509008077251e-05, + "loss": 0.0061, + "step": 380630 + }, + { + "epoch": 1.92, + "learning_rate": 1.194333311471109e-05, + "loss": 0.006, + "step": 380640 + }, + { + "epoch": 1.92, + "learning_rate": 1.1935765421697078e-05, + "loss": 0.0057, + "step": 380650 + }, + { + "epoch": 1.92, + "learning_rate": 1.1928197728683068e-05, + "loss": 0.0068, + "step": 380660 + }, + { + "epoch": 1.92, + "learning_rate": 1.1920630035669058e-05, + "loss": 0.0045, + "step": 380670 + }, + { + "epoch": 1.92, + "learning_rate": 1.1913062342655048e-05, + "loss": 0.0055, + "step": 380680 + }, + { + "epoch": 1.92, + "learning_rate": 1.1905494649641038e-05, + "loss": 0.0044, + "step": 380690 + }, + { + "epoch": 1.92, + "learning_rate": 1.1897926956627028e-05, + "loss": 0.0054, + "step": 380700 + }, + { + "epoch": 1.92, + "learning_rate": 1.1890359263613018e-05, + "loss": 0.0052, + "step": 380710 + }, + { + "epoch": 1.92, + "learning_rate": 1.1882791570599006e-05, + "loss": 0.0057, + "step": 380720 + }, + { + "epoch": 1.92, + "learning_rate": 1.1875223877584996e-05, + "loss": 0.0068, + "step": 380730 + }, + { + "epoch": 1.92, + "learning_rate": 1.1867656184570986e-05, + "loss": 0.0059, + "step": 380740 + }, + { + "epoch": 1.92, + "learning_rate": 1.1860088491556976e-05, + "loss": 0.0046, + "step": 380750 + }, + { + "epoch": 1.92, + "learning_rate": 1.1852520798542966e-05, + "loss": 0.0063, + "step": 380760 + }, + { + "epoch": 1.92, + "learning_rate": 1.1844953105528956e-05, + "loss": 0.0049, + "step": 380770 + }, + { + "epoch": 1.92, + "learning_rate": 1.1837385412514946e-05, + "loss": 0.0052, + "step": 380780 + }, + { + "epoch": 1.92, + "learning_rate": 1.1829817719500936e-05, + "loss": 0.0032, + "step": 380790 + }, + { + "epoch": 1.92, + "learning_rate": 1.1822250026486924e-05, + "loss": 0.006, + "step": 380800 + }, + { + "epoch": 1.92, + "learning_rate": 1.1814682333472914e-05, + "loss": 0.0055, + "step": 380810 + }, + { + "epoch": 1.92, + "learning_rate": 1.1807114640458904e-05, + "loss": 0.0082, + "step": 380820 + }, + { + "epoch": 1.92, + "learning_rate": 1.1799546947444893e-05, + "loss": 0.0071, + "step": 380830 + }, + { + "epoch": 1.92, + "learning_rate": 1.1791979254430883e-05, + "loss": 0.0036, + "step": 380840 + }, + { + "epoch": 1.92, + "learning_rate": 1.1784411561416873e-05, + "loss": 0.0057, + "step": 380850 + }, + { + "epoch": 1.92, + "learning_rate": 1.1776843868402863e-05, + "loss": 0.0057, + "step": 380860 + }, + { + "epoch": 1.92, + "learning_rate": 1.1769276175388853e-05, + "loss": 0.0058, + "step": 380870 + }, + { + "epoch": 1.92, + "learning_rate": 1.1761708482374841e-05, + "loss": 0.004, + "step": 380880 + }, + { + "epoch": 1.92, + "learning_rate": 1.1754140789360831e-05, + "loss": 0.0049, + "step": 380890 + }, + { + "epoch": 1.92, + "learning_rate": 1.1746573096346821e-05, + "loss": 0.0047, + "step": 380900 + }, + { + "epoch": 1.92, + "learning_rate": 1.1739005403332811e-05, + "loss": 0.0053, + "step": 380910 + }, + { + "epoch": 1.92, + "learning_rate": 1.1731437710318801e-05, + "loss": 0.0043, + "step": 380920 + }, + { + "epoch": 1.92, + "learning_rate": 1.1723870017304791e-05, + "loss": 0.0056, + "step": 380930 + }, + { + "epoch": 1.92, + "learning_rate": 1.171630232429078e-05, + "loss": 0.0054, + "step": 380940 + }, + { + "epoch": 1.92, + "learning_rate": 1.170873463127677e-05, + "loss": 0.0059, + "step": 380950 + }, + { + "epoch": 1.92, + "learning_rate": 1.1701166938262759e-05, + "loss": 0.0054, + "step": 380960 + }, + { + "epoch": 1.92, + "learning_rate": 1.1693599245248749e-05, + "loss": 0.0045, + "step": 380970 + }, + { + "epoch": 1.92, + "learning_rate": 1.1686031552234739e-05, + "loss": 0.0052, + "step": 380980 + }, + { + "epoch": 1.92, + "learning_rate": 1.1678463859220729e-05, + "loss": 0.0086, + "step": 380990 + }, + { + "epoch": 1.92, + "learning_rate": 1.1670896166206719e-05, + "loss": 0.0066, + "step": 381000 + }, + { + "epoch": 1.92, + "eval_cer": 0.9144256176813937, + "eval_loss": 0.004235303029417992, + "eval_runtime": 116.578, + "eval_samples_per_second": 17.156, + "eval_steps_per_second": 4.289, + "step": 381000 + }, + { + "epoch": 1.92, + "learning_rate": 1.1663328473192709e-05, + "loss": 0.0058, + "step": 381010 + }, + { + "epoch": 1.92, + "learning_rate": 1.1655760780178698e-05, + "loss": 0.0065, + "step": 381020 + }, + { + "epoch": 1.92, + "learning_rate": 1.1648193087164688e-05, + "loss": 0.0102, + "step": 381030 + }, + { + "epoch": 1.92, + "learning_rate": 1.1640625394150677e-05, + "loss": 0.0047, + "step": 381040 + }, + { + "epoch": 1.92, + "learning_rate": 1.1633057701136666e-05, + "loss": 0.0055, + "step": 381050 + }, + { + "epoch": 1.92, + "learning_rate": 1.1625490008122656e-05, + "loss": 0.0044, + "step": 381060 + }, + { + "epoch": 1.92, + "learning_rate": 1.1617922315108646e-05, + "loss": 0.0046, + "step": 381070 + }, + { + "epoch": 1.92, + "learning_rate": 1.1610354622094636e-05, + "loss": 0.0051, + "step": 381080 + }, + { + "epoch": 1.92, + "learning_rate": 1.1602786929080626e-05, + "loss": 0.0061, + "step": 381090 + }, + { + "epoch": 1.92, + "learning_rate": 1.1595219236066616e-05, + "loss": 0.0056, + "step": 381100 + }, + { + "epoch": 1.92, + "learning_rate": 1.1587651543052606e-05, + "loss": 0.0068, + "step": 381110 + }, + { + "epoch": 1.92, + "learning_rate": 1.1580083850038594e-05, + "loss": 0.0079, + "step": 381120 + }, + { + "epoch": 1.92, + "learning_rate": 1.1572516157024584e-05, + "loss": 0.0066, + "step": 381130 + }, + { + "epoch": 1.92, + "learning_rate": 1.1564948464010574e-05, + "loss": 0.0048, + "step": 381140 + }, + { + "epoch": 1.92, + "learning_rate": 1.1557380770996564e-05, + "loss": 0.0063, + "step": 381150 + }, + { + "epoch": 1.92, + "learning_rate": 1.1549813077982554e-05, + "loss": 0.0066, + "step": 381160 + }, + { + "epoch": 1.92, + "learning_rate": 1.1542245384968544e-05, + "loss": 0.0069, + "step": 381170 + }, + { + "epoch": 1.92, + "learning_rate": 1.1534677691954534e-05, + "loss": 0.0074, + "step": 381180 + }, + { + "epoch": 1.92, + "learning_rate": 1.1527109998940524e-05, + "loss": 0.0068, + "step": 381190 + }, + { + "epoch": 1.92, + "learning_rate": 1.151954230592651e-05, + "loss": 0.0068, + "step": 381200 + }, + { + "epoch": 1.92, + "learning_rate": 1.15119746129125e-05, + "loss": 0.0046, + "step": 381210 + }, + { + "epoch": 1.92, + "learning_rate": 1.150440691989849e-05, + "loss": 0.0047, + "step": 381220 + }, + { + "epoch": 1.92, + "learning_rate": 1.1496839226884482e-05, + "loss": 0.004, + "step": 381230 + }, + { + "epoch": 1.92, + "learning_rate": 1.1489271533870471e-05, + "loss": 0.0055, + "step": 381240 + }, + { + "epoch": 1.92, + "learning_rate": 1.1481703840856461e-05, + "loss": 0.0061, + "step": 381250 + }, + { + "epoch": 1.92, + "learning_rate": 1.1474136147842451e-05, + "loss": 0.004, + "step": 381260 + }, + { + "epoch": 1.92, + "learning_rate": 1.1466568454828438e-05, + "loss": 0.0067, + "step": 381270 + }, + { + "epoch": 1.92, + "learning_rate": 1.1459000761814428e-05, + "loss": 0.0045, + "step": 381280 + }, + { + "epoch": 1.92, + "learning_rate": 1.1451433068800418e-05, + "loss": 0.0043, + "step": 381290 + }, + { + "epoch": 1.92, + "learning_rate": 1.1443865375786408e-05, + "loss": 0.0062, + "step": 381300 + }, + { + "epoch": 1.92, + "learning_rate": 1.1436297682772397e-05, + "loss": 0.0074, + "step": 381310 + }, + { + "epoch": 1.92, + "learning_rate": 1.1428729989758387e-05, + "loss": 0.0049, + "step": 381320 + }, + { + "epoch": 1.92, + "learning_rate": 1.1421162296744377e-05, + "loss": 0.0058, + "step": 381330 + }, + { + "epoch": 1.92, + "learning_rate": 1.1413594603730367e-05, + "loss": 0.0047, + "step": 381340 + }, + { + "epoch": 1.92, + "learning_rate": 1.1406026910716355e-05, + "loss": 0.0086, + "step": 381350 + }, + { + "epoch": 1.92, + "learning_rate": 1.1398459217702345e-05, + "loss": 0.005, + "step": 381360 + }, + { + "epoch": 1.92, + "learning_rate": 1.1390891524688335e-05, + "loss": 0.0063, + "step": 381370 + }, + { + "epoch": 1.92, + "learning_rate": 1.1383323831674325e-05, + "loss": 0.0046, + "step": 381380 + }, + { + "epoch": 1.92, + "learning_rate": 1.1375756138660315e-05, + "loss": 0.0048, + "step": 381390 + }, + { + "epoch": 1.92, + "learning_rate": 1.1368188445646305e-05, + "loss": 0.0072, + "step": 381400 + }, + { + "epoch": 1.92, + "learning_rate": 1.1360620752632295e-05, + "loss": 0.0079, + "step": 381410 + }, + { + "epoch": 1.92, + "learning_rate": 1.1353053059618285e-05, + "loss": 0.0064, + "step": 381420 + }, + { + "epoch": 1.92, + "learning_rate": 1.1345485366604273e-05, + "loss": 0.0069, + "step": 381430 + }, + { + "epoch": 1.92, + "learning_rate": 1.1337917673590263e-05, + "loss": 0.0054, + "step": 381440 + }, + { + "epoch": 1.92, + "learning_rate": 1.1330349980576253e-05, + "loss": 0.0058, + "step": 381450 + }, + { + "epoch": 1.92, + "learning_rate": 1.1322782287562243e-05, + "loss": 0.005, + "step": 381460 + }, + { + "epoch": 1.92, + "learning_rate": 1.1315214594548233e-05, + "loss": 0.0061, + "step": 381470 + }, + { + "epoch": 1.92, + "learning_rate": 1.1307646901534223e-05, + "loss": 0.0047, + "step": 381480 + }, + { + "epoch": 1.92, + "learning_rate": 1.1300079208520212e-05, + "loss": 0.0064, + "step": 381490 + }, + { + "epoch": 1.92, + "learning_rate": 1.1292511515506202e-05, + "loss": 0.0067, + "step": 381500 + }, + { + "epoch": 1.92, + "learning_rate": 1.128494382249219e-05, + "loss": 0.0059, + "step": 381510 + }, + { + "epoch": 1.92, + "learning_rate": 1.127737612947818e-05, + "loss": 0.0061, + "step": 381520 + }, + { + "epoch": 1.92, + "learning_rate": 1.126980843646417e-05, + "loss": 0.008, + "step": 381530 + }, + { + "epoch": 1.92, + "learning_rate": 1.126224074345016e-05, + "loss": 0.0051, + "step": 381540 + }, + { + "epoch": 1.92, + "learning_rate": 1.125467305043615e-05, + "loss": 0.0065, + "step": 381550 + }, + { + "epoch": 1.93, + "learning_rate": 1.124710535742214e-05, + "loss": 0.006, + "step": 381560 + }, + { + "epoch": 1.93, + "learning_rate": 1.123953766440813e-05, + "loss": 0.0067, + "step": 381570 + }, + { + "epoch": 1.93, + "learning_rate": 1.123196997139412e-05, + "loss": 0.0074, + "step": 381580 + }, + { + "epoch": 1.93, + "learning_rate": 1.1224402278380108e-05, + "loss": 0.0081, + "step": 381590 + }, + { + "epoch": 1.93, + "learning_rate": 1.1216834585366098e-05, + "loss": 0.0044, + "step": 381600 + }, + { + "epoch": 1.93, + "learning_rate": 1.1209266892352088e-05, + "loss": 0.0046, + "step": 381610 + }, + { + "epoch": 1.93, + "learning_rate": 1.1201699199338078e-05, + "loss": 0.005, + "step": 381620 + }, + { + "epoch": 1.93, + "learning_rate": 1.1194131506324068e-05, + "loss": 0.0068, + "step": 381630 + }, + { + "epoch": 1.93, + "learning_rate": 1.1186563813310058e-05, + "loss": 0.0054, + "step": 381640 + }, + { + "epoch": 1.93, + "learning_rate": 1.1178996120296048e-05, + "loss": 0.0058, + "step": 381650 + }, + { + "epoch": 1.93, + "learning_rate": 1.1171428427282038e-05, + "loss": 0.0062, + "step": 381660 + }, + { + "epoch": 1.93, + "learning_rate": 1.1163860734268026e-05, + "loss": 0.0052, + "step": 381670 + }, + { + "epoch": 1.93, + "learning_rate": 1.1156293041254016e-05, + "loss": 0.0046, + "step": 381680 + }, + { + "epoch": 1.93, + "learning_rate": 1.1148725348240006e-05, + "loss": 0.0052, + "step": 381690 + }, + { + "epoch": 1.93, + "learning_rate": 1.1141157655225996e-05, + "loss": 0.0079, + "step": 381700 + }, + { + "epoch": 1.93, + "learning_rate": 1.1133589962211985e-05, + "loss": 0.0053, + "step": 381710 + }, + { + "epoch": 1.93, + "learning_rate": 1.1126022269197975e-05, + "loss": 0.0056, + "step": 381720 + }, + { + "epoch": 1.93, + "learning_rate": 1.1118454576183965e-05, + "loss": 0.0057, + "step": 381730 + }, + { + "epoch": 1.93, + "learning_rate": 1.1110886883169954e-05, + "loss": 0.0048, + "step": 381740 + }, + { + "epoch": 1.93, + "learning_rate": 1.1103319190155943e-05, + "loss": 0.0042, + "step": 381750 + }, + { + "epoch": 1.93, + "learning_rate": 1.1095751497141933e-05, + "loss": 0.0058, + "step": 381760 + }, + { + "epoch": 1.93, + "learning_rate": 1.1088183804127923e-05, + "loss": 0.0059, + "step": 381770 + }, + { + "epoch": 1.93, + "learning_rate": 1.1080616111113913e-05, + "loss": 0.0073, + "step": 381780 + }, + { + "epoch": 1.93, + "learning_rate": 1.1073048418099903e-05, + "loss": 0.0073, + "step": 381790 + }, + { + "epoch": 1.93, + "learning_rate": 1.1065480725085893e-05, + "loss": 0.0043, + "step": 381800 + }, + { + "epoch": 1.93, + "learning_rate": 1.1057913032071883e-05, + "loss": 0.0096, + "step": 381810 + }, + { + "epoch": 1.93, + "learning_rate": 1.1050345339057871e-05, + "loss": 0.005, + "step": 381820 + }, + { + "epoch": 1.93, + "learning_rate": 1.1042777646043861e-05, + "loss": 0.0041, + "step": 381830 + }, + { + "epoch": 1.93, + "learning_rate": 1.1035209953029851e-05, + "loss": 0.0056, + "step": 381840 + }, + { + "epoch": 1.93, + "learning_rate": 1.1027642260015841e-05, + "loss": 0.0046, + "step": 381850 + }, + { + "epoch": 1.93, + "learning_rate": 1.102007456700183e-05, + "loss": 0.0044, + "step": 381860 + }, + { + "epoch": 1.93, + "learning_rate": 1.101250687398782e-05, + "loss": 0.0047, + "step": 381870 + }, + { + "epoch": 1.93, + "learning_rate": 1.100493918097381e-05, + "loss": 0.005, + "step": 381880 + }, + { + "epoch": 1.93, + "learning_rate": 1.09973714879598e-05, + "loss": 0.0059, + "step": 381890 + }, + { + "epoch": 1.93, + "learning_rate": 1.0989803794945789e-05, + "loss": 0.0068, + "step": 381900 + }, + { + "epoch": 1.93, + "learning_rate": 1.0982236101931779e-05, + "loss": 0.0049, + "step": 381910 + }, + { + "epoch": 1.93, + "learning_rate": 1.0974668408917769e-05, + "loss": 0.0044, + "step": 381920 + }, + { + "epoch": 1.93, + "learning_rate": 1.0967100715903758e-05, + "loss": 0.008, + "step": 381930 + }, + { + "epoch": 1.93, + "learning_rate": 1.0959533022889748e-05, + "loss": 0.0059, + "step": 381940 + }, + { + "epoch": 1.93, + "learning_rate": 1.0951965329875738e-05, + "loss": 0.0038, + "step": 381950 + }, + { + "epoch": 1.93, + "learning_rate": 1.0944397636861728e-05, + "loss": 0.0051, + "step": 381960 + }, + { + "epoch": 1.93, + "learning_rate": 1.0936829943847718e-05, + "loss": 0.0054, + "step": 381970 + }, + { + "epoch": 1.93, + "learning_rate": 1.0929262250833706e-05, + "loss": 0.0086, + "step": 381980 + }, + { + "epoch": 1.93, + "learning_rate": 1.0921694557819696e-05, + "loss": 0.0052, + "step": 381990 + }, + { + "epoch": 1.93, + "learning_rate": 1.0914126864805686e-05, + "loss": 0.0067, + "step": 382000 + }, + { + "epoch": 1.93, + "eval_cer": 0.9144032985705095, + "eval_loss": 0.004233332350850105, + "eval_runtime": 116.331, + "eval_samples_per_second": 17.192, + "eval_steps_per_second": 4.298, + "step": 382000 + }, + { + "epoch": 1.93, + "learning_rate": 1.0906559171791676e-05, + "loss": 0.0065, + "step": 382010 + }, + { + "epoch": 1.93, + "learning_rate": 1.0898991478777666e-05, + "loss": 0.0067, + "step": 382020 + }, + { + "epoch": 1.93, + "learning_rate": 1.0891423785763656e-05, + "loss": 0.0071, + "step": 382030 + }, + { + "epoch": 1.93, + "learning_rate": 1.0883856092749646e-05, + "loss": 0.0059, + "step": 382040 + }, + { + "epoch": 1.93, + "learning_rate": 1.0876288399735636e-05, + "loss": 0.0059, + "step": 382050 + }, + { + "epoch": 1.93, + "learning_rate": 1.0868720706721622e-05, + "loss": 0.0075, + "step": 382060 + }, + { + "epoch": 1.93, + "learning_rate": 1.0861153013707614e-05, + "loss": 0.0048, + "step": 382070 + }, + { + "epoch": 1.93, + "learning_rate": 1.0853585320693604e-05, + "loss": 0.0072, + "step": 382080 + }, + { + "epoch": 1.93, + "learning_rate": 1.0846017627679594e-05, + "loss": 0.0054, + "step": 382090 + }, + { + "epoch": 1.93, + "learning_rate": 1.0838449934665584e-05, + "loss": 0.006, + "step": 382100 + }, + { + "epoch": 1.93, + "learning_rate": 1.0830882241651574e-05, + "loss": 0.0085, + "step": 382110 + }, + { + "epoch": 1.93, + "learning_rate": 1.0823314548637563e-05, + "loss": 0.0055, + "step": 382120 + }, + { + "epoch": 1.93, + "learning_rate": 1.0815746855623553e-05, + "loss": 0.0041, + "step": 382130 + }, + { + "epoch": 1.93, + "learning_rate": 1.080817916260954e-05, + "loss": 0.0053, + "step": 382140 + }, + { + "epoch": 1.93, + "learning_rate": 1.080061146959553e-05, + "loss": 0.0035, + "step": 382150 + }, + { + "epoch": 1.93, + "learning_rate": 1.079304377658152e-05, + "loss": 0.0043, + "step": 382160 + }, + { + "epoch": 1.93, + "learning_rate": 1.078547608356751e-05, + "loss": 0.0066, + "step": 382170 + }, + { + "epoch": 1.93, + "learning_rate": 1.07779083905535e-05, + "loss": 0.0049, + "step": 382180 + }, + { + "epoch": 1.93, + "learning_rate": 1.077034069753949e-05, + "loss": 0.005, + "step": 382190 + }, + { + "epoch": 1.93, + "learning_rate": 1.0762773004525481e-05, + "loss": 0.0054, + "step": 382200 + }, + { + "epoch": 1.93, + "learning_rate": 1.0755205311511471e-05, + "loss": 0.0072, + "step": 382210 + }, + { + "epoch": 1.93, + "learning_rate": 1.0747637618497457e-05, + "loss": 0.0045, + "step": 382220 + }, + { + "epoch": 1.93, + "learning_rate": 1.0740069925483447e-05, + "loss": 0.005, + "step": 382230 + }, + { + "epoch": 1.93, + "learning_rate": 1.0732502232469437e-05, + "loss": 0.0099, + "step": 382240 + }, + { + "epoch": 1.93, + "learning_rate": 1.0724934539455427e-05, + "loss": 0.0048, + "step": 382250 + }, + { + "epoch": 1.93, + "learning_rate": 1.0717366846441417e-05, + "loss": 0.0069, + "step": 382260 + }, + { + "epoch": 1.93, + "learning_rate": 1.0709799153427407e-05, + "loss": 0.0053, + "step": 382270 + }, + { + "epoch": 1.93, + "learning_rate": 1.0702231460413397e-05, + "loss": 0.0056, + "step": 382280 + }, + { + "epoch": 1.93, + "learning_rate": 1.0694663767399385e-05, + "loss": 0.0055, + "step": 382290 + }, + { + "epoch": 1.93, + "learning_rate": 1.0687096074385375e-05, + "loss": 0.0042, + "step": 382300 + }, + { + "epoch": 1.93, + "learning_rate": 1.0679528381371365e-05, + "loss": 0.0063, + "step": 382310 + }, + { + "epoch": 1.93, + "learning_rate": 1.0671960688357355e-05, + "loss": 0.0042, + "step": 382320 + }, + { + "epoch": 1.93, + "learning_rate": 1.0664392995343345e-05, + "loss": 0.0076, + "step": 382330 + }, + { + "epoch": 1.93, + "learning_rate": 1.0656825302329335e-05, + "loss": 0.006, + "step": 382340 + }, + { + "epoch": 1.93, + "learning_rate": 1.0649257609315325e-05, + "loss": 0.0054, + "step": 382350 + }, + { + "epoch": 1.93, + "learning_rate": 1.0641689916301315e-05, + "loss": 0.0044, + "step": 382360 + }, + { + "epoch": 1.93, + "learning_rate": 1.0634122223287303e-05, + "loss": 0.0074, + "step": 382370 + }, + { + "epoch": 1.93, + "learning_rate": 1.0626554530273293e-05, + "loss": 0.005, + "step": 382380 + }, + { + "epoch": 1.93, + "learning_rate": 1.0618986837259283e-05, + "loss": 0.0049, + "step": 382390 + }, + { + "epoch": 1.93, + "learning_rate": 1.0611419144245273e-05, + "loss": 0.0055, + "step": 382400 + }, + { + "epoch": 1.93, + "learning_rate": 1.0603851451231262e-05, + "loss": 0.0056, + "step": 382410 + }, + { + "epoch": 1.93, + "learning_rate": 1.0596283758217252e-05, + "loss": 0.0063, + "step": 382420 + }, + { + "epoch": 1.93, + "learning_rate": 1.0588716065203242e-05, + "loss": 0.0047, + "step": 382430 + }, + { + "epoch": 1.93, + "learning_rate": 1.0581148372189232e-05, + "loss": 0.0059, + "step": 382440 + }, + { + "epoch": 1.93, + "learning_rate": 1.057358067917522e-05, + "loss": 0.0059, + "step": 382450 + }, + { + "epoch": 1.93, + "learning_rate": 1.056601298616121e-05, + "loss": 0.0071, + "step": 382460 + }, + { + "epoch": 1.93, + "learning_rate": 1.05584452931472e-05, + "loss": 0.0071, + "step": 382470 + }, + { + "epoch": 1.93, + "learning_rate": 1.055087760013319e-05, + "loss": 0.0035, + "step": 382480 + }, + { + "epoch": 1.93, + "learning_rate": 1.054330990711918e-05, + "loss": 0.0061, + "step": 382490 + }, + { + "epoch": 1.93, + "learning_rate": 1.053574221410517e-05, + "loss": 0.0059, + "step": 382500 + }, + { + "epoch": 1.93, + "learning_rate": 1.052817452109116e-05, + "loss": 0.007, + "step": 382510 + }, + { + "epoch": 1.93, + "learning_rate": 1.052060682807715e-05, + "loss": 0.0069, + "step": 382520 + }, + { + "epoch": 1.93, + "learning_rate": 1.0513039135063138e-05, + "loss": 0.0043, + "step": 382530 + }, + { + "epoch": 1.93, + "learning_rate": 1.0505471442049128e-05, + "loss": 0.0041, + "step": 382540 + }, + { + "epoch": 1.93, + "learning_rate": 1.0497903749035118e-05, + "loss": 0.0048, + "step": 382550 + }, + { + "epoch": 1.93, + "learning_rate": 1.0490336056021108e-05, + "loss": 0.0055, + "step": 382560 + }, + { + "epoch": 1.93, + "learning_rate": 1.0482768363007098e-05, + "loss": 0.0065, + "step": 382570 + }, + { + "epoch": 1.93, + "learning_rate": 1.0475200669993088e-05, + "loss": 0.0079, + "step": 382580 + }, + { + "epoch": 1.93, + "learning_rate": 1.0467632976979077e-05, + "loss": 0.0053, + "step": 382590 + }, + { + "epoch": 1.93, + "learning_rate": 1.0460065283965067e-05, + "loss": 0.0044, + "step": 382600 + }, + { + "epoch": 1.93, + "learning_rate": 1.0452497590951056e-05, + "loss": 0.0052, + "step": 382610 + }, + { + "epoch": 1.93, + "learning_rate": 1.0444929897937046e-05, + "loss": 0.0059, + "step": 382620 + }, + { + "epoch": 1.93, + "learning_rate": 1.0437362204923035e-05, + "loss": 0.006, + "step": 382630 + }, + { + "epoch": 1.93, + "learning_rate": 1.0429794511909025e-05, + "loss": 0.0057, + "step": 382640 + }, + { + "epoch": 1.93, + "learning_rate": 1.0422226818895015e-05, + "loss": 0.0076, + "step": 382650 + }, + { + "epoch": 1.93, + "learning_rate": 1.0414659125881005e-05, + "loss": 0.0061, + "step": 382660 + }, + { + "epoch": 1.93, + "learning_rate": 1.0407091432866995e-05, + "loss": 0.006, + "step": 382670 + }, + { + "epoch": 1.93, + "learning_rate": 1.0399523739852985e-05, + "loss": 0.0087, + "step": 382680 + }, + { + "epoch": 1.93, + "learning_rate": 1.0391956046838973e-05, + "loss": 0.0045, + "step": 382690 + }, + { + "epoch": 1.93, + "learning_rate": 1.0384388353824963e-05, + "loss": 0.0098, + "step": 382700 + }, + { + "epoch": 1.93, + "learning_rate": 1.0376820660810953e-05, + "loss": 0.0071, + "step": 382710 + }, + { + "epoch": 1.93, + "learning_rate": 1.0369252967796943e-05, + "loss": 0.0084, + "step": 382720 + }, + { + "epoch": 1.93, + "learning_rate": 1.0361685274782933e-05, + "loss": 0.0049, + "step": 382730 + }, + { + "epoch": 1.93, + "learning_rate": 1.0354117581768923e-05, + "loss": 0.0049, + "step": 382740 + }, + { + "epoch": 1.93, + "learning_rate": 1.0346549888754913e-05, + "loss": 0.0058, + "step": 382750 + }, + { + "epoch": 1.93, + "learning_rate": 1.0338982195740903e-05, + "loss": 0.0052, + "step": 382760 + }, + { + "epoch": 1.93, + "learning_rate": 1.033141450272689e-05, + "loss": 0.0062, + "step": 382770 + }, + { + "epoch": 1.93, + "learning_rate": 1.032384680971288e-05, + "loss": 0.0063, + "step": 382780 + }, + { + "epoch": 1.93, + "learning_rate": 1.031627911669887e-05, + "loss": 0.0053, + "step": 382790 + }, + { + "epoch": 1.93, + "learning_rate": 1.030871142368486e-05, + "loss": 0.0045, + "step": 382800 + }, + { + "epoch": 1.93, + "learning_rate": 1.030114373067085e-05, + "loss": 0.0066, + "step": 382810 + }, + { + "epoch": 1.93, + "learning_rate": 1.029357603765684e-05, + "loss": 0.0041, + "step": 382820 + }, + { + "epoch": 1.93, + "learning_rate": 1.028600834464283e-05, + "loss": 0.0052, + "step": 382830 + }, + { + "epoch": 1.93, + "learning_rate": 1.0278440651628819e-05, + "loss": 0.0047, + "step": 382840 + }, + { + "epoch": 1.93, + "learning_rate": 1.0270872958614808e-05, + "loss": 0.0066, + "step": 382850 + }, + { + "epoch": 1.93, + "learning_rate": 1.0263305265600798e-05, + "loss": 0.0048, + "step": 382860 + }, + { + "epoch": 1.93, + "learning_rate": 1.0255737572586788e-05, + "loss": 0.0049, + "step": 382870 + }, + { + "epoch": 1.93, + "learning_rate": 1.0248169879572778e-05, + "loss": 0.0068, + "step": 382880 + }, + { + "epoch": 1.93, + "learning_rate": 1.0240602186558768e-05, + "loss": 0.0076, + "step": 382890 + }, + { + "epoch": 1.93, + "learning_rate": 1.0233034493544758e-05, + "loss": 0.0071, + "step": 382900 + }, + { + "epoch": 1.93, + "learning_rate": 1.0225466800530748e-05, + "loss": 0.0076, + "step": 382910 + }, + { + "epoch": 1.93, + "learning_rate": 1.0217899107516736e-05, + "loss": 0.0052, + "step": 382920 + }, + { + "epoch": 1.93, + "learning_rate": 1.0210331414502726e-05, + "loss": 0.0052, + "step": 382930 + }, + { + "epoch": 1.93, + "learning_rate": 1.0202763721488716e-05, + "loss": 0.0068, + "step": 382940 + }, + { + "epoch": 1.93, + "learning_rate": 1.0195196028474706e-05, + "loss": 0.0077, + "step": 382950 + }, + { + "epoch": 1.93, + "learning_rate": 1.0187628335460696e-05, + "loss": 0.0064, + "step": 382960 + }, + { + "epoch": 1.93, + "learning_rate": 1.0180060642446686e-05, + "loss": 0.0052, + "step": 382970 + }, + { + "epoch": 1.93, + "learning_rate": 1.0172492949432676e-05, + "loss": 0.0055, + "step": 382980 + }, + { + "epoch": 1.93, + "learning_rate": 1.0164925256418666e-05, + "loss": 0.006, + "step": 382990 + }, + { + "epoch": 1.93, + "learning_rate": 1.0157357563404652e-05, + "loss": 0.0059, + "step": 383000 + }, + { + "epoch": 1.93, + "eval_cer": 0.9144265880775191, + "eval_loss": 0.004191742278635502, + "eval_runtime": 116.3481, + "eval_samples_per_second": 17.19, + "eval_steps_per_second": 4.297, + "step": 383000 + }, + { + "epoch": 1.93, + "learning_rate": 1.0149789870390642e-05, + "loss": 0.0063, + "step": 383010 + }, + { + "epoch": 1.93, + "learning_rate": 1.0142222177376632e-05, + "loss": 0.0046, + "step": 383020 + }, + { + "epoch": 1.93, + "learning_rate": 1.0134654484362622e-05, + "loss": 0.0064, + "step": 383030 + }, + { + "epoch": 1.93, + "learning_rate": 1.0127086791348613e-05, + "loss": 0.0064, + "step": 383040 + }, + { + "epoch": 1.93, + "learning_rate": 1.0119519098334603e-05, + "loss": 0.0057, + "step": 383050 + }, + { + "epoch": 1.93, + "learning_rate": 1.0111951405320593e-05, + "loss": 0.0048, + "step": 383060 + }, + { + "epoch": 1.93, + "learning_rate": 1.0104383712306583e-05, + "loss": 0.0055, + "step": 383070 + }, + { + "epoch": 1.93, + "learning_rate": 1.009681601929257e-05, + "loss": 0.0067, + "step": 383080 + }, + { + "epoch": 1.93, + "learning_rate": 1.008924832627856e-05, + "loss": 0.0062, + "step": 383090 + }, + { + "epoch": 1.93, + "learning_rate": 1.008168063326455e-05, + "loss": 0.0055, + "step": 383100 + }, + { + "epoch": 1.93, + "learning_rate": 1.007411294025054e-05, + "loss": 0.0048, + "step": 383110 + }, + { + "epoch": 1.93, + "learning_rate": 1.006654524723653e-05, + "loss": 0.0047, + "step": 383120 + }, + { + "epoch": 1.93, + "learning_rate": 1.005897755422252e-05, + "loss": 0.0055, + "step": 383130 + }, + { + "epoch": 1.93, + "learning_rate": 1.0051409861208509e-05, + "loss": 0.0057, + "step": 383140 + }, + { + "epoch": 1.93, + "learning_rate": 1.0043842168194499e-05, + "loss": 0.0059, + "step": 383150 + }, + { + "epoch": 1.93, + "learning_rate": 1.0036274475180487e-05, + "loss": 0.005, + "step": 383160 + }, + { + "epoch": 1.93, + "learning_rate": 1.0028706782166477e-05, + "loss": 0.0043, + "step": 383170 + }, + { + "epoch": 1.93, + "learning_rate": 1.0021139089152467e-05, + "loss": 0.0054, + "step": 383180 + }, + { + "epoch": 1.93, + "learning_rate": 1.0013571396138457e-05, + "loss": 0.0057, + "step": 383190 + }, + { + "epoch": 1.93, + "learning_rate": 1.0006003703124447e-05, + "loss": 0.0063, + "step": 383200 + }, + { + "epoch": 1.93, + "learning_rate": 9.998436010110437e-06, + "loss": 0.0059, + "step": 383210 + }, + { + "epoch": 1.93, + "learning_rate": 9.990868317096427e-06, + "loss": 0.0083, + "step": 383220 + }, + { + "epoch": 1.93, + "learning_rate": 9.983300624082417e-06, + "loss": 0.004, + "step": 383230 + }, + { + "epoch": 1.93, + "learning_rate": 9.975732931068405e-06, + "loss": 0.0071, + "step": 383240 + }, + { + "epoch": 1.93, + "learning_rate": 9.968165238054395e-06, + "loss": 0.0043, + "step": 383250 + }, + { + "epoch": 1.93, + "learning_rate": 9.960597545040385e-06, + "loss": 0.0045, + "step": 383260 + }, + { + "epoch": 1.93, + "learning_rate": 9.953029852026375e-06, + "loss": 0.0071, + "step": 383270 + }, + { + "epoch": 1.93, + "learning_rate": 9.945462159012365e-06, + "loss": 0.0075, + "step": 383280 + }, + { + "epoch": 1.93, + "learning_rate": 9.937894465998354e-06, + "loss": 0.0059, + "step": 383290 + }, + { + "epoch": 1.93, + "learning_rate": 9.930326772984344e-06, + "loss": 0.0062, + "step": 383300 + }, + { + "epoch": 1.93, + "learning_rate": 9.922759079970334e-06, + "loss": 0.0057, + "step": 383310 + }, + { + "epoch": 1.93, + "learning_rate": 9.915191386956322e-06, + "loss": 0.0051, + "step": 383320 + }, + { + "epoch": 1.93, + "learning_rate": 9.907623693942312e-06, + "loss": 0.0055, + "step": 383330 + }, + { + "epoch": 1.93, + "learning_rate": 9.900056000928302e-06, + "loss": 0.0058, + "step": 383340 + }, + { + "epoch": 1.93, + "learning_rate": 9.892488307914292e-06, + "loss": 0.0051, + "step": 383350 + }, + { + "epoch": 1.93, + "learning_rate": 9.884920614900282e-06, + "loss": 0.0057, + "step": 383360 + }, + { + "epoch": 1.93, + "learning_rate": 9.877352921886272e-06, + "loss": 0.0066, + "step": 383370 + }, + { + "epoch": 1.93, + "learning_rate": 9.869785228872262e-06, + "loss": 0.0049, + "step": 383380 + }, + { + "epoch": 1.93, + "learning_rate": 9.86221753585825e-06, + "loss": 0.0061, + "step": 383390 + }, + { + "epoch": 1.93, + "learning_rate": 9.85464984284424e-06, + "loss": 0.0039, + "step": 383400 + }, + { + "epoch": 1.93, + "learning_rate": 9.84708214983023e-06, + "loss": 0.0051, + "step": 383410 + }, + { + "epoch": 1.93, + "learning_rate": 9.83951445681622e-06, + "loss": 0.0043, + "step": 383420 + }, + { + "epoch": 1.93, + "learning_rate": 9.83194676380221e-06, + "loss": 0.0051, + "step": 383430 + }, + { + "epoch": 1.93, + "learning_rate": 9.8243790707882e-06, + "loss": 0.004, + "step": 383440 + }, + { + "epoch": 1.93, + "learning_rate": 9.81681137777419e-06, + "loss": 0.0047, + "step": 383450 + }, + { + "epoch": 1.93, + "learning_rate": 9.80924368476018e-06, + "loss": 0.0041, + "step": 383460 + }, + { + "epoch": 1.93, + "learning_rate": 9.801675991746168e-06, + "loss": 0.005, + "step": 383470 + }, + { + "epoch": 1.93, + "learning_rate": 9.794108298732158e-06, + "loss": 0.0055, + "step": 383480 + }, + { + "epoch": 1.93, + "learning_rate": 9.786540605718148e-06, + "loss": 0.0049, + "step": 383490 + }, + { + "epoch": 1.93, + "learning_rate": 9.778972912704138e-06, + "loss": 0.0054, + "step": 383500 + }, + { + "epoch": 1.93, + "learning_rate": 9.771405219690127e-06, + "loss": 0.0079, + "step": 383510 + }, + { + "epoch": 1.93, + "learning_rate": 9.763837526676117e-06, + "loss": 0.0044, + "step": 383520 + }, + { + "epoch": 1.93, + "learning_rate": 9.756269833662107e-06, + "loss": 0.0052, + "step": 383530 + }, + { + "epoch": 1.94, + "learning_rate": 9.748702140648097e-06, + "loss": 0.0059, + "step": 383540 + }, + { + "epoch": 1.94, + "learning_rate": 9.741134447634085e-06, + "loss": 0.006, + "step": 383550 + }, + { + "epoch": 1.94, + "learning_rate": 9.733566754620075e-06, + "loss": 0.0043, + "step": 383560 + }, + { + "epoch": 1.94, + "learning_rate": 9.725999061606065e-06, + "loss": 0.0065, + "step": 383570 + }, + { + "epoch": 1.94, + "learning_rate": 9.718431368592055e-06, + "loss": 0.005, + "step": 383580 + }, + { + "epoch": 1.94, + "learning_rate": 9.710863675578045e-06, + "loss": 0.0067, + "step": 383590 + }, + { + "epoch": 1.94, + "learning_rate": 9.703295982564035e-06, + "loss": 0.0065, + "step": 383600 + }, + { + "epoch": 1.94, + "learning_rate": 9.695728289550025e-06, + "loss": 0.0047, + "step": 383610 + }, + { + "epoch": 1.94, + "learning_rate": 9.688160596536015e-06, + "loss": 0.0043, + "step": 383620 + }, + { + "epoch": 1.94, + "learning_rate": 9.680592903522003e-06, + "loss": 0.005, + "step": 383630 + }, + { + "epoch": 1.94, + "learning_rate": 9.673025210507993e-06, + "loss": 0.0059, + "step": 383640 + }, + { + "epoch": 1.94, + "learning_rate": 9.665457517493983e-06, + "loss": 0.0063, + "step": 383650 + }, + { + "epoch": 1.94, + "learning_rate": 9.657889824479973e-06, + "loss": 0.006, + "step": 383660 + }, + { + "epoch": 1.94, + "learning_rate": 9.650322131465963e-06, + "loss": 0.0053, + "step": 383670 + }, + { + "epoch": 1.94, + "learning_rate": 9.642754438451953e-06, + "loss": 0.0049, + "step": 383680 + }, + { + "epoch": 1.94, + "learning_rate": 9.635186745437942e-06, + "loss": 0.0068, + "step": 383690 + }, + { + "epoch": 1.94, + "learning_rate": 9.627619052423932e-06, + "loss": 0.0036, + "step": 383700 + }, + { + "epoch": 1.94, + "learning_rate": 9.62005135940992e-06, + "loss": 0.0044, + "step": 383710 + }, + { + "epoch": 1.94, + "learning_rate": 9.61248366639591e-06, + "loss": 0.0053, + "step": 383720 + }, + { + "epoch": 1.94, + "learning_rate": 9.6049159733819e-06, + "loss": 0.0055, + "step": 383730 + }, + { + "epoch": 1.94, + "learning_rate": 9.59734828036789e-06, + "loss": 0.0056, + "step": 383740 + }, + { + "epoch": 1.94, + "learning_rate": 9.58978058735388e-06, + "loss": 0.0042, + "step": 383750 + }, + { + "epoch": 1.94, + "learning_rate": 9.58221289433987e-06, + "loss": 0.0057, + "step": 383760 + }, + { + "epoch": 1.94, + "learning_rate": 9.57464520132586e-06, + "loss": 0.0045, + "step": 383770 + }, + { + "epoch": 1.94, + "learning_rate": 9.56707750831185e-06, + "loss": 0.0056, + "step": 383780 + }, + { + "epoch": 1.94, + "learning_rate": 9.559509815297838e-06, + "loss": 0.0051, + "step": 383790 + }, + { + "epoch": 1.94, + "learning_rate": 9.551942122283828e-06, + "loss": 0.006, + "step": 383800 + }, + { + "epoch": 1.94, + "learning_rate": 9.544374429269818e-06, + "loss": 0.0075, + "step": 383810 + }, + { + "epoch": 1.94, + "learning_rate": 9.536806736255808e-06, + "loss": 0.0054, + "step": 383820 + }, + { + "epoch": 1.94, + "learning_rate": 9.529239043241798e-06, + "loss": 0.0052, + "step": 383830 + }, + { + "epoch": 1.94, + "learning_rate": 9.521671350227788e-06, + "loss": 0.0061, + "step": 383840 + }, + { + "epoch": 1.94, + "learning_rate": 9.514103657213778e-06, + "loss": 0.0046, + "step": 383850 + }, + { + "epoch": 1.94, + "learning_rate": 9.506535964199768e-06, + "loss": 0.0058, + "step": 383860 + }, + { + "epoch": 1.94, + "learning_rate": 9.498968271185754e-06, + "loss": 0.0048, + "step": 383870 + }, + { + "epoch": 1.94, + "learning_rate": 9.491400578171746e-06, + "loss": 0.0042, + "step": 383880 + }, + { + "epoch": 1.94, + "learning_rate": 9.483832885157736e-06, + "loss": 0.0055, + "step": 383890 + }, + { + "epoch": 1.94, + "learning_rate": 9.476265192143726e-06, + "loss": 0.0061, + "step": 383900 + }, + { + "epoch": 1.94, + "learning_rate": 9.468697499129715e-06, + "loss": 0.009, + "step": 383910 + }, + { + "epoch": 1.94, + "learning_rate": 9.461129806115705e-06, + "loss": 0.0062, + "step": 383920 + }, + { + "epoch": 1.94, + "learning_rate": 9.453562113101695e-06, + "loss": 0.005, + "step": 383930 + }, + { + "epoch": 1.94, + "learning_rate": 9.445994420087682e-06, + "loss": 0.0058, + "step": 383940 + }, + { + "epoch": 1.94, + "learning_rate": 9.438426727073672e-06, + "loss": 0.0078, + "step": 383950 + }, + { + "epoch": 1.94, + "learning_rate": 9.430859034059662e-06, + "loss": 0.0058, + "step": 383960 + }, + { + "epoch": 1.94, + "learning_rate": 9.423291341045652e-06, + "loss": 0.0057, + "step": 383970 + }, + { + "epoch": 1.94, + "learning_rate": 9.415723648031641e-06, + "loss": 0.0046, + "step": 383980 + }, + { + "epoch": 1.94, + "learning_rate": 9.408155955017631e-06, + "loss": 0.0062, + "step": 383990 + }, + { + "epoch": 1.94, + "learning_rate": 9.400588262003621e-06, + "loss": 0.0047, + "step": 384000 + }, + { + "epoch": 1.94, + "eval_cer": 0.9144159137201398, + "eval_loss": 0.004220431204885244, + "eval_runtime": 116.4383, + "eval_samples_per_second": 17.176, + "eval_steps_per_second": 4.294, + "step": 384000 + }, + { + "epoch": 1.94, + "learning_rate": 9.393020568989613e-06, + "loss": 0.0066, + "step": 384010 + }, + { + "epoch": 1.94, + "learning_rate": 9.3854528759756e-06, + "loss": 0.0059, + "step": 384020 + }, + { + "epoch": 1.94, + "learning_rate": 9.37788518296159e-06, + "loss": 0.0034, + "step": 384030 + }, + { + "epoch": 1.94, + "learning_rate": 9.37031748994758e-06, + "loss": 0.0055, + "step": 384040 + }, + { + "epoch": 1.94, + "learning_rate": 9.36274979693357e-06, + "loss": 0.0049, + "step": 384050 + }, + { + "epoch": 1.94, + "learning_rate": 9.355182103919559e-06, + "loss": 0.0035, + "step": 384060 + }, + { + "epoch": 1.94, + "learning_rate": 9.347614410905549e-06, + "loss": 0.0055, + "step": 384070 + }, + { + "epoch": 1.94, + "learning_rate": 9.340046717891539e-06, + "loss": 0.0041, + "step": 384080 + }, + { + "epoch": 1.94, + "learning_rate": 9.332479024877529e-06, + "loss": 0.005, + "step": 384090 + }, + { + "epoch": 1.94, + "learning_rate": 9.324911331863519e-06, + "loss": 0.0058, + "step": 384100 + }, + { + "epoch": 1.94, + "learning_rate": 9.317343638849509e-06, + "loss": 0.0052, + "step": 384110 + }, + { + "epoch": 1.94, + "learning_rate": 9.309775945835497e-06, + "loss": 0.0056, + "step": 384120 + }, + { + "epoch": 1.94, + "learning_rate": 9.302208252821487e-06, + "loss": 0.0062, + "step": 384130 + }, + { + "epoch": 1.94, + "learning_rate": 9.294640559807477e-06, + "loss": 0.0073, + "step": 384140 + }, + { + "epoch": 1.94, + "learning_rate": 9.287072866793467e-06, + "loss": 0.0071, + "step": 384150 + }, + { + "epoch": 1.94, + "learning_rate": 9.279505173779457e-06, + "loss": 0.0048, + "step": 384160 + }, + { + "epoch": 1.94, + "learning_rate": 9.271937480765446e-06, + "loss": 0.0054, + "step": 384170 + }, + { + "epoch": 1.94, + "learning_rate": 9.264369787751436e-06, + "loss": 0.007, + "step": 384180 + }, + { + "epoch": 1.94, + "learning_rate": 9.256802094737426e-06, + "loss": 0.0053, + "step": 384190 + }, + { + "epoch": 1.94, + "learning_rate": 9.249234401723414e-06, + "loss": 0.0051, + "step": 384200 + }, + { + "epoch": 1.94, + "learning_rate": 9.241666708709404e-06, + "loss": 0.0057, + "step": 384210 + }, + { + "epoch": 1.94, + "learning_rate": 9.234099015695394e-06, + "loss": 0.0054, + "step": 384220 + }, + { + "epoch": 1.94, + "learning_rate": 9.226531322681384e-06, + "loss": 0.0039, + "step": 384230 + }, + { + "epoch": 1.94, + "learning_rate": 9.218963629667374e-06, + "loss": 0.0054, + "step": 384240 + }, + { + "epoch": 1.94, + "learning_rate": 9.211395936653364e-06, + "loss": 0.0042, + "step": 384250 + }, + { + "epoch": 1.94, + "learning_rate": 9.203828243639354e-06, + "loss": 0.0073, + "step": 384260 + }, + { + "epoch": 1.94, + "learning_rate": 9.196260550625344e-06, + "loss": 0.0076, + "step": 384270 + }, + { + "epoch": 1.94, + "learning_rate": 9.188692857611332e-06, + "loss": 0.0051, + "step": 384280 + }, + { + "epoch": 1.94, + "learning_rate": 9.181125164597322e-06, + "loss": 0.0066, + "step": 384290 + }, + { + "epoch": 1.94, + "learning_rate": 9.173557471583312e-06, + "loss": 0.0052, + "step": 384300 + }, + { + "epoch": 1.94, + "learning_rate": 9.165989778569302e-06, + "loss": 0.004, + "step": 384310 + }, + { + "epoch": 1.94, + "learning_rate": 9.158422085555292e-06, + "loss": 0.0066, + "step": 384320 + }, + { + "epoch": 1.94, + "learning_rate": 9.150854392541282e-06, + "loss": 0.0052, + "step": 384330 + }, + { + "epoch": 1.94, + "learning_rate": 9.143286699527272e-06, + "loss": 0.0047, + "step": 384340 + }, + { + "epoch": 1.94, + "learning_rate": 9.135719006513261e-06, + "loss": 0.006, + "step": 384350 + }, + { + "epoch": 1.94, + "learning_rate": 9.12815131349925e-06, + "loss": 0.0048, + "step": 384360 + }, + { + "epoch": 1.94, + "learning_rate": 9.12058362048524e-06, + "loss": 0.006, + "step": 384370 + }, + { + "epoch": 1.94, + "learning_rate": 9.11301592747123e-06, + "loss": 0.0055, + "step": 384380 + }, + { + "epoch": 1.94, + "learning_rate": 9.10544823445722e-06, + "loss": 0.0052, + "step": 384390 + }, + { + "epoch": 1.94, + "learning_rate": 9.097880541443208e-06, + "loss": 0.0067, + "step": 384400 + }, + { + "epoch": 1.94, + "learning_rate": 9.090312848429198e-06, + "loss": 0.004, + "step": 384410 + }, + { + "epoch": 1.94, + "learning_rate": 9.082745155415187e-06, + "loss": 0.0062, + "step": 384420 + }, + { + "epoch": 1.94, + "learning_rate": 9.075177462401179e-06, + "loss": 0.0058, + "step": 384430 + }, + { + "epoch": 1.94, + "learning_rate": 9.067609769387167e-06, + "loss": 0.0055, + "step": 384440 + }, + { + "epoch": 1.94, + "learning_rate": 9.060042076373157e-06, + "loss": 0.0067, + "step": 384450 + }, + { + "epoch": 1.94, + "learning_rate": 9.052474383359147e-06, + "loss": 0.0056, + "step": 384460 + }, + { + "epoch": 1.94, + "learning_rate": 9.044906690345135e-06, + "loss": 0.0041, + "step": 384470 + }, + { + "epoch": 1.94, + "learning_rate": 9.037338997331125e-06, + "loss": 0.0043, + "step": 384480 + }, + { + "epoch": 1.94, + "learning_rate": 9.029771304317115e-06, + "loss": 0.0047, + "step": 384490 + }, + { + "epoch": 1.94, + "learning_rate": 9.022203611303105e-06, + "loss": 0.0062, + "step": 384500 + }, + { + "epoch": 1.94, + "learning_rate": 9.014635918289095e-06, + "loss": 0.0053, + "step": 384510 + }, + { + "epoch": 1.94, + "learning_rate": 9.007068225275085e-06, + "loss": 0.0064, + "step": 384520 + }, + { + "epoch": 1.94, + "learning_rate": 8.999500532261075e-06, + "loss": 0.0056, + "step": 384530 + }, + { + "epoch": 1.94, + "learning_rate": 8.991932839247065e-06, + "loss": 0.0057, + "step": 384540 + }, + { + "epoch": 1.94, + "learning_rate": 8.984365146233053e-06, + "loss": 0.0083, + "step": 384550 + }, + { + "epoch": 1.94, + "learning_rate": 8.976797453219043e-06, + "loss": 0.0074, + "step": 384560 + }, + { + "epoch": 1.94, + "learning_rate": 8.969229760205033e-06, + "loss": 0.004, + "step": 384570 + }, + { + "epoch": 1.94, + "learning_rate": 8.961662067191023e-06, + "loss": 0.0054, + "step": 384580 + }, + { + "epoch": 1.94, + "learning_rate": 8.954094374177013e-06, + "loss": 0.0074, + "step": 384590 + }, + { + "epoch": 1.94, + "learning_rate": 8.946526681163003e-06, + "loss": 0.0044, + "step": 384600 + }, + { + "epoch": 1.94, + "learning_rate": 8.938958988148992e-06, + "loss": 0.0072, + "step": 384610 + }, + { + "epoch": 1.94, + "learning_rate": 8.931391295134982e-06, + "loss": 0.0057, + "step": 384620 + }, + { + "epoch": 1.94, + "learning_rate": 8.92382360212097e-06, + "loss": 0.0056, + "step": 384630 + }, + { + "epoch": 1.94, + "learning_rate": 8.91625590910696e-06, + "loss": 0.0046, + "step": 384640 + }, + { + "epoch": 1.94, + "learning_rate": 8.90868821609295e-06, + "loss": 0.0042, + "step": 384650 + }, + { + "epoch": 1.94, + "learning_rate": 8.90112052307894e-06, + "loss": 0.0053, + "step": 384660 + }, + { + "epoch": 1.94, + "learning_rate": 8.89355283006493e-06, + "loss": 0.0053, + "step": 384670 + }, + { + "epoch": 1.94, + "learning_rate": 8.88598513705092e-06, + "loss": 0.0058, + "step": 384680 + }, + { + "epoch": 1.94, + "learning_rate": 8.87841744403691e-06, + "loss": 0.0053, + "step": 384690 + }, + { + "epoch": 1.94, + "learning_rate": 8.8708497510229e-06, + "loss": 0.0072, + "step": 384700 + }, + { + "epoch": 1.94, + "learning_rate": 8.863282058008888e-06, + "loss": 0.0055, + "step": 384710 + }, + { + "epoch": 1.94, + "learning_rate": 8.855714364994878e-06, + "loss": 0.0063, + "step": 384720 + }, + { + "epoch": 1.94, + "learning_rate": 8.848146671980868e-06, + "loss": 0.0064, + "step": 384730 + }, + { + "epoch": 1.94, + "learning_rate": 8.840578978966858e-06, + "loss": 0.0066, + "step": 384740 + }, + { + "epoch": 1.94, + "learning_rate": 8.833011285952848e-06, + "loss": 0.0059, + "step": 384750 + }, + { + "epoch": 1.94, + "learning_rate": 8.825443592938838e-06, + "loss": 0.0049, + "step": 384760 + }, + { + "epoch": 1.94, + "learning_rate": 8.817875899924828e-06, + "loss": 0.007, + "step": 384770 + }, + { + "epoch": 1.94, + "learning_rate": 8.810308206910818e-06, + "loss": 0.0046, + "step": 384780 + }, + { + "epoch": 1.94, + "learning_rate": 8.802740513896806e-06, + "loss": 0.0057, + "step": 384790 + }, + { + "epoch": 1.94, + "learning_rate": 8.795172820882796e-06, + "loss": 0.0062, + "step": 384800 + }, + { + "epoch": 1.94, + "learning_rate": 8.787605127868786e-06, + "loss": 0.0076, + "step": 384810 + }, + { + "epoch": 1.94, + "learning_rate": 8.780037434854776e-06, + "loss": 0.0067, + "step": 384820 + }, + { + "epoch": 1.94, + "learning_rate": 8.772469741840764e-06, + "loss": 0.0071, + "step": 384830 + }, + { + "epoch": 1.94, + "learning_rate": 8.764902048826754e-06, + "loss": 0.0048, + "step": 384840 + }, + { + "epoch": 1.94, + "learning_rate": 8.757334355812745e-06, + "loss": 0.0088, + "step": 384850 + }, + { + "epoch": 1.94, + "learning_rate": 8.749766662798735e-06, + "loss": 0.0055, + "step": 384860 + }, + { + "epoch": 1.94, + "learning_rate": 8.742198969784723e-06, + "loss": 0.0062, + "step": 384870 + }, + { + "epoch": 1.94, + "learning_rate": 8.734631276770713e-06, + "loss": 0.0078, + "step": 384880 + }, + { + "epoch": 1.94, + "learning_rate": 8.727063583756703e-06, + "loss": 0.0059, + "step": 384890 + }, + { + "epoch": 1.94, + "learning_rate": 8.719495890742693e-06, + "loss": 0.0042, + "step": 384900 + }, + { + "epoch": 1.94, + "learning_rate": 8.711928197728681e-06, + "loss": 0.0059, + "step": 384910 + }, + { + "epoch": 1.94, + "learning_rate": 8.704360504714671e-06, + "loss": 0.0047, + "step": 384920 + }, + { + "epoch": 1.94, + "learning_rate": 8.696792811700661e-06, + "loss": 0.0088, + "step": 384930 + }, + { + "epoch": 1.94, + "learning_rate": 8.689225118686651e-06, + "loss": 0.0042, + "step": 384940 + }, + { + "epoch": 1.94, + "learning_rate": 8.681657425672641e-06, + "loss": 0.0049, + "step": 384950 + }, + { + "epoch": 1.94, + "learning_rate": 8.674089732658631e-06, + "loss": 0.007, + "step": 384960 + }, + { + "epoch": 1.94, + "learning_rate": 8.66652203964462e-06, + "loss": 0.0054, + "step": 384970 + }, + { + "epoch": 1.94, + "learning_rate": 8.65895434663061e-06, + "loss": 0.0049, + "step": 384980 + }, + { + "epoch": 1.94, + "learning_rate": 8.651386653616599e-06, + "loss": 0.0048, + "step": 384990 + }, + { + "epoch": 1.94, + "learning_rate": 8.643818960602589e-06, + "loss": 0.0064, + "step": 385000 + }, + { + "epoch": 1.94, + "eval_cer": 0.914423676889143, + "eval_loss": 0.0041769566014409065, + "eval_runtime": 116.103, + "eval_samples_per_second": 17.226, + "eval_steps_per_second": 4.307, + "step": 385000 + }, + { + "epoch": 1.94, + "learning_rate": 8.636251267588579e-06, + "loss": 0.0061, + "step": 385010 + }, + { + "epoch": 1.94, + "learning_rate": 8.628683574574569e-06, + "loss": 0.0048, + "step": 385020 + }, + { + "epoch": 1.94, + "learning_rate": 8.621115881560559e-06, + "loss": 0.0053, + "step": 385030 + }, + { + "epoch": 1.94, + "learning_rate": 8.613548188546549e-06, + "loss": 0.0046, + "step": 385040 + }, + { + "epoch": 1.94, + "learning_rate": 8.605980495532538e-06, + "loss": 0.0047, + "step": 385050 + }, + { + "epoch": 1.94, + "learning_rate": 8.598412802518527e-06, + "loss": 0.0063, + "step": 385060 + }, + { + "epoch": 1.94, + "learning_rate": 8.590845109504517e-06, + "loss": 0.0051, + "step": 385070 + }, + { + "epoch": 1.94, + "learning_rate": 8.583277416490506e-06, + "loss": 0.0051, + "step": 385080 + }, + { + "epoch": 1.94, + "learning_rate": 8.575709723476496e-06, + "loss": 0.0059, + "step": 385090 + }, + { + "epoch": 1.94, + "learning_rate": 8.568142030462486e-06, + "loss": 0.005, + "step": 385100 + }, + { + "epoch": 1.94, + "learning_rate": 8.560574337448476e-06, + "loss": 0.0055, + "step": 385110 + }, + { + "epoch": 1.94, + "learning_rate": 8.553006644434466e-06, + "loss": 0.0067, + "step": 385120 + }, + { + "epoch": 1.94, + "learning_rate": 8.545438951420456e-06, + "loss": 0.005, + "step": 385130 + }, + { + "epoch": 1.94, + "learning_rate": 8.537871258406444e-06, + "loss": 0.0048, + "step": 385140 + }, + { + "epoch": 1.94, + "learning_rate": 8.530303565392434e-06, + "loss": 0.0049, + "step": 385150 + }, + { + "epoch": 1.94, + "learning_rate": 8.522735872378424e-06, + "loss": 0.0049, + "step": 385160 + }, + { + "epoch": 1.94, + "learning_rate": 8.515168179364414e-06, + "loss": 0.0073, + "step": 385170 + }, + { + "epoch": 1.94, + "learning_rate": 8.507600486350404e-06, + "loss": 0.0051, + "step": 385180 + }, + { + "epoch": 1.94, + "learning_rate": 8.500032793336394e-06, + "loss": 0.0057, + "step": 385190 + }, + { + "epoch": 1.94, + "learning_rate": 8.492465100322384e-06, + "loss": 0.0069, + "step": 385200 + }, + { + "epoch": 1.94, + "learning_rate": 8.484897407308374e-06, + "loss": 0.0054, + "step": 385210 + }, + { + "epoch": 1.94, + "learning_rate": 8.477329714294362e-06, + "loss": 0.007, + "step": 385220 + }, + { + "epoch": 1.94, + "learning_rate": 8.469762021280352e-06, + "loss": 0.0066, + "step": 385230 + }, + { + "epoch": 1.94, + "learning_rate": 8.462194328266342e-06, + "loss": 0.0054, + "step": 385240 + }, + { + "epoch": 1.94, + "learning_rate": 8.454626635252332e-06, + "loss": 0.0066, + "step": 385250 + }, + { + "epoch": 1.94, + "learning_rate": 8.44705894223832e-06, + "loss": 0.0072, + "step": 385260 + }, + { + "epoch": 1.94, + "learning_rate": 8.439491249224311e-06, + "loss": 0.0062, + "step": 385270 + }, + { + "epoch": 1.94, + "learning_rate": 8.431923556210301e-06, + "loss": 0.0062, + "step": 385280 + }, + { + "epoch": 1.94, + "learning_rate": 8.424355863196291e-06, + "loss": 0.0041, + "step": 385290 + }, + { + "epoch": 1.94, + "learning_rate": 8.41678817018228e-06, + "loss": 0.0063, + "step": 385300 + }, + { + "epoch": 1.94, + "learning_rate": 8.40922047716827e-06, + "loss": 0.0042, + "step": 385310 + }, + { + "epoch": 1.94, + "learning_rate": 8.40165278415426e-06, + "loss": 0.0039, + "step": 385320 + }, + { + "epoch": 1.94, + "learning_rate": 8.39408509114025e-06, + "loss": 0.0041, + "step": 385330 + }, + { + "epoch": 1.94, + "learning_rate": 8.386517398126237e-06, + "loss": 0.0061, + "step": 385340 + }, + { + "epoch": 1.94, + "learning_rate": 8.378949705112227e-06, + "loss": 0.0078, + "step": 385350 + }, + { + "epoch": 1.94, + "learning_rate": 8.371382012098217e-06, + "loss": 0.0052, + "step": 385360 + }, + { + "epoch": 1.94, + "learning_rate": 8.363814319084207e-06, + "loss": 0.0114, + "step": 385370 + }, + { + "epoch": 1.94, + "learning_rate": 8.356246626070197e-06, + "loss": 0.0044, + "step": 385380 + }, + { + "epoch": 1.94, + "learning_rate": 8.348678933056187e-06, + "loss": 0.0052, + "step": 385390 + }, + { + "epoch": 1.94, + "learning_rate": 8.341111240042177e-06, + "loss": 0.0046, + "step": 385400 + }, + { + "epoch": 1.94, + "learning_rate": 8.333543547028167e-06, + "loss": 0.0042, + "step": 385410 + }, + { + "epoch": 1.94, + "learning_rate": 8.325975854014155e-06, + "loss": 0.0053, + "step": 385420 + }, + { + "epoch": 1.94, + "learning_rate": 8.318408161000145e-06, + "loss": 0.0042, + "step": 385430 + }, + { + "epoch": 1.94, + "learning_rate": 8.310840467986135e-06, + "loss": 0.0059, + "step": 385440 + }, + { + "epoch": 1.94, + "learning_rate": 8.303272774972125e-06, + "loss": 0.0039, + "step": 385450 + }, + { + "epoch": 1.94, + "learning_rate": 8.295705081958115e-06, + "loss": 0.0059, + "step": 385460 + }, + { + "epoch": 1.94, + "learning_rate": 8.288137388944105e-06, + "loss": 0.0046, + "step": 385470 + }, + { + "epoch": 1.94, + "learning_rate": 8.280569695930095e-06, + "loss": 0.0064, + "step": 385480 + }, + { + "epoch": 1.94, + "learning_rate": 8.273002002916084e-06, + "loss": 0.0048, + "step": 385490 + }, + { + "epoch": 1.94, + "learning_rate": 8.265434309902073e-06, + "loss": 0.0052, + "step": 385500 + }, + { + "epoch": 1.94, + "learning_rate": 8.257866616888063e-06, + "loss": 0.0079, + "step": 385510 + }, + { + "epoch": 1.94, + "learning_rate": 8.250298923874052e-06, + "loss": 0.0059, + "step": 385520 + }, + { + "epoch": 1.95, + "learning_rate": 8.242731230860042e-06, + "loss": 0.0047, + "step": 385530 + }, + { + "epoch": 1.95, + "learning_rate": 8.235163537846032e-06, + "loss": 0.0067, + "step": 385540 + }, + { + "epoch": 1.95, + "learning_rate": 8.227595844832022e-06, + "loss": 0.0055, + "step": 385550 + }, + { + "epoch": 1.95, + "learning_rate": 8.220028151818012e-06, + "loss": 0.0094, + "step": 385560 + }, + { + "epoch": 1.95, + "learning_rate": 8.212460458804e-06, + "loss": 0.0041, + "step": 385570 + }, + { + "epoch": 1.95, + "learning_rate": 8.20489276578999e-06, + "loss": 0.006, + "step": 385580 + }, + { + "epoch": 1.95, + "learning_rate": 8.19732507277598e-06, + "loss": 0.0053, + "step": 385590 + }, + { + "epoch": 1.95, + "learning_rate": 8.18975737976197e-06, + "loss": 0.0062, + "step": 385600 + }, + { + "epoch": 1.95, + "learning_rate": 8.18218968674796e-06, + "loss": 0.0064, + "step": 385610 + }, + { + "epoch": 1.95, + "learning_rate": 8.17462199373395e-06, + "loss": 0.0062, + "step": 385620 + }, + { + "epoch": 1.95, + "learning_rate": 8.16705430071994e-06, + "loss": 0.0054, + "step": 385630 + }, + { + "epoch": 1.95, + "learning_rate": 8.15948660770593e-06, + "loss": 0.0053, + "step": 385640 + }, + { + "epoch": 1.95, + "learning_rate": 8.151918914691918e-06, + "loss": 0.0042, + "step": 385650 + }, + { + "epoch": 1.95, + "learning_rate": 8.144351221677908e-06, + "loss": 0.0062, + "step": 385660 + }, + { + "epoch": 1.95, + "learning_rate": 8.136783528663898e-06, + "loss": 0.0057, + "step": 385670 + }, + { + "epoch": 1.95, + "learning_rate": 8.129215835649888e-06, + "loss": 0.0061, + "step": 385680 + }, + { + "epoch": 1.95, + "learning_rate": 8.121648142635878e-06, + "loss": 0.0056, + "step": 385690 + }, + { + "epoch": 1.95, + "learning_rate": 8.114080449621868e-06, + "loss": 0.0077, + "step": 385700 + }, + { + "epoch": 1.95, + "learning_rate": 8.106512756607857e-06, + "loss": 0.0064, + "step": 385710 + }, + { + "epoch": 1.95, + "learning_rate": 8.098945063593847e-06, + "loss": 0.0086, + "step": 385720 + }, + { + "epoch": 1.95, + "learning_rate": 8.091377370579836e-06, + "loss": 0.0047, + "step": 385730 + }, + { + "epoch": 1.95, + "learning_rate": 8.083809677565825e-06, + "loss": 0.0047, + "step": 385740 + }, + { + "epoch": 1.95, + "learning_rate": 8.076241984551815e-06, + "loss": 0.005, + "step": 385750 + }, + { + "epoch": 1.95, + "learning_rate": 8.068674291537805e-06, + "loss": 0.0047, + "step": 385760 + }, + { + "epoch": 1.95, + "learning_rate": 8.061106598523794e-06, + "loss": 0.0064, + "step": 385770 + }, + { + "epoch": 1.95, + "learning_rate": 8.053538905509783e-06, + "loss": 0.0057, + "step": 385780 + }, + { + "epoch": 1.95, + "learning_rate": 8.045971212495773e-06, + "loss": 0.0045, + "step": 385790 + }, + { + "epoch": 1.95, + "learning_rate": 8.038403519481763e-06, + "loss": 0.0048, + "step": 385800 + }, + { + "epoch": 1.95, + "learning_rate": 8.030835826467753e-06, + "loss": 0.0065, + "step": 385810 + }, + { + "epoch": 1.95, + "learning_rate": 8.023268133453743e-06, + "loss": 0.0064, + "step": 385820 + }, + { + "epoch": 1.95, + "learning_rate": 8.015700440439733e-06, + "loss": 0.0065, + "step": 385830 + }, + { + "epoch": 1.95, + "learning_rate": 8.008132747425723e-06, + "loss": 0.0061, + "step": 385840 + }, + { + "epoch": 1.95, + "learning_rate": 8.000565054411711e-06, + "loss": 0.0058, + "step": 385850 + }, + { + "epoch": 1.95, + "learning_rate": 7.992997361397701e-06, + "loss": 0.0066, + "step": 385860 + }, + { + "epoch": 1.95, + "learning_rate": 7.985429668383691e-06, + "loss": 0.0061, + "step": 385870 + }, + { + "epoch": 1.95, + "learning_rate": 7.977861975369681e-06, + "loss": 0.0045, + "step": 385880 + }, + { + "epoch": 1.95, + "learning_rate": 7.97029428235567e-06, + "loss": 0.0059, + "step": 385890 + }, + { + "epoch": 1.95, + "learning_rate": 7.96272658934166e-06, + "loss": 0.0068, + "step": 385900 + }, + { + "epoch": 1.95, + "learning_rate": 7.95515889632765e-06, + "loss": 0.006, + "step": 385910 + }, + { + "epoch": 1.95, + "learning_rate": 7.94759120331364e-06, + "loss": 0.0061, + "step": 385920 + }, + { + "epoch": 1.95, + "learning_rate": 7.940023510299629e-06, + "loss": 0.0059, + "step": 385930 + }, + { + "epoch": 1.95, + "learning_rate": 7.932455817285619e-06, + "loss": 0.0046, + "step": 385940 + }, + { + "epoch": 1.95, + "learning_rate": 7.924888124271609e-06, + "loss": 0.0049, + "step": 385950 + }, + { + "epoch": 1.95, + "learning_rate": 7.917320431257598e-06, + "loss": 0.0063, + "step": 385960 + }, + { + "epoch": 1.95, + "learning_rate": 7.909752738243588e-06, + "loss": 0.0065, + "step": 385970 + }, + { + "epoch": 1.95, + "learning_rate": 7.902185045229578e-06, + "loss": 0.0048, + "step": 385980 + }, + { + "epoch": 1.95, + "learning_rate": 7.894617352215568e-06, + "loss": 0.0071, + "step": 385990 + }, + { + "epoch": 1.95, + "learning_rate": 7.887049659201558e-06, + "loss": 0.0072, + "step": 386000 + }, + { + "epoch": 1.95, + "eval_cer": 0.9144178545123905, + "eval_loss": 0.0041864411905407906, + "eval_runtime": 116.4755, + "eval_samples_per_second": 17.171, + "eval_steps_per_second": 4.293, + "step": 386000 + }, + { + "epoch": 1.95, + "learning_rate": 7.879481966187546e-06, + "loss": 0.006, + "step": 386010 + }, + { + "epoch": 1.95, + "learning_rate": 7.871914273173536e-06, + "loss": 0.0031, + "step": 386020 + }, + { + "epoch": 1.95, + "learning_rate": 7.864346580159526e-06, + "loss": 0.0065, + "step": 386030 + }, + { + "epoch": 1.95, + "learning_rate": 7.856778887145516e-06, + "loss": 0.0066, + "step": 386040 + }, + { + "epoch": 1.95, + "learning_rate": 7.849211194131506e-06, + "loss": 0.0056, + "step": 386050 + }, + { + "epoch": 1.95, + "learning_rate": 7.841643501117496e-06, + "loss": 0.0035, + "step": 386060 + }, + { + "epoch": 1.95, + "learning_rate": 7.834075808103486e-06, + "loss": 0.0078, + "step": 386070 + }, + { + "epoch": 1.95, + "learning_rate": 7.826508115089476e-06, + "loss": 0.0037, + "step": 386080 + }, + { + "epoch": 1.95, + "learning_rate": 7.818940422075464e-06, + "loss": 0.0078, + "step": 386090 + }, + { + "epoch": 1.95, + "learning_rate": 7.811372729061454e-06, + "loss": 0.0063, + "step": 386100 + }, + { + "epoch": 1.95, + "learning_rate": 7.803805036047444e-06, + "loss": 0.0043, + "step": 386110 + }, + { + "epoch": 1.95, + "learning_rate": 7.796237343033434e-06, + "loss": 0.0041, + "step": 386120 + }, + { + "epoch": 1.95, + "learning_rate": 7.788669650019424e-06, + "loss": 0.0053, + "step": 386130 + }, + { + "epoch": 1.95, + "learning_rate": 7.781101957005414e-06, + "loss": 0.0045, + "step": 386140 + }, + { + "epoch": 1.95, + "learning_rate": 7.773534263991403e-06, + "loss": 0.0076, + "step": 386150 + }, + { + "epoch": 1.95, + "learning_rate": 7.765966570977392e-06, + "loss": 0.0047, + "step": 386160 + }, + { + "epoch": 1.95, + "learning_rate": 7.758398877963382e-06, + "loss": 0.0044, + "step": 386170 + }, + { + "epoch": 1.95, + "learning_rate": 7.750831184949371e-06, + "loss": 0.0069, + "step": 386180 + }, + { + "epoch": 1.95, + "learning_rate": 7.743263491935361e-06, + "loss": 0.0048, + "step": 386190 + }, + { + "epoch": 1.95, + "learning_rate": 7.73569579892135e-06, + "loss": 0.0064, + "step": 386200 + }, + { + "epoch": 1.95, + "learning_rate": 7.72812810590734e-06, + "loss": 0.0078, + "step": 386210 + }, + { + "epoch": 1.95, + "learning_rate": 7.72056041289333e-06, + "loss": 0.0056, + "step": 386220 + }, + { + "epoch": 1.95, + "learning_rate": 7.71299271987932e-06, + "loss": 0.0061, + "step": 386230 + }, + { + "epoch": 1.95, + "learning_rate": 7.70542502686531e-06, + "loss": 0.0058, + "step": 386240 + }, + { + "epoch": 1.95, + "learning_rate": 7.6978573338513e-06, + "loss": 0.0057, + "step": 386250 + }, + { + "epoch": 1.95, + "learning_rate": 7.690289640837289e-06, + "loss": 0.0061, + "step": 386260 + }, + { + "epoch": 1.95, + "learning_rate": 7.682721947823279e-06, + "loss": 0.0064, + "step": 386270 + }, + { + "epoch": 1.95, + "learning_rate": 7.675154254809267e-06, + "loss": 0.0056, + "step": 386280 + }, + { + "epoch": 1.95, + "learning_rate": 7.667586561795257e-06, + "loss": 0.004, + "step": 386290 + }, + { + "epoch": 1.95, + "learning_rate": 7.660018868781247e-06, + "loss": 0.0053, + "step": 386300 + }, + { + "epoch": 1.95, + "learning_rate": 7.652451175767237e-06, + "loss": 0.0055, + "step": 386310 + }, + { + "epoch": 1.95, + "learning_rate": 7.644883482753227e-06, + "loss": 0.0043, + "step": 386320 + }, + { + "epoch": 1.95, + "learning_rate": 7.637315789739217e-06, + "loss": 0.0044, + "step": 386330 + }, + { + "epoch": 1.95, + "learning_rate": 7.629748096725207e-06, + "loss": 0.0053, + "step": 386340 + }, + { + "epoch": 1.95, + "learning_rate": 7.622180403711197e-06, + "loss": 0.0067, + "step": 386350 + }, + { + "epoch": 1.95, + "learning_rate": 7.614612710697186e-06, + "loss": 0.0038, + "step": 386360 + }, + { + "epoch": 1.95, + "learning_rate": 7.607045017683176e-06, + "loss": 0.0078, + "step": 386370 + }, + { + "epoch": 1.95, + "learning_rate": 7.5994773246691655e-06, + "loss": 0.0069, + "step": 386380 + }, + { + "epoch": 1.95, + "learning_rate": 7.591909631655155e-06, + "loss": 0.0039, + "step": 386390 + }, + { + "epoch": 1.95, + "learning_rate": 7.584341938641144e-06, + "loss": 0.0051, + "step": 386400 + }, + { + "epoch": 1.95, + "learning_rate": 7.5767742456271335e-06, + "loss": 0.0045, + "step": 386410 + }, + { + "epoch": 1.95, + "learning_rate": 7.569206552613124e-06, + "loss": 0.0058, + "step": 386420 + }, + { + "epoch": 1.95, + "learning_rate": 7.561638859599114e-06, + "loss": 0.0065, + "step": 386430 + }, + { + "epoch": 1.95, + "learning_rate": 7.5540711665851024e-06, + "loss": 0.0077, + "step": 386440 + }, + { + "epoch": 1.95, + "learning_rate": 7.546503473571092e-06, + "loss": 0.0068, + "step": 386450 + }, + { + "epoch": 1.95, + "learning_rate": 7.538935780557082e-06, + "loss": 0.007, + "step": 386460 + }, + { + "epoch": 1.95, + "learning_rate": 7.531368087543072e-06, + "loss": 0.0057, + "step": 386470 + }, + { + "epoch": 1.95, + "learning_rate": 7.523800394529061e-06, + "loss": 0.0055, + "step": 386480 + }, + { + "epoch": 1.95, + "learning_rate": 7.516232701515051e-06, + "loss": 0.0064, + "step": 386490 + }, + { + "epoch": 1.95, + "learning_rate": 7.508665008501041e-06, + "loss": 0.0051, + "step": 386500 + }, + { + "epoch": 1.95, + "learning_rate": 7.501097315487031e-06, + "loss": 0.0053, + "step": 386510 + }, + { + "epoch": 1.95, + "learning_rate": 7.49352962247302e-06, + "loss": 0.006, + "step": 386520 + }, + { + "epoch": 1.95, + "learning_rate": 7.48596192945901e-06, + "loss": 0.0047, + "step": 386530 + }, + { + "epoch": 1.95, + "learning_rate": 7.478394236445e-06, + "loss": 0.0046, + "step": 386540 + }, + { + "epoch": 1.95, + "learning_rate": 7.47082654343099e-06, + "loss": 0.0085, + "step": 386550 + }, + { + "epoch": 1.95, + "learning_rate": 7.463258850416979e-06, + "loss": 0.0081, + "step": 386560 + }, + { + "epoch": 1.95, + "learning_rate": 7.455691157402969e-06, + "loss": 0.0066, + "step": 386570 + }, + { + "epoch": 1.95, + "learning_rate": 7.448123464388959e-06, + "loss": 0.0055, + "step": 386580 + }, + { + "epoch": 1.95, + "learning_rate": 7.440555771374949e-06, + "loss": 0.0063, + "step": 386590 + }, + { + "epoch": 1.95, + "learning_rate": 7.432988078360938e-06, + "loss": 0.0069, + "step": 386600 + }, + { + "epoch": 1.95, + "learning_rate": 7.4254203853469276e-06, + "loss": 0.0048, + "step": 386610 + }, + { + "epoch": 1.95, + "learning_rate": 7.4178526923329175e-06, + "loss": 0.0061, + "step": 386620 + }, + { + "epoch": 1.95, + "learning_rate": 7.410284999318907e-06, + "loss": 0.006, + "step": 386630 + }, + { + "epoch": 1.95, + "learning_rate": 7.4027173063048965e-06, + "loss": 0.0071, + "step": 386640 + }, + { + "epoch": 1.95, + "learning_rate": 7.395149613290886e-06, + "loss": 0.0062, + "step": 386650 + }, + { + "epoch": 1.95, + "learning_rate": 7.387581920276876e-06, + "loss": 0.0053, + "step": 386660 + }, + { + "epoch": 1.95, + "learning_rate": 7.380014227262865e-06, + "loss": 0.0051, + "step": 386670 + }, + { + "epoch": 1.95, + "learning_rate": 7.372446534248855e-06, + "loss": 0.0045, + "step": 386680 + }, + { + "epoch": 1.95, + "learning_rate": 7.364878841234845e-06, + "loss": 0.0063, + "step": 386690 + }, + { + "epoch": 1.95, + "learning_rate": 7.357311148220835e-06, + "loss": 0.0064, + "step": 386700 + }, + { + "epoch": 1.95, + "learning_rate": 7.349743455206824e-06, + "loss": 0.0046, + "step": 386710 + }, + { + "epoch": 1.95, + "learning_rate": 7.342175762192814e-06, + "loss": 0.006, + "step": 386720 + }, + { + "epoch": 1.95, + "learning_rate": 7.334608069178804e-06, + "loss": 0.005, + "step": 386730 + }, + { + "epoch": 1.95, + "learning_rate": 7.327040376164794e-06, + "loss": 0.0049, + "step": 386740 + }, + { + "epoch": 1.95, + "learning_rate": 7.319472683150783e-06, + "loss": 0.0064, + "step": 386750 + }, + { + "epoch": 1.95, + "learning_rate": 7.311904990136773e-06, + "loss": 0.0085, + "step": 386760 + }, + { + "epoch": 1.95, + "learning_rate": 7.304337297122763e-06, + "loss": 0.0057, + "step": 386770 + }, + { + "epoch": 1.95, + "learning_rate": 7.296769604108753e-06, + "loss": 0.0048, + "step": 386780 + }, + { + "epoch": 1.95, + "learning_rate": 7.289201911094742e-06, + "loss": 0.007, + "step": 386790 + }, + { + "epoch": 1.95, + "learning_rate": 7.281634218080732e-06, + "loss": 0.005, + "step": 386800 + }, + { + "epoch": 1.95, + "learning_rate": 7.274066525066722e-06, + "loss": 0.0066, + "step": 386810 + }, + { + "epoch": 1.95, + "learning_rate": 7.2664988320527115e-06, + "loss": 0.0057, + "step": 386820 + }, + { + "epoch": 1.95, + "learning_rate": 7.2589311390387e-06, + "loss": 0.0047, + "step": 386830 + }, + { + "epoch": 1.95, + "learning_rate": 7.2513634460246905e-06, + "loss": 0.0047, + "step": 386840 + }, + { + "epoch": 1.95, + "learning_rate": 7.24379575301068e-06, + "loss": 0.0058, + "step": 386850 + }, + { + "epoch": 1.95, + "learning_rate": 7.23622805999667e-06, + "loss": 0.0035, + "step": 386860 + }, + { + "epoch": 1.95, + "learning_rate": 7.2286603669826585e-06, + "loss": 0.0056, + "step": 386870 + }, + { + "epoch": 1.95, + "learning_rate": 7.2210926739686484e-06, + "loss": 0.0049, + "step": 386880 + }, + { + "epoch": 1.95, + "learning_rate": 7.213524980954638e-06, + "loss": 0.0056, + "step": 386890 + }, + { + "epoch": 1.95, + "learning_rate": 7.205957287940628e-06, + "loss": 0.0032, + "step": 386900 + }, + { + "epoch": 1.95, + "learning_rate": 7.198389594926617e-06, + "loss": 0.0052, + "step": 386910 + }, + { + "epoch": 1.95, + "learning_rate": 7.190821901912607e-06, + "loss": 0.0089, + "step": 386920 + }, + { + "epoch": 1.95, + "learning_rate": 7.183254208898597e-06, + "loss": 0.0062, + "step": 386930 + }, + { + "epoch": 1.95, + "learning_rate": 7.175686515884587e-06, + "loss": 0.0066, + "step": 386940 + }, + { + "epoch": 1.95, + "learning_rate": 7.168118822870576e-06, + "loss": 0.0051, + "step": 386950 + }, + { + "epoch": 1.95, + "learning_rate": 7.160551129856566e-06, + "loss": 0.0056, + "step": 386960 + }, + { + "epoch": 1.95, + "learning_rate": 7.152983436842556e-06, + "loss": 0.0069, + "step": 386970 + }, + { + "epoch": 1.95, + "learning_rate": 7.145415743828546e-06, + "loss": 0.0072, + "step": 386980 + }, + { + "epoch": 1.95, + "learning_rate": 7.137848050814535e-06, + "loss": 0.0047, + "step": 386990 + }, + { + "epoch": 1.95, + "learning_rate": 7.130280357800525e-06, + "loss": 0.0078, + "step": 387000 + }, + { + "epoch": 1.95, + "eval_cer": 0.9144052393627603, + "eval_loss": 0.004187974147498608, + "eval_runtime": 116.3794, + "eval_samples_per_second": 17.185, + "eval_steps_per_second": 4.296, + "step": 387000 + }, + { + "epoch": 1.95, + "learning_rate": 7.122712664786515e-06, + "loss": 0.0064, + "step": 387010 + }, + { + "epoch": 1.95, + "learning_rate": 7.115144971772505e-06, + "loss": 0.009, + "step": 387020 + }, + { + "epoch": 1.95, + "learning_rate": 7.107577278758494e-06, + "loss": 0.0104, + "step": 387030 + }, + { + "epoch": 1.95, + "learning_rate": 7.100009585744484e-06, + "loss": 0.0053, + "step": 387040 + }, + { + "epoch": 1.95, + "learning_rate": 7.0924418927304736e-06, + "loss": 0.005, + "step": 387050 + }, + { + "epoch": 1.95, + "learning_rate": 7.0848741997164635e-06, + "loss": 0.0054, + "step": 387060 + }, + { + "epoch": 1.95, + "learning_rate": 7.0773065067024526e-06, + "loss": 0.0062, + "step": 387070 + }, + { + "epoch": 1.95, + "learning_rate": 7.0697388136884425e-06, + "loss": 0.0057, + "step": 387080 + }, + { + "epoch": 1.95, + "learning_rate": 7.062171120674432e-06, + "loss": 0.0062, + "step": 387090 + }, + { + "epoch": 1.95, + "learning_rate": 7.054603427660422e-06, + "loss": 0.0059, + "step": 387100 + }, + { + "epoch": 1.95, + "learning_rate": 7.047035734646411e-06, + "loss": 0.0053, + "step": 387110 + }, + { + "epoch": 1.95, + "learning_rate": 7.039468041632401e-06, + "loss": 0.0077, + "step": 387120 + }, + { + "epoch": 1.95, + "learning_rate": 7.031900348618391e-06, + "loss": 0.0051, + "step": 387130 + }, + { + "epoch": 1.95, + "learning_rate": 7.024332655604381e-06, + "loss": 0.005, + "step": 387140 + }, + { + "epoch": 1.95, + "learning_rate": 7.01676496259037e-06, + "loss": 0.0045, + "step": 387150 + }, + { + "epoch": 1.95, + "learning_rate": 7.00919726957636e-06, + "loss": 0.0102, + "step": 387160 + }, + { + "epoch": 1.95, + "learning_rate": 7.00162957656235e-06, + "loss": 0.0043, + "step": 387170 + }, + { + "epoch": 1.95, + "learning_rate": 6.994061883548339e-06, + "loss": 0.0058, + "step": 387180 + }, + { + "epoch": 1.95, + "learning_rate": 6.986494190534329e-06, + "loss": 0.0056, + "step": 387190 + }, + { + "epoch": 1.95, + "learning_rate": 6.978926497520319e-06, + "loss": 0.007, + "step": 387200 + }, + { + "epoch": 1.95, + "learning_rate": 6.971358804506309e-06, + "loss": 0.0069, + "step": 387210 + }, + { + "epoch": 1.95, + "learning_rate": 6.963791111492298e-06, + "loss": 0.0061, + "step": 387220 + }, + { + "epoch": 1.95, + "learning_rate": 6.956223418478288e-06, + "loss": 0.0051, + "step": 387230 + }, + { + "epoch": 1.95, + "learning_rate": 6.948655725464278e-06, + "loss": 0.0054, + "step": 387240 + }, + { + "epoch": 1.95, + "learning_rate": 6.941088032450268e-06, + "loss": 0.0044, + "step": 387250 + }, + { + "epoch": 1.95, + "learning_rate": 6.933520339436256e-06, + "loss": 0.0064, + "step": 387260 + }, + { + "epoch": 1.95, + "learning_rate": 6.9259526464222466e-06, + "loss": 0.008, + "step": 387270 + }, + { + "epoch": 1.95, + "learning_rate": 6.9183849534082365e-06, + "loss": 0.0053, + "step": 387280 + }, + { + "epoch": 1.95, + "learning_rate": 6.910817260394226e-06, + "loss": 0.0046, + "step": 387290 + }, + { + "epoch": 1.95, + "learning_rate": 6.903249567380215e-06, + "loss": 0.0086, + "step": 387300 + }, + { + "epoch": 1.95, + "learning_rate": 6.8956818743662045e-06, + "loss": 0.0052, + "step": 387310 + }, + { + "epoch": 1.95, + "learning_rate": 6.8881141813521944e-06, + "loss": 0.0047, + "step": 387320 + }, + { + "epoch": 1.95, + "learning_rate": 6.880546488338185e-06, + "loss": 0.0064, + "step": 387330 + }, + { + "epoch": 1.95, + "learning_rate": 6.872978795324173e-06, + "loss": 0.0135, + "step": 387340 + }, + { + "epoch": 1.95, + "learning_rate": 6.865411102310163e-06, + "loss": 0.0059, + "step": 387350 + }, + { + "epoch": 1.95, + "learning_rate": 6.857843409296153e-06, + "loss": 0.0055, + "step": 387360 + }, + { + "epoch": 1.95, + "learning_rate": 6.850275716282143e-06, + "loss": 0.0048, + "step": 387370 + }, + { + "epoch": 1.95, + "learning_rate": 6.842708023268132e-06, + "loss": 0.0052, + "step": 387380 + }, + { + "epoch": 1.95, + "learning_rate": 6.835140330254122e-06, + "loss": 0.0053, + "step": 387390 + }, + { + "epoch": 1.95, + "learning_rate": 6.827572637240112e-06, + "loss": 0.0065, + "step": 387400 + }, + { + "epoch": 1.95, + "learning_rate": 6.820004944226102e-06, + "loss": 0.0057, + "step": 387410 + }, + { + "epoch": 1.95, + "learning_rate": 6.812437251212091e-06, + "loss": 0.0046, + "step": 387420 + }, + { + "epoch": 1.95, + "learning_rate": 6.804869558198081e-06, + "loss": 0.0048, + "step": 387430 + }, + { + "epoch": 1.95, + "learning_rate": 6.797301865184071e-06, + "loss": 0.007, + "step": 387440 + }, + { + "epoch": 1.95, + "learning_rate": 6.789734172170061e-06, + "loss": 0.0045, + "step": 387450 + }, + { + "epoch": 1.95, + "learning_rate": 6.78216647915605e-06, + "loss": 0.0055, + "step": 387460 + }, + { + "epoch": 1.95, + "learning_rate": 6.77459878614204e-06, + "loss": 0.0051, + "step": 387470 + }, + { + "epoch": 1.95, + "learning_rate": 6.76703109312803e-06, + "loss": 0.0065, + "step": 387480 + }, + { + "epoch": 1.95, + "learning_rate": 6.7594634001140196e-06, + "loss": 0.0063, + "step": 387490 + }, + { + "epoch": 1.95, + "learning_rate": 6.751895707100009e-06, + "loss": 0.0068, + "step": 387500 + }, + { + "epoch": 1.96, + "learning_rate": 6.7443280140859986e-06, + "loss": 0.0063, + "step": 387510 + }, + { + "epoch": 1.96, + "learning_rate": 6.7367603210719885e-06, + "loss": 0.0071, + "step": 387520 + }, + { + "epoch": 1.96, + "learning_rate": 6.729192628057978e-06, + "loss": 0.0046, + "step": 387530 + }, + { + "epoch": 1.96, + "learning_rate": 6.7216249350439674e-06, + "loss": 0.0058, + "step": 387540 + }, + { + "epoch": 1.96, + "learning_rate": 6.714057242029957e-06, + "loss": 0.0061, + "step": 387550 + }, + { + "epoch": 1.96, + "learning_rate": 6.706489549015947e-06, + "loss": 0.0057, + "step": 387560 + }, + { + "epoch": 1.96, + "learning_rate": 6.698921856001937e-06, + "loss": 0.0054, + "step": 387570 + }, + { + "epoch": 1.96, + "learning_rate": 6.691354162987926e-06, + "loss": 0.0098, + "step": 387580 + }, + { + "epoch": 1.96, + "learning_rate": 6.683786469973916e-06, + "loss": 0.0052, + "step": 387590 + }, + { + "epoch": 1.96, + "learning_rate": 6.676218776959906e-06, + "loss": 0.0053, + "step": 387600 + }, + { + "epoch": 1.96, + "learning_rate": 6.668651083945896e-06, + "loss": 0.005, + "step": 387610 + }, + { + "epoch": 1.96, + "learning_rate": 6.661083390931885e-06, + "loss": 0.006, + "step": 387620 + }, + { + "epoch": 1.96, + "learning_rate": 6.653515697917875e-06, + "loss": 0.0075, + "step": 387630 + }, + { + "epoch": 1.96, + "learning_rate": 6.645948004903865e-06, + "loss": 0.0061, + "step": 387640 + }, + { + "epoch": 1.96, + "learning_rate": 6.638380311889855e-06, + "loss": 0.006, + "step": 387650 + }, + { + "epoch": 1.96, + "learning_rate": 6.630812618875844e-06, + "loss": 0.0057, + "step": 387660 + }, + { + "epoch": 1.96, + "learning_rate": 6.623244925861834e-06, + "loss": 0.0054, + "step": 387670 + }, + { + "epoch": 1.96, + "learning_rate": 6.615677232847824e-06, + "loss": 0.0065, + "step": 387680 + }, + { + "epoch": 1.96, + "learning_rate": 6.608109539833814e-06, + "loss": 0.0045, + "step": 387690 + }, + { + "epoch": 1.96, + "learning_rate": 6.600541846819803e-06, + "loss": 0.0087, + "step": 387700 + }, + { + "epoch": 1.96, + "learning_rate": 6.5929741538057926e-06, + "loss": 0.0064, + "step": 387710 + }, + { + "epoch": 1.96, + "learning_rate": 6.5854064607917825e-06, + "loss": 0.0054, + "step": 387720 + }, + { + "epoch": 1.96, + "learning_rate": 6.577838767777771e-06, + "loss": 0.005, + "step": 387730 + }, + { + "epoch": 1.96, + "learning_rate": 6.570271074763761e-06, + "loss": 0.0056, + "step": 387740 + }, + { + "epoch": 1.96, + "learning_rate": 6.562703381749751e-06, + "loss": 0.0062, + "step": 387750 + }, + { + "epoch": 1.96, + "learning_rate": 6.555135688735741e-06, + "loss": 0.0042, + "step": 387760 + }, + { + "epoch": 1.96, + "learning_rate": 6.5475679957217295e-06, + "loss": 0.0063, + "step": 387770 + }, + { + "epoch": 1.96, + "learning_rate": 6.540000302707719e-06, + "loss": 0.0058, + "step": 387780 + }, + { + "epoch": 1.96, + "learning_rate": 6.532432609693709e-06, + "loss": 0.0052, + "step": 387790 + }, + { + "epoch": 1.96, + "learning_rate": 6.524864916679699e-06, + "loss": 0.0052, + "step": 387800 + }, + { + "epoch": 1.96, + "learning_rate": 6.517297223665688e-06, + "loss": 0.0064, + "step": 387810 + }, + { + "epoch": 1.96, + "learning_rate": 6.509729530651678e-06, + "loss": 0.0049, + "step": 387820 + }, + { + "epoch": 1.96, + "learning_rate": 6.502161837637668e-06, + "loss": 0.0046, + "step": 387830 + }, + { + "epoch": 1.96, + "learning_rate": 6.494594144623658e-06, + "loss": 0.0063, + "step": 387840 + }, + { + "epoch": 1.96, + "learning_rate": 6.487026451609647e-06, + "loss": 0.0056, + "step": 387850 + }, + { + "epoch": 1.96, + "learning_rate": 6.479458758595637e-06, + "loss": 0.0058, + "step": 387860 + }, + { + "epoch": 1.96, + "learning_rate": 6.471891065581627e-06, + "loss": 0.0054, + "step": 387870 + }, + { + "epoch": 1.96, + "learning_rate": 6.464323372567617e-06, + "loss": 0.0052, + "step": 387880 + }, + { + "epoch": 1.96, + "learning_rate": 6.456755679553606e-06, + "loss": 0.0037, + "step": 387890 + }, + { + "epoch": 1.96, + "learning_rate": 6.449187986539596e-06, + "loss": 0.0057, + "step": 387900 + }, + { + "epoch": 1.96, + "learning_rate": 6.441620293525586e-06, + "loss": 0.0055, + "step": 387910 + }, + { + "epoch": 1.96, + "learning_rate": 6.434052600511576e-06, + "loss": 0.0061, + "step": 387920 + }, + { + "epoch": 1.96, + "learning_rate": 6.426484907497565e-06, + "loss": 0.0045, + "step": 387930 + }, + { + "epoch": 1.96, + "learning_rate": 6.418917214483555e-06, + "loss": 0.0056, + "step": 387940 + }, + { + "epoch": 1.96, + "learning_rate": 6.4113495214695446e-06, + "loss": 0.0064, + "step": 387950 + }, + { + "epoch": 1.96, + "learning_rate": 6.4037818284555345e-06, + "loss": 0.007, + "step": 387960 + }, + { + "epoch": 1.96, + "learning_rate": 6.3962141354415235e-06, + "loss": 0.0054, + "step": 387970 + }, + { + "epoch": 1.96, + "learning_rate": 6.3886464424275134e-06, + "loss": 0.0063, + "step": 387980 + }, + { + "epoch": 1.96, + "learning_rate": 6.381078749413503e-06, + "loss": 0.0051, + "step": 387990 + }, + { + "epoch": 1.96, + "learning_rate": 6.373511056399493e-06, + "loss": 0.0051, + "step": 388000 + }, + { + "epoch": 1.96, + "eval_cer": 0.9144062097588856, + "eval_loss": 0.004157001152634621, + "eval_runtime": 116.3242, + "eval_samples_per_second": 17.193, + "eval_steps_per_second": 4.298, + "step": 388000 + }, + { + "epoch": 1.96, + "learning_rate": 6.365943363385482e-06, + "loss": 0.0045, + "step": 388010 + }, + { + "epoch": 1.96, + "learning_rate": 6.358375670371472e-06, + "loss": 0.0044, + "step": 388020 + }, + { + "epoch": 1.96, + "learning_rate": 6.350807977357462e-06, + "loss": 0.0038, + "step": 388030 + }, + { + "epoch": 1.96, + "learning_rate": 6.343240284343452e-06, + "loss": 0.0045, + "step": 388040 + }, + { + "epoch": 1.96, + "learning_rate": 6.335672591329441e-06, + "loss": 0.0068, + "step": 388050 + }, + { + "epoch": 1.96, + "learning_rate": 6.328104898315431e-06, + "loss": 0.0055, + "step": 388060 + }, + { + "epoch": 1.96, + "learning_rate": 6.320537205301421e-06, + "loss": 0.0046, + "step": 388070 + }, + { + "epoch": 1.96, + "learning_rate": 6.312969512287411e-06, + "loss": 0.0059, + "step": 388080 + }, + { + "epoch": 1.96, + "learning_rate": 6.3054018192734e-06, + "loss": 0.0055, + "step": 388090 + }, + { + "epoch": 1.96, + "learning_rate": 6.29783412625939e-06, + "loss": 0.0043, + "step": 388100 + }, + { + "epoch": 1.96, + "learning_rate": 6.29026643324538e-06, + "loss": 0.0087, + "step": 388110 + }, + { + "epoch": 1.96, + "learning_rate": 6.28269874023137e-06, + "loss": 0.0042, + "step": 388120 + }, + { + "epoch": 1.96, + "learning_rate": 6.275131047217359e-06, + "loss": 0.0067, + "step": 388130 + }, + { + "epoch": 1.96, + "learning_rate": 6.267563354203349e-06, + "loss": 0.0049, + "step": 388140 + }, + { + "epoch": 1.96, + "learning_rate": 6.2599956611893386e-06, + "loss": 0.0064, + "step": 388150 + }, + { + "epoch": 1.96, + "learning_rate": 6.2524279681753285e-06, + "loss": 0.0044, + "step": 388160 + }, + { + "epoch": 1.96, + "learning_rate": 6.2448602751613176e-06, + "loss": 0.0061, + "step": 388170 + }, + { + "epoch": 1.96, + "learning_rate": 6.2372925821473075e-06, + "loss": 0.0056, + "step": 388180 + }, + { + "epoch": 1.96, + "learning_rate": 6.229724889133297e-06, + "loss": 0.0066, + "step": 388190 + }, + { + "epoch": 1.96, + "learning_rate": 6.222157196119287e-06, + "loss": 0.0063, + "step": 388200 + }, + { + "epoch": 1.96, + "learning_rate": 6.2145895031052755e-06, + "loss": 0.0067, + "step": 388210 + }, + { + "epoch": 1.96, + "learning_rate": 6.207021810091265e-06, + "loss": 0.0051, + "step": 388220 + }, + { + "epoch": 1.96, + "learning_rate": 6.199454117077255e-06, + "loss": 0.0056, + "step": 388230 + }, + { + "epoch": 1.96, + "learning_rate": 6.191886424063246e-06, + "loss": 0.0041, + "step": 388240 + }, + { + "epoch": 1.96, + "learning_rate": 6.184318731049234e-06, + "loss": 0.0064, + "step": 388250 + }, + { + "epoch": 1.96, + "learning_rate": 6.176751038035224e-06, + "loss": 0.0047, + "step": 388260 + }, + { + "epoch": 1.96, + "learning_rate": 6.169183345021214e-06, + "loss": 0.0041, + "step": 388270 + }, + { + "epoch": 1.96, + "learning_rate": 6.161615652007203e-06, + "loss": 0.0046, + "step": 388280 + }, + { + "epoch": 1.96, + "learning_rate": 6.154047958993193e-06, + "loss": 0.006, + "step": 388290 + }, + { + "epoch": 1.96, + "learning_rate": 6.146480265979183e-06, + "loss": 0.0046, + "step": 388300 + }, + { + "epoch": 1.96, + "learning_rate": 6.138912572965173e-06, + "loss": 0.0055, + "step": 388310 + }, + { + "epoch": 1.96, + "learning_rate": 6.131344879951162e-06, + "loss": 0.0048, + "step": 388320 + }, + { + "epoch": 1.96, + "learning_rate": 6.123777186937152e-06, + "loss": 0.0052, + "step": 388330 + }, + { + "epoch": 1.96, + "learning_rate": 6.116209493923142e-06, + "loss": 0.0073, + "step": 388340 + }, + { + "epoch": 1.96, + "learning_rate": 6.108641800909132e-06, + "loss": 0.0053, + "step": 388350 + }, + { + "epoch": 1.96, + "learning_rate": 6.101074107895121e-06, + "loss": 0.0083, + "step": 388360 + }, + { + "epoch": 1.96, + "learning_rate": 6.093506414881111e-06, + "loss": 0.0052, + "step": 388370 + }, + { + "epoch": 1.96, + "learning_rate": 6.085938721867101e-06, + "loss": 0.006, + "step": 388380 + }, + { + "epoch": 1.96, + "learning_rate": 6.0783710288530906e-06, + "loss": 0.006, + "step": 388390 + }, + { + "epoch": 1.96, + "learning_rate": 6.07080333583908e-06, + "loss": 0.0056, + "step": 388400 + }, + { + "epoch": 1.96, + "learning_rate": 6.0632356428250695e-06, + "loss": 0.0059, + "step": 388410 + }, + { + "epoch": 1.96, + "learning_rate": 6.0556679498110594e-06, + "loss": 0.0063, + "step": 388420 + }, + { + "epoch": 1.96, + "learning_rate": 6.048100256797049e-06, + "loss": 0.0048, + "step": 388430 + }, + { + "epoch": 1.96, + "learning_rate": 6.040532563783038e-06, + "loss": 0.0043, + "step": 388440 + }, + { + "epoch": 1.96, + "learning_rate": 6.032964870769028e-06, + "loss": 0.0055, + "step": 388450 + }, + { + "epoch": 1.96, + "learning_rate": 6.025397177755018e-06, + "loss": 0.005, + "step": 388460 + }, + { + "epoch": 1.96, + "learning_rate": 6.017829484741008e-06, + "loss": 0.0081, + "step": 388470 + }, + { + "epoch": 1.96, + "learning_rate": 6.010261791726997e-06, + "loss": 0.0058, + "step": 388480 + }, + { + "epoch": 1.96, + "learning_rate": 6.002694098712987e-06, + "loss": 0.005, + "step": 388490 + }, + { + "epoch": 1.96, + "learning_rate": 5.995126405698977e-06, + "loss": 0.0051, + "step": 388500 + }, + { + "epoch": 1.96, + "learning_rate": 5.987558712684967e-06, + "loss": 0.0041, + "step": 388510 + }, + { + "epoch": 1.96, + "learning_rate": 5.979991019670956e-06, + "loss": 0.0066, + "step": 388520 + }, + { + "epoch": 1.96, + "learning_rate": 5.972423326656946e-06, + "loss": 0.0069, + "step": 388530 + }, + { + "epoch": 1.96, + "learning_rate": 5.964855633642936e-06, + "loss": 0.0059, + "step": 388540 + }, + { + "epoch": 1.96, + "learning_rate": 5.957287940628926e-06, + "loss": 0.0057, + "step": 388550 + }, + { + "epoch": 1.96, + "learning_rate": 5.949720247614915e-06, + "loss": 0.0051, + "step": 388560 + }, + { + "epoch": 1.96, + "learning_rate": 5.942152554600905e-06, + "loss": 0.0074, + "step": 388570 + }, + { + "epoch": 1.96, + "learning_rate": 5.934584861586895e-06, + "loss": 0.006, + "step": 388580 + }, + { + "epoch": 1.96, + "learning_rate": 5.9270171685728846e-06, + "loss": 0.0054, + "step": 388590 + }, + { + "epoch": 1.96, + "learning_rate": 5.919449475558874e-06, + "loss": 0.0057, + "step": 388600 + }, + { + "epoch": 1.96, + "learning_rate": 5.9118817825448636e-06, + "loss": 0.006, + "step": 388610 + }, + { + "epoch": 1.96, + "learning_rate": 5.9043140895308535e-06, + "loss": 0.0064, + "step": 388620 + }, + { + "epoch": 1.96, + "learning_rate": 5.896746396516843e-06, + "loss": 0.005, + "step": 388630 + }, + { + "epoch": 1.96, + "learning_rate": 5.889178703502832e-06, + "loss": 0.0055, + "step": 388640 + }, + { + "epoch": 1.96, + "learning_rate": 5.8816110104888215e-06, + "loss": 0.0056, + "step": 388650 + }, + { + "epoch": 1.96, + "learning_rate": 5.874043317474812e-06, + "loss": 0.005, + "step": 388660 + }, + { + "epoch": 1.96, + "learning_rate": 5.866475624460802e-06, + "loss": 0.0056, + "step": 388670 + }, + { + "epoch": 1.96, + "learning_rate": 5.85890793144679e-06, + "loss": 0.0049, + "step": 388680 + }, + { + "epoch": 1.96, + "learning_rate": 5.85134023843278e-06, + "loss": 0.0056, + "step": 388690 + }, + { + "epoch": 1.96, + "learning_rate": 5.84377254541877e-06, + "loss": 0.0057, + "step": 388700 + }, + { + "epoch": 1.96, + "learning_rate": 5.83620485240476e-06, + "loss": 0.0063, + "step": 388710 + }, + { + "epoch": 1.96, + "learning_rate": 5.828637159390749e-06, + "loss": 0.0065, + "step": 388720 + }, + { + "epoch": 1.96, + "learning_rate": 5.821069466376739e-06, + "loss": 0.0069, + "step": 388730 + }, + { + "epoch": 1.96, + "learning_rate": 5.813501773362729e-06, + "loss": 0.0043, + "step": 388740 + }, + { + "epoch": 1.96, + "learning_rate": 5.805934080348719e-06, + "loss": 0.0052, + "step": 388750 + }, + { + "epoch": 1.96, + "learning_rate": 5.798366387334708e-06, + "loss": 0.0057, + "step": 388760 + }, + { + "epoch": 1.96, + "learning_rate": 5.790798694320698e-06, + "loss": 0.005, + "step": 388770 + }, + { + "epoch": 1.96, + "learning_rate": 5.783231001306688e-06, + "loss": 0.0072, + "step": 388780 + }, + { + "epoch": 1.96, + "learning_rate": 5.775663308292678e-06, + "loss": 0.0047, + "step": 388790 + }, + { + "epoch": 1.96, + "learning_rate": 5.768095615278667e-06, + "loss": 0.0054, + "step": 388800 + }, + { + "epoch": 1.96, + "learning_rate": 5.760527922264657e-06, + "loss": 0.0054, + "step": 388810 + }, + { + "epoch": 1.96, + "learning_rate": 5.752960229250647e-06, + "loss": 0.0069, + "step": 388820 + }, + { + "epoch": 1.96, + "learning_rate": 5.745392536236636e-06, + "loss": 0.0042, + "step": 388830 + }, + { + "epoch": 1.96, + "learning_rate": 5.737824843222626e-06, + "loss": 0.0058, + "step": 388840 + }, + { + "epoch": 1.96, + "learning_rate": 5.7302571502086155e-06, + "loss": 0.0049, + "step": 388850 + }, + { + "epoch": 1.96, + "learning_rate": 5.7226894571946054e-06, + "loss": 0.0053, + "step": 388860 + }, + { + "epoch": 1.96, + "learning_rate": 5.7151217641805945e-06, + "loss": 0.006, + "step": 388870 + }, + { + "epoch": 1.96, + "learning_rate": 5.7075540711665844e-06, + "loss": 0.0043, + "step": 388880 + }, + { + "epoch": 1.96, + "learning_rate": 5.699986378152574e-06, + "loss": 0.007, + "step": 388890 + }, + { + "epoch": 1.96, + "learning_rate": 5.692418685138564e-06, + "loss": 0.0046, + "step": 388900 + }, + { + "epoch": 1.96, + "learning_rate": 5.684850992124553e-06, + "loss": 0.0047, + "step": 388910 + }, + { + "epoch": 1.96, + "learning_rate": 5.677283299110543e-06, + "loss": 0.0061, + "step": 388920 + }, + { + "epoch": 1.96, + "learning_rate": 5.669715606096533e-06, + "loss": 0.0048, + "step": 388930 + }, + { + "epoch": 1.96, + "learning_rate": 5.662147913082523e-06, + "loss": 0.0055, + "step": 388940 + }, + { + "epoch": 1.96, + "learning_rate": 5.654580220068512e-06, + "loss": 0.0066, + "step": 388950 + }, + { + "epoch": 1.96, + "learning_rate": 5.647012527054502e-06, + "loss": 0.0067, + "step": 388960 + }, + { + "epoch": 1.96, + "learning_rate": 5.639444834040492e-06, + "loss": 0.0048, + "step": 388970 + }, + { + "epoch": 1.96, + "learning_rate": 5.631877141026482e-06, + "loss": 0.0047, + "step": 388980 + }, + { + "epoch": 1.96, + "learning_rate": 5.624309448012471e-06, + "loss": 0.0049, + "step": 388990 + }, + { + "epoch": 1.96, + "learning_rate": 5.616741754998461e-06, + "loss": 0.0048, + "step": 389000 + }, + { + "epoch": 1.96, + "eval_cer": 0.9143994169860079, + "eval_loss": 0.004172166809439659, + "eval_runtime": 116.4331, + "eval_samples_per_second": 17.177, + "eval_steps_per_second": 4.294, + "step": 389000 + }, + { + "epoch": 1.96, + "learning_rate": 5.609174061984451e-06, + "loss": 0.0074, + "step": 389010 + }, + { + "epoch": 1.96, + "learning_rate": 5.601606368970441e-06, + "loss": 0.009, + "step": 389020 + }, + { + "epoch": 1.96, + "learning_rate": 5.59403867595643e-06, + "loss": 0.0077, + "step": 389030 + }, + { + "epoch": 1.96, + "learning_rate": 5.58647098294242e-06, + "loss": 0.0045, + "step": 389040 + }, + { + "epoch": 1.96, + "learning_rate": 5.5789032899284096e-06, + "loss": 0.0046, + "step": 389050 + }, + { + "epoch": 1.96, + "learning_rate": 5.5713355969143995e-06, + "loss": 0.0067, + "step": 389060 + }, + { + "epoch": 1.96, + "learning_rate": 5.563767903900388e-06, + "loss": 0.0034, + "step": 389070 + }, + { + "epoch": 1.96, + "learning_rate": 5.5562002108863784e-06, + "loss": 0.0074, + "step": 389080 + }, + { + "epoch": 1.96, + "learning_rate": 5.548632517872368e-06, + "loss": 0.0076, + "step": 389090 + }, + { + "epoch": 1.96, + "learning_rate": 5.541064824858358e-06, + "loss": 0.0057, + "step": 389100 + }, + { + "epoch": 1.96, + "learning_rate": 5.5334971318443465e-06, + "loss": 0.0057, + "step": 389110 + }, + { + "epoch": 1.96, + "learning_rate": 5.525929438830336e-06, + "loss": 0.0073, + "step": 389120 + }, + { + "epoch": 1.96, + "learning_rate": 5.518361745816326e-06, + "loss": 0.0064, + "step": 389130 + }, + { + "epoch": 1.96, + "learning_rate": 5.510794052802317e-06, + "loss": 0.0055, + "step": 389140 + }, + { + "epoch": 1.96, + "learning_rate": 5.503226359788305e-06, + "loss": 0.0052, + "step": 389150 + }, + { + "epoch": 1.96, + "learning_rate": 5.495658666774295e-06, + "loss": 0.0055, + "step": 389160 + }, + { + "epoch": 1.96, + "learning_rate": 5.488090973760285e-06, + "loss": 0.0061, + "step": 389170 + }, + { + "epoch": 1.96, + "learning_rate": 5.480523280746275e-06, + "loss": 0.0041, + "step": 389180 + }, + { + "epoch": 1.96, + "learning_rate": 5.472955587732264e-06, + "loss": 0.0062, + "step": 389190 + }, + { + "epoch": 1.96, + "learning_rate": 5.465387894718254e-06, + "loss": 0.0064, + "step": 389200 + }, + { + "epoch": 1.96, + "learning_rate": 5.457820201704244e-06, + "loss": 0.006, + "step": 389210 + }, + { + "epoch": 1.96, + "learning_rate": 5.450252508690234e-06, + "loss": 0.0065, + "step": 389220 + }, + { + "epoch": 1.96, + "learning_rate": 5.442684815676223e-06, + "loss": 0.0058, + "step": 389230 + }, + { + "epoch": 1.96, + "learning_rate": 5.435117122662213e-06, + "loss": 0.0061, + "step": 389240 + }, + { + "epoch": 1.96, + "learning_rate": 5.427549429648203e-06, + "loss": 0.0042, + "step": 389250 + }, + { + "epoch": 1.96, + "learning_rate": 5.419981736634193e-06, + "loss": 0.0056, + "step": 389260 + }, + { + "epoch": 1.96, + "learning_rate": 5.412414043620182e-06, + "loss": 0.0052, + "step": 389270 + }, + { + "epoch": 1.96, + "learning_rate": 5.404846350606172e-06, + "loss": 0.0053, + "step": 389280 + }, + { + "epoch": 1.96, + "learning_rate": 5.3972786575921615e-06, + "loss": 0.0048, + "step": 389290 + }, + { + "epoch": 1.96, + "learning_rate": 5.3897109645781514e-06, + "loss": 0.006, + "step": 389300 + }, + { + "epoch": 1.96, + "learning_rate": 5.3821432715641405e-06, + "loss": 0.0043, + "step": 389310 + }, + { + "epoch": 1.96, + "learning_rate": 5.3745755785501304e-06, + "loss": 0.005, + "step": 389320 + }, + { + "epoch": 1.96, + "learning_rate": 5.36700788553612e-06, + "loss": 0.0061, + "step": 389330 + }, + { + "epoch": 1.96, + "learning_rate": 5.35944019252211e-06, + "loss": 0.0056, + "step": 389340 + }, + { + "epoch": 1.96, + "learning_rate": 5.351872499508099e-06, + "loss": 0.0041, + "step": 389350 + }, + { + "epoch": 1.96, + "learning_rate": 5.344304806494089e-06, + "loss": 0.0062, + "step": 389360 + }, + { + "epoch": 1.96, + "learning_rate": 5.336737113480079e-06, + "loss": 0.0051, + "step": 389370 + }, + { + "epoch": 1.96, + "learning_rate": 5.329169420466068e-06, + "loss": 0.0051, + "step": 389380 + }, + { + "epoch": 1.96, + "learning_rate": 5.321601727452058e-06, + "loss": 0.0067, + "step": 389390 + }, + { + "epoch": 1.96, + "learning_rate": 5.314034034438048e-06, + "loss": 0.0049, + "step": 389400 + }, + { + "epoch": 1.96, + "learning_rate": 5.306466341424038e-06, + "loss": 0.0088, + "step": 389410 + }, + { + "epoch": 1.96, + "learning_rate": 5.298898648410027e-06, + "loss": 0.004, + "step": 389420 + }, + { + "epoch": 1.96, + "learning_rate": 5.291330955396017e-06, + "loss": 0.0057, + "step": 389430 + }, + { + "epoch": 1.96, + "learning_rate": 5.283763262382007e-06, + "loss": 0.0057, + "step": 389440 + }, + { + "epoch": 1.96, + "learning_rate": 5.276195569367997e-06, + "loss": 0.0056, + "step": 389450 + }, + { + "epoch": 1.96, + "learning_rate": 5.268627876353986e-06, + "loss": 0.0054, + "step": 389460 + }, + { + "epoch": 1.96, + "learning_rate": 5.261060183339976e-06, + "loss": 0.0039, + "step": 389470 + }, + { + "epoch": 1.96, + "learning_rate": 5.253492490325966e-06, + "loss": 0.0092, + "step": 389480 + }, + { + "epoch": 1.97, + "learning_rate": 5.2459247973119556e-06, + "loss": 0.0053, + "step": 389490 + }, + { + "epoch": 1.97, + "learning_rate": 5.238357104297945e-06, + "loss": 0.0059, + "step": 389500 + }, + { + "epoch": 1.97, + "learning_rate": 5.2307894112839345e-06, + "loss": 0.0048, + "step": 389510 + }, + { + "epoch": 1.97, + "learning_rate": 5.2232217182699244e-06, + "loss": 0.0042, + "step": 389520 + }, + { + "epoch": 1.97, + "learning_rate": 5.215654025255914e-06, + "loss": 0.0058, + "step": 389530 + }, + { + "epoch": 1.97, + "learning_rate": 5.208086332241903e-06, + "loss": 0.0055, + "step": 389540 + }, + { + "epoch": 1.97, + "learning_rate": 5.2005186392278925e-06, + "loss": 0.0027, + "step": 389550 + }, + { + "epoch": 1.97, + "learning_rate": 5.192950946213883e-06, + "loss": 0.0036, + "step": 389560 + }, + { + "epoch": 1.97, + "learning_rate": 5.185383253199873e-06, + "loss": 0.0067, + "step": 389570 + }, + { + "epoch": 1.97, + "learning_rate": 5.177815560185861e-06, + "loss": 0.0056, + "step": 389580 + }, + { + "epoch": 1.97, + "learning_rate": 5.170247867171851e-06, + "loss": 0.0058, + "step": 389590 + }, + { + "epoch": 1.97, + "learning_rate": 5.162680174157841e-06, + "loss": 0.005, + "step": 389600 + }, + { + "epoch": 1.97, + "learning_rate": 5.155112481143831e-06, + "loss": 0.0068, + "step": 389610 + }, + { + "epoch": 1.97, + "learning_rate": 5.14754478812982e-06, + "loss": 0.0055, + "step": 389620 + }, + { + "epoch": 1.97, + "learning_rate": 5.13997709511581e-06, + "loss": 0.0063, + "step": 389630 + }, + { + "epoch": 1.97, + "learning_rate": 5.1324094021018e-06, + "loss": 0.0062, + "step": 389640 + }, + { + "epoch": 1.97, + "learning_rate": 5.12484170908779e-06, + "loss": 0.0073, + "step": 389650 + }, + { + "epoch": 1.97, + "learning_rate": 5.117274016073779e-06, + "loss": 0.0058, + "step": 389660 + }, + { + "epoch": 1.97, + "learning_rate": 5.109706323059769e-06, + "loss": 0.0063, + "step": 389670 + }, + { + "epoch": 1.97, + "learning_rate": 5.102138630045759e-06, + "loss": 0.0029, + "step": 389680 + }, + { + "epoch": 1.97, + "learning_rate": 5.094570937031749e-06, + "loss": 0.0052, + "step": 389690 + }, + { + "epoch": 1.97, + "learning_rate": 5.087003244017738e-06, + "loss": 0.0054, + "step": 389700 + }, + { + "epoch": 1.97, + "learning_rate": 5.079435551003728e-06, + "loss": 0.0052, + "step": 389710 + }, + { + "epoch": 1.97, + "learning_rate": 5.071867857989718e-06, + "loss": 0.0059, + "step": 389720 + }, + { + "epoch": 1.97, + "learning_rate": 5.0643001649757075e-06, + "loss": 0.0059, + "step": 389730 + }, + { + "epoch": 1.97, + "learning_rate": 5.056732471961697e-06, + "loss": 0.0072, + "step": 389740 + }, + { + "epoch": 1.97, + "learning_rate": 5.0491647789476865e-06, + "loss": 0.0055, + "step": 389750 + }, + { + "epoch": 1.97, + "learning_rate": 5.0415970859336764e-06, + "loss": 0.0045, + "step": 389760 + }, + { + "epoch": 1.97, + "learning_rate": 5.034029392919666e-06, + "loss": 0.0055, + "step": 389770 + }, + { + "epoch": 1.97, + "learning_rate": 5.026461699905655e-06, + "loss": 0.0048, + "step": 389780 + }, + { + "epoch": 1.97, + "learning_rate": 5.018894006891645e-06, + "loss": 0.0064, + "step": 389790 + }, + { + "epoch": 1.97, + "learning_rate": 5.011326313877635e-06, + "loss": 0.006, + "step": 389800 + }, + { + "epoch": 1.97, + "learning_rate": 5.003758620863625e-06, + "loss": 0.007, + "step": 389810 + }, + { + "epoch": 1.97, + "learning_rate": 4.996190927849614e-06, + "loss": 0.0051, + "step": 389820 + }, + { + "epoch": 1.97, + "learning_rate": 4.988623234835604e-06, + "loss": 0.0056, + "step": 389830 + }, + { + "epoch": 1.97, + "learning_rate": 4.981055541821594e-06, + "loss": 0.0048, + "step": 389840 + }, + { + "epoch": 1.97, + "learning_rate": 4.973487848807584e-06, + "loss": 0.0042, + "step": 389850 + }, + { + "epoch": 1.97, + "learning_rate": 4.965920155793573e-06, + "loss": 0.0072, + "step": 389860 + }, + { + "epoch": 1.97, + "learning_rate": 4.958352462779563e-06, + "loss": 0.0049, + "step": 389870 + }, + { + "epoch": 1.97, + "learning_rate": 4.950784769765553e-06, + "loss": 0.0052, + "step": 389880 + }, + { + "epoch": 1.97, + "learning_rate": 4.943217076751543e-06, + "loss": 0.0042, + "step": 389890 + }, + { + "epoch": 1.97, + "learning_rate": 4.935649383737532e-06, + "loss": 0.0076, + "step": 389900 + }, + { + "epoch": 1.97, + "learning_rate": 4.928081690723522e-06, + "loss": 0.0056, + "step": 389910 + }, + { + "epoch": 1.97, + "learning_rate": 4.920513997709512e-06, + "loss": 0.0062, + "step": 389920 + }, + { + "epoch": 1.97, + "learning_rate": 4.912946304695501e-06, + "loss": 0.0061, + "step": 389930 + }, + { + "epoch": 1.97, + "learning_rate": 4.905378611681491e-06, + "loss": 0.0058, + "step": 389940 + }, + { + "epoch": 1.97, + "learning_rate": 4.8978109186674805e-06, + "loss": 0.0058, + "step": 389950 + }, + { + "epoch": 1.97, + "learning_rate": 4.8902432256534704e-06, + "loss": 0.0066, + "step": 389960 + }, + { + "epoch": 1.97, + "learning_rate": 4.882675532639459e-06, + "loss": 0.0056, + "step": 389970 + }, + { + "epoch": 1.97, + "learning_rate": 4.875107839625449e-06, + "loss": 0.0048, + "step": 389980 + }, + { + "epoch": 1.97, + "learning_rate": 4.867540146611439e-06, + "loss": 0.0068, + "step": 389990 + }, + { + "epoch": 1.97, + "learning_rate": 4.859972453597429e-06, + "loss": 0.0059, + "step": 390000 + }, + { + "epoch": 1.97, + "eval_cer": 0.9143955354015062, + "eval_loss": 0.004140438511967659, + "eval_runtime": 116.3675, + "eval_samples_per_second": 17.187, + "eval_steps_per_second": 4.297, + "step": 390000 + }, + { + "epoch": 1.97, + "learning_rate": 4.8524047605834175e-06, + "loss": 0.0059, + "step": 390010 + }, + { + "epoch": 1.97, + "learning_rate": 4.844837067569407e-06, + "loss": 0.0046, + "step": 390020 + }, + { + "epoch": 1.97, + "learning_rate": 4.837269374555397e-06, + "loss": 0.0049, + "step": 390030 + }, + { + "epoch": 1.97, + "learning_rate": 4.829701681541387e-06, + "loss": 0.0064, + "step": 390040 + }, + { + "epoch": 1.97, + "learning_rate": 4.822133988527376e-06, + "loss": 0.0044, + "step": 390050 + }, + { + "epoch": 1.97, + "learning_rate": 4.814566295513366e-06, + "loss": 0.0058, + "step": 390060 + }, + { + "epoch": 1.97, + "learning_rate": 4.806998602499356e-06, + "loss": 0.0054, + "step": 390070 + }, + { + "epoch": 1.97, + "learning_rate": 4.799430909485346e-06, + "loss": 0.0064, + "step": 390080 + }, + { + "epoch": 1.97, + "learning_rate": 4.791863216471335e-06, + "loss": 0.0052, + "step": 390090 + }, + { + "epoch": 1.97, + "learning_rate": 4.784295523457325e-06, + "loss": 0.0053, + "step": 390100 + }, + { + "epoch": 1.97, + "learning_rate": 4.776727830443315e-06, + "loss": 0.0043, + "step": 390110 + }, + { + "epoch": 1.97, + "learning_rate": 4.769160137429305e-06, + "loss": 0.0048, + "step": 390120 + }, + { + "epoch": 1.97, + "learning_rate": 4.761592444415294e-06, + "loss": 0.0045, + "step": 390130 + }, + { + "epoch": 1.97, + "learning_rate": 4.754024751401284e-06, + "loss": 0.0033, + "step": 390140 + }, + { + "epoch": 1.97, + "learning_rate": 4.746457058387274e-06, + "loss": 0.0094, + "step": 390150 + }, + { + "epoch": 1.97, + "learning_rate": 4.738889365373264e-06, + "loss": 0.0056, + "step": 390160 + }, + { + "epoch": 1.97, + "learning_rate": 4.731321672359253e-06, + "loss": 0.0068, + "step": 390170 + }, + { + "epoch": 1.97, + "learning_rate": 4.723753979345243e-06, + "loss": 0.0084, + "step": 390180 + }, + { + "epoch": 1.97, + "learning_rate": 4.7161862863312325e-06, + "loss": 0.0051, + "step": 390190 + }, + { + "epoch": 1.97, + "learning_rate": 4.7086185933172224e-06, + "loss": 0.0047, + "step": 390200 + }, + { + "epoch": 1.97, + "learning_rate": 4.7010509003032115e-06, + "loss": 0.0095, + "step": 390210 + }, + { + "epoch": 1.97, + "learning_rate": 4.693483207289201e-06, + "loss": 0.0061, + "step": 390220 + }, + { + "epoch": 1.97, + "learning_rate": 4.685915514275191e-06, + "loss": 0.006, + "step": 390230 + }, + { + "epoch": 1.97, + "learning_rate": 4.67834782126118e-06, + "loss": 0.0035, + "step": 390240 + }, + { + "epoch": 1.97, + "learning_rate": 4.67078012824717e-06, + "loss": 0.0049, + "step": 390250 + }, + { + "epoch": 1.97, + "learning_rate": 4.66321243523316e-06, + "loss": 0.0071, + "step": 390260 + }, + { + "epoch": 1.97, + "learning_rate": 4.65564474221915e-06, + "loss": 0.0063, + "step": 390270 + }, + { + "epoch": 1.97, + "learning_rate": 4.648077049205139e-06, + "loss": 0.006, + "step": 390280 + }, + { + "epoch": 1.97, + "learning_rate": 4.640509356191129e-06, + "loss": 0.0044, + "step": 390290 + }, + { + "epoch": 1.97, + "learning_rate": 4.632941663177119e-06, + "loss": 0.0045, + "step": 390300 + }, + { + "epoch": 1.97, + "learning_rate": 4.625373970163109e-06, + "loss": 0.0066, + "step": 390310 + }, + { + "epoch": 1.97, + "learning_rate": 4.617806277149098e-06, + "loss": 0.0052, + "step": 390320 + }, + { + "epoch": 1.97, + "learning_rate": 4.610238584135088e-06, + "loss": 0.0048, + "step": 390330 + }, + { + "epoch": 1.97, + "learning_rate": 4.602670891121078e-06, + "loss": 0.0059, + "step": 390340 + }, + { + "epoch": 1.97, + "learning_rate": 4.595103198107068e-06, + "loss": 0.0058, + "step": 390350 + }, + { + "epoch": 1.97, + "learning_rate": 4.587535505093057e-06, + "loss": 0.0054, + "step": 390360 + }, + { + "epoch": 1.97, + "learning_rate": 4.579967812079047e-06, + "loss": 0.0065, + "step": 390370 + }, + { + "epoch": 1.97, + "learning_rate": 4.572400119065037e-06, + "loss": 0.0063, + "step": 390380 + }, + { + "epoch": 1.97, + "learning_rate": 4.5648324260510265e-06, + "loss": 0.0057, + "step": 390390 + }, + { + "epoch": 1.97, + "learning_rate": 4.557264733037016e-06, + "loss": 0.0058, + "step": 390400 + }, + { + "epoch": 1.97, + "learning_rate": 4.5496970400230055e-06, + "loss": 0.0055, + "step": 390410 + }, + { + "epoch": 1.97, + "learning_rate": 4.5421293470089954e-06, + "loss": 0.0079, + "step": 390420 + }, + { + "epoch": 1.97, + "learning_rate": 4.534561653994985e-06, + "loss": 0.0052, + "step": 390430 + }, + { + "epoch": 1.97, + "learning_rate": 4.526993960980974e-06, + "loss": 0.0042, + "step": 390440 + }, + { + "epoch": 1.97, + "learning_rate": 4.5194262679669635e-06, + "loss": 0.0043, + "step": 390450 + }, + { + "epoch": 1.97, + "learning_rate": 4.511858574952953e-06, + "loss": 0.0058, + "step": 390460 + }, + { + "epoch": 1.97, + "learning_rate": 4.504290881938943e-06, + "loss": 0.0055, + "step": 390470 + }, + { + "epoch": 1.97, + "learning_rate": 4.496723188924933e-06, + "loss": 0.0058, + "step": 390480 + }, + { + "epoch": 1.97, + "learning_rate": 4.489155495910922e-06, + "loss": 0.0099, + "step": 390490 + }, + { + "epoch": 1.97, + "learning_rate": 4.481587802896912e-06, + "loss": 0.0068, + "step": 390500 + }, + { + "epoch": 1.97, + "learning_rate": 4.474020109882902e-06, + "loss": 0.0059, + "step": 390510 + }, + { + "epoch": 1.97, + "learning_rate": 4.466452416868892e-06, + "loss": 0.0052, + "step": 390520 + }, + { + "epoch": 1.97, + "learning_rate": 4.458884723854881e-06, + "loss": 0.0053, + "step": 390530 + }, + { + "epoch": 1.97, + "learning_rate": 4.451317030840871e-06, + "loss": 0.0045, + "step": 390540 + }, + { + "epoch": 1.97, + "learning_rate": 4.443749337826861e-06, + "loss": 0.0046, + "step": 390550 + }, + { + "epoch": 1.97, + "learning_rate": 4.436181644812851e-06, + "loss": 0.0071, + "step": 390560 + }, + { + "epoch": 1.97, + "learning_rate": 4.42861395179884e-06, + "loss": 0.0071, + "step": 390570 + }, + { + "epoch": 1.97, + "learning_rate": 4.42104625878483e-06, + "loss": 0.0059, + "step": 390580 + }, + { + "epoch": 1.97, + "learning_rate": 4.41347856577082e-06, + "loss": 0.0036, + "step": 390590 + }, + { + "epoch": 1.97, + "learning_rate": 4.40591087275681e-06, + "loss": 0.0047, + "step": 390600 + }, + { + "epoch": 1.97, + "learning_rate": 4.398343179742799e-06, + "loss": 0.004, + "step": 390610 + }, + { + "epoch": 1.97, + "learning_rate": 4.390775486728789e-06, + "loss": 0.0074, + "step": 390620 + }, + { + "epoch": 1.97, + "learning_rate": 4.3832077937147785e-06, + "loss": 0.0056, + "step": 390630 + }, + { + "epoch": 1.97, + "learning_rate": 4.3756401007007684e-06, + "loss": 0.0057, + "step": 390640 + }, + { + "epoch": 1.97, + "learning_rate": 4.3680724076867575e-06, + "loss": 0.0057, + "step": 390650 + }, + { + "epoch": 1.97, + "learning_rate": 4.360504714672747e-06, + "loss": 0.0053, + "step": 390660 + }, + { + "epoch": 1.97, + "learning_rate": 4.3529370216587365e-06, + "loss": 0.0062, + "step": 390670 + }, + { + "epoch": 1.97, + "learning_rate": 4.345369328644727e-06, + "loss": 0.0043, + "step": 390680 + }, + { + "epoch": 1.97, + "learning_rate": 4.337801635630716e-06, + "loss": 0.0089, + "step": 390690 + }, + { + "epoch": 1.97, + "learning_rate": 4.330233942616706e-06, + "loss": 0.0051, + "step": 390700 + }, + { + "epoch": 1.97, + "learning_rate": 4.322666249602695e-06, + "loss": 0.0059, + "step": 390710 + }, + { + "epoch": 1.97, + "learning_rate": 4.315098556588685e-06, + "loss": 0.0051, + "step": 390720 + }, + { + "epoch": 1.97, + "learning_rate": 4.307530863574675e-06, + "loss": 0.0055, + "step": 390730 + }, + { + "epoch": 1.97, + "learning_rate": 4.299963170560665e-06, + "loss": 0.0056, + "step": 390740 + }, + { + "epoch": 1.97, + "learning_rate": 4.292395477546654e-06, + "loss": 0.0047, + "step": 390750 + }, + { + "epoch": 1.97, + "learning_rate": 4.284827784532644e-06, + "loss": 0.0071, + "step": 390760 + }, + { + "epoch": 1.97, + "learning_rate": 4.277260091518634e-06, + "loss": 0.0052, + "step": 390770 + }, + { + "epoch": 1.97, + "learning_rate": 4.269692398504624e-06, + "loss": 0.0046, + "step": 390780 + }, + { + "epoch": 1.97, + "learning_rate": 4.262124705490613e-06, + "loss": 0.0056, + "step": 390790 + }, + { + "epoch": 1.97, + "learning_rate": 4.254557012476603e-06, + "loss": 0.0088, + "step": 390800 + }, + { + "epoch": 1.97, + "learning_rate": 4.246989319462593e-06, + "loss": 0.0038, + "step": 390810 + }, + { + "epoch": 1.97, + "learning_rate": 4.239421626448583e-06, + "loss": 0.0046, + "step": 390820 + }, + { + "epoch": 1.97, + "learning_rate": 4.231853933434572e-06, + "loss": 0.0093, + "step": 390830 + }, + { + "epoch": 1.97, + "learning_rate": 4.224286240420562e-06, + "loss": 0.0093, + "step": 390840 + }, + { + "epoch": 1.97, + "learning_rate": 4.2167185474065515e-06, + "loss": 0.0056, + "step": 390850 + }, + { + "epoch": 1.97, + "learning_rate": 4.2091508543925414e-06, + "loss": 0.0048, + "step": 390860 + }, + { + "epoch": 1.97, + "learning_rate": 4.2015831613785305e-06, + "loss": 0.0055, + "step": 390870 + }, + { + "epoch": 1.97, + "learning_rate": 4.19401546836452e-06, + "loss": 0.0041, + "step": 390880 + }, + { + "epoch": 1.97, + "learning_rate": 4.18644777535051e-06, + "loss": 0.0059, + "step": 390890 + }, + { + "epoch": 1.97, + "learning_rate": 4.1788800823365e-06, + "loss": 0.007, + "step": 390900 + }, + { + "epoch": 1.97, + "learning_rate": 4.171312389322489e-06, + "loss": 0.0055, + "step": 390910 + }, + { + "epoch": 1.97, + "learning_rate": 4.163744696308479e-06, + "loss": 0.0055, + "step": 390920 + }, + { + "epoch": 1.97, + "learning_rate": 4.156177003294468e-06, + "loss": 0.0071, + "step": 390930 + }, + { + "epoch": 1.97, + "learning_rate": 4.148609310280458e-06, + "loss": 0.0044, + "step": 390940 + }, + { + "epoch": 1.97, + "learning_rate": 4.141041617266448e-06, + "loss": 0.007, + "step": 390950 + }, + { + "epoch": 1.97, + "learning_rate": 4.133473924252438e-06, + "loss": 0.0038, + "step": 390960 + }, + { + "epoch": 1.97, + "learning_rate": 4.125906231238427e-06, + "loss": 0.0057, + "step": 390970 + }, + { + "epoch": 1.97, + "learning_rate": 4.118338538224417e-06, + "loss": 0.005, + "step": 390980 + }, + { + "epoch": 1.97, + "learning_rate": 4.110770845210407e-06, + "loss": 0.0062, + "step": 390990 + }, + { + "epoch": 1.97, + "learning_rate": 4.103203152196396e-06, + "loss": 0.0061, + "step": 391000 + }, + { + "epoch": 1.97, + "eval_cer": 0.9144003873821333, + "eval_loss": 0.00414480222389102, + "eval_runtime": 116.2164, + "eval_samples_per_second": 17.209, + "eval_steps_per_second": 4.302, + "step": 391000 + }, + { + "epoch": 1.97, + "learning_rate": 4.095635459182386e-06, + "loss": 0.0084, + "step": 391010 + }, + { + "epoch": 1.97, + "learning_rate": 4.088067766168376e-06, + "loss": 0.0054, + "step": 391020 + }, + { + "epoch": 1.97, + "learning_rate": 4.080500073154366e-06, + "loss": 0.0064, + "step": 391030 + }, + { + "epoch": 1.97, + "learning_rate": 4.072932380140355e-06, + "loss": 0.0057, + "step": 391040 + }, + { + "epoch": 1.97, + "learning_rate": 4.065364687126345e-06, + "loss": 0.0049, + "step": 391050 + }, + { + "epoch": 1.97, + "learning_rate": 4.057796994112335e-06, + "loss": 0.0048, + "step": 391060 + }, + { + "epoch": 1.97, + "learning_rate": 4.0502293010983245e-06, + "loss": 0.0054, + "step": 391070 + }, + { + "epoch": 1.97, + "learning_rate": 4.042661608084314e-06, + "loss": 0.004, + "step": 391080 + }, + { + "epoch": 1.97, + "learning_rate": 4.0350939150703035e-06, + "loss": 0.0058, + "step": 391090 + }, + { + "epoch": 1.97, + "learning_rate": 4.027526222056293e-06, + "loss": 0.0046, + "step": 391100 + }, + { + "epoch": 1.97, + "learning_rate": 4.019958529042283e-06, + "loss": 0.0063, + "step": 391110 + }, + { + "epoch": 1.97, + "learning_rate": 4.012390836028272e-06, + "loss": 0.0045, + "step": 391120 + }, + { + "epoch": 1.97, + "learning_rate": 4.004823143014262e-06, + "loss": 0.0058, + "step": 391130 + }, + { + "epoch": 1.97, + "learning_rate": 3.997255450000251e-06, + "loss": 0.0054, + "step": 391140 + }, + { + "epoch": 1.97, + "learning_rate": 3.989687756986241e-06, + "loss": 0.0035, + "step": 391150 + }, + { + "epoch": 1.97, + "learning_rate": 3.982120063972231e-06, + "loss": 0.0049, + "step": 391160 + }, + { + "epoch": 1.97, + "learning_rate": 3.974552370958221e-06, + "loss": 0.0056, + "step": 391170 + }, + { + "epoch": 1.97, + "learning_rate": 3.96698467794421e-06, + "loss": 0.0053, + "step": 391180 + }, + { + "epoch": 1.97, + "learning_rate": 3.9594169849302e-06, + "loss": 0.0054, + "step": 391190 + }, + { + "epoch": 1.97, + "learning_rate": 3.95184929191619e-06, + "loss": 0.0049, + "step": 391200 + }, + { + "epoch": 1.97, + "learning_rate": 3.94428159890218e-06, + "loss": 0.006, + "step": 391210 + }, + { + "epoch": 1.97, + "learning_rate": 3.936713905888169e-06, + "loss": 0.0052, + "step": 391220 + }, + { + "epoch": 1.97, + "learning_rate": 3.929146212874159e-06, + "loss": 0.0053, + "step": 391230 + }, + { + "epoch": 1.97, + "learning_rate": 3.921578519860149e-06, + "loss": 0.0072, + "step": 391240 + }, + { + "epoch": 1.97, + "learning_rate": 3.914010826846139e-06, + "loss": 0.0052, + "step": 391250 + }, + { + "epoch": 1.97, + "learning_rate": 3.906443133832128e-06, + "loss": 0.0064, + "step": 391260 + }, + { + "epoch": 1.97, + "learning_rate": 3.898875440818118e-06, + "loss": 0.0041, + "step": 391270 + }, + { + "epoch": 1.97, + "learning_rate": 3.891307747804108e-06, + "loss": 0.0048, + "step": 391280 + }, + { + "epoch": 1.97, + "learning_rate": 3.8837400547900975e-06, + "loss": 0.0046, + "step": 391290 + }, + { + "epoch": 1.97, + "learning_rate": 3.876172361776087e-06, + "loss": 0.0065, + "step": 391300 + }, + { + "epoch": 1.97, + "learning_rate": 3.8686046687620765e-06, + "loss": 0.0061, + "step": 391310 + }, + { + "epoch": 1.97, + "learning_rate": 3.861036975748066e-06, + "loss": 0.0092, + "step": 391320 + }, + { + "epoch": 1.97, + "learning_rate": 3.853469282734056e-06, + "loss": 0.0039, + "step": 391330 + }, + { + "epoch": 1.97, + "learning_rate": 3.845901589720045e-06, + "loss": 0.0042, + "step": 391340 + }, + { + "epoch": 1.97, + "learning_rate": 3.838333896706035e-06, + "loss": 0.0051, + "step": 391350 + }, + { + "epoch": 1.97, + "learning_rate": 3.830766203692024e-06, + "loss": 0.0053, + "step": 391360 + }, + { + "epoch": 1.97, + "learning_rate": 3.823198510678014e-06, + "loss": 0.0039, + "step": 391370 + }, + { + "epoch": 1.97, + "learning_rate": 3.815630817664004e-06, + "loss": 0.0054, + "step": 391380 + }, + { + "epoch": 1.97, + "learning_rate": 3.808063124649994e-06, + "loss": 0.0062, + "step": 391390 + }, + { + "epoch": 1.97, + "learning_rate": 3.8004954316359836e-06, + "loss": 0.0057, + "step": 391400 + }, + { + "epoch": 1.97, + "learning_rate": 3.7929277386219735e-06, + "loss": 0.0047, + "step": 391410 + }, + { + "epoch": 1.97, + "learning_rate": 3.785360045607963e-06, + "loss": 0.0054, + "step": 391420 + }, + { + "epoch": 1.97, + "learning_rate": 3.777792352593953e-06, + "loss": 0.006, + "step": 391430 + }, + { + "epoch": 1.97, + "learning_rate": 3.7702246595799424e-06, + "loss": 0.0035, + "step": 391440 + }, + { + "epoch": 1.97, + "learning_rate": 3.7626569665659323e-06, + "loss": 0.0038, + "step": 391450 + }, + { + "epoch": 1.97, + "learning_rate": 3.7550892735519214e-06, + "loss": 0.0053, + "step": 391460 + }, + { + "epoch": 1.98, + "learning_rate": 3.7475215805379117e-06, + "loss": 0.0053, + "step": 391470 + }, + { + "epoch": 1.98, + "learning_rate": 3.7399538875239008e-06, + "loss": 0.0048, + "step": 391480 + }, + { + "epoch": 1.98, + "learning_rate": 3.7323861945098907e-06, + "loss": 0.0047, + "step": 391490 + }, + { + "epoch": 1.98, + "learning_rate": 3.72481850149588e-06, + "loss": 0.0091, + "step": 391500 + }, + { + "epoch": 1.98, + "learning_rate": 3.71725080848187e-06, + "loss": 0.0053, + "step": 391510 + }, + { + "epoch": 1.98, + "learning_rate": 3.7096831154678596e-06, + "loss": 0.0064, + "step": 391520 + }, + { + "epoch": 1.98, + "learning_rate": 3.702115422453849e-06, + "loss": 0.0049, + "step": 391530 + }, + { + "epoch": 1.98, + "learning_rate": 3.694547729439839e-06, + "loss": 0.0063, + "step": 391540 + }, + { + "epoch": 1.98, + "learning_rate": 3.6869800364258285e-06, + "loss": 0.0049, + "step": 391550 + }, + { + "epoch": 1.98, + "learning_rate": 3.6794123434118184e-06, + "loss": 0.0054, + "step": 391560 + }, + { + "epoch": 1.98, + "learning_rate": 3.671844650397808e-06, + "loss": 0.0055, + "step": 391570 + }, + { + "epoch": 1.98, + "learning_rate": 3.6642769573837978e-06, + "loss": 0.0064, + "step": 391580 + }, + { + "epoch": 1.98, + "learning_rate": 3.6567092643697873e-06, + "loss": 0.0055, + "step": 391590 + }, + { + "epoch": 1.98, + "learning_rate": 3.649141571355777e-06, + "loss": 0.0051, + "step": 391600 + }, + { + "epoch": 1.98, + "learning_rate": 3.6415738783417667e-06, + "loss": 0.004, + "step": 391610 + }, + { + "epoch": 1.98, + "learning_rate": 3.6340061853277566e-06, + "loss": 0.0051, + "step": 391620 + }, + { + "epoch": 1.98, + "learning_rate": 3.626438492313746e-06, + "loss": 0.0081, + "step": 391630 + }, + { + "epoch": 1.98, + "learning_rate": 3.618870799299736e-06, + "loss": 0.009, + "step": 391640 + }, + { + "epoch": 1.98, + "learning_rate": 3.6113031062857255e-06, + "loss": 0.0033, + "step": 391650 + }, + { + "epoch": 1.98, + "learning_rate": 3.6037354132717154e-06, + "loss": 0.006, + "step": 391660 + }, + { + "epoch": 1.98, + "learning_rate": 3.5961677202577045e-06, + "loss": 0.0046, + "step": 391670 + }, + { + "epoch": 1.98, + "learning_rate": 3.588600027243695e-06, + "loss": 0.0057, + "step": 391680 + }, + { + "epoch": 1.98, + "learning_rate": 3.581032334229684e-06, + "loss": 0.0076, + "step": 391690 + }, + { + "epoch": 1.98, + "learning_rate": 3.5734646412156738e-06, + "loss": 0.0063, + "step": 391700 + }, + { + "epoch": 1.98, + "learning_rate": 3.5658969482016633e-06, + "loss": 0.0055, + "step": 391710 + }, + { + "epoch": 1.98, + "learning_rate": 3.558329255187653e-06, + "loss": 0.005, + "step": 391720 + }, + { + "epoch": 1.98, + "learning_rate": 3.5507615621736427e-06, + "loss": 0.0072, + "step": 391730 + }, + { + "epoch": 1.98, + "learning_rate": 3.5431938691596326e-06, + "loss": 0.0058, + "step": 391740 + }, + { + "epoch": 1.98, + "learning_rate": 3.535626176145622e-06, + "loss": 0.0039, + "step": 391750 + }, + { + "epoch": 1.98, + "learning_rate": 3.528058483131612e-06, + "loss": 0.0067, + "step": 391760 + }, + { + "epoch": 1.98, + "learning_rate": 3.5204907901176015e-06, + "loss": 0.0043, + "step": 391770 + }, + { + "epoch": 1.98, + "learning_rate": 3.5129230971035914e-06, + "loss": 0.0057, + "step": 391780 + }, + { + "epoch": 1.98, + "learning_rate": 3.505355404089581e-06, + "loss": 0.0087, + "step": 391790 + }, + { + "epoch": 1.98, + "learning_rate": 3.4977877110755708e-06, + "loss": 0.0045, + "step": 391800 + }, + { + "epoch": 1.98, + "learning_rate": 3.4902200180615603e-06, + "loss": 0.0046, + "step": 391810 + }, + { + "epoch": 1.98, + "learning_rate": 3.48265232504755e-06, + "loss": 0.0051, + "step": 391820 + }, + { + "epoch": 1.98, + "learning_rate": 3.4750846320335397e-06, + "loss": 0.006, + "step": 391830 + }, + { + "epoch": 1.98, + "learning_rate": 3.4675169390195296e-06, + "loss": 0.0066, + "step": 391840 + }, + { + "epoch": 1.98, + "learning_rate": 3.459949246005519e-06, + "loss": 0.0051, + "step": 391850 + }, + { + "epoch": 1.98, + "learning_rate": 3.452381552991509e-06, + "loss": 0.0046, + "step": 391860 + }, + { + "epoch": 1.98, + "learning_rate": 3.4448138599774985e-06, + "loss": 0.009, + "step": 391870 + }, + { + "epoch": 1.98, + "learning_rate": 3.4372461669634884e-06, + "loss": 0.0059, + "step": 391880 + }, + { + "epoch": 1.98, + "learning_rate": 3.429678473949478e-06, + "loss": 0.0049, + "step": 391890 + }, + { + "epoch": 1.98, + "learning_rate": 3.422110780935468e-06, + "loss": 0.0061, + "step": 391900 + }, + { + "epoch": 1.98, + "learning_rate": 3.414543087921457e-06, + "loss": 0.0063, + "step": 391910 + }, + { + "epoch": 1.98, + "learning_rate": 3.406975394907447e-06, + "loss": 0.008, + "step": 391920 + }, + { + "epoch": 1.98, + "learning_rate": 3.3994077018934363e-06, + "loss": 0.0062, + "step": 391930 + }, + { + "epoch": 1.98, + "learning_rate": 3.391840008879426e-06, + "loss": 0.0052, + "step": 391940 + }, + { + "epoch": 1.98, + "learning_rate": 3.3842723158654157e-06, + "loss": 0.0044, + "step": 391950 + }, + { + "epoch": 1.98, + "learning_rate": 3.3767046228514056e-06, + "loss": 0.0078, + "step": 391960 + }, + { + "epoch": 1.98, + "learning_rate": 3.369136929837395e-06, + "loss": 0.0048, + "step": 391970 + }, + { + "epoch": 1.98, + "learning_rate": 3.361569236823385e-06, + "loss": 0.0071, + "step": 391980 + }, + { + "epoch": 1.98, + "learning_rate": 3.3540015438093745e-06, + "loss": 0.004, + "step": 391990 + }, + { + "epoch": 1.98, + "learning_rate": 3.3464338507953644e-06, + "loss": 0.0048, + "step": 392000 + }, + { + "epoch": 1.98, + "eval_cer": 0.9144130025317635, + "eval_loss": 0.004128037486225367, + "eval_runtime": 116.0593, + "eval_samples_per_second": 17.233, + "eval_steps_per_second": 4.308, + "step": 392000 + }, + { + "epoch": 1.98, + "learning_rate": 3.338866157781354e-06, + "loss": 0.0077, + "step": 392010 + }, + { + "epoch": 1.98, + "learning_rate": 3.331298464767344e-06, + "loss": 0.0051, + "step": 392020 + }, + { + "epoch": 1.98, + "learning_rate": 3.3237307717533333e-06, + "loss": 0.004, + "step": 392030 + }, + { + "epoch": 1.98, + "learning_rate": 3.316163078739323e-06, + "loss": 0.0056, + "step": 392040 + }, + { + "epoch": 1.98, + "learning_rate": 3.3085953857253127e-06, + "loss": 0.0052, + "step": 392050 + }, + { + "epoch": 1.98, + "learning_rate": 3.3010276927113026e-06, + "loss": 0.0064, + "step": 392060 + }, + { + "epoch": 1.98, + "learning_rate": 3.293459999697292e-06, + "loss": 0.0061, + "step": 392070 + }, + { + "epoch": 1.98, + "learning_rate": 3.2858923066832816e-06, + "loss": 0.0061, + "step": 392080 + }, + { + "epoch": 1.98, + "learning_rate": 3.2783246136692715e-06, + "loss": 0.0051, + "step": 392090 + }, + { + "epoch": 1.98, + "learning_rate": 3.270756920655261e-06, + "loss": 0.0055, + "step": 392100 + }, + { + "epoch": 1.98, + "learning_rate": 3.263189227641251e-06, + "loss": 0.005, + "step": 392110 + }, + { + "epoch": 1.98, + "learning_rate": 3.25562153462724e-06, + "loss": 0.0054, + "step": 392120 + }, + { + "epoch": 1.98, + "learning_rate": 3.2480538416132303e-06, + "loss": 0.004, + "step": 392130 + }, + { + "epoch": 1.98, + "learning_rate": 3.2404861485992194e-06, + "loss": 0.0061, + "step": 392140 + }, + { + "epoch": 1.98, + "learning_rate": 3.2329184555852093e-06, + "loss": 0.0055, + "step": 392150 + }, + { + "epoch": 1.98, + "learning_rate": 3.2253507625711988e-06, + "loss": 0.0042, + "step": 392160 + }, + { + "epoch": 1.98, + "learning_rate": 3.2177830695571887e-06, + "loss": 0.01, + "step": 392170 + }, + { + "epoch": 1.98, + "learning_rate": 3.210215376543178e-06, + "loss": 0.0038, + "step": 392180 + }, + { + "epoch": 1.98, + "learning_rate": 3.202647683529168e-06, + "loss": 0.0051, + "step": 392190 + }, + { + "epoch": 1.98, + "learning_rate": 3.1950799905151576e-06, + "loss": 0.0054, + "step": 392200 + }, + { + "epoch": 1.98, + "learning_rate": 3.1875122975011475e-06, + "loss": 0.0056, + "step": 392210 + }, + { + "epoch": 1.98, + "learning_rate": 3.179944604487137e-06, + "loss": 0.0052, + "step": 392220 + }, + { + "epoch": 1.98, + "learning_rate": 3.172376911473127e-06, + "loss": 0.004, + "step": 392230 + }, + { + "epoch": 1.98, + "learning_rate": 3.1648092184591164e-06, + "loss": 0.0033, + "step": 392240 + }, + { + "epoch": 1.98, + "learning_rate": 3.1572415254451063e-06, + "loss": 0.0056, + "step": 392250 + }, + { + "epoch": 1.98, + "learning_rate": 3.1496738324310958e-06, + "loss": 0.0044, + "step": 392260 + }, + { + "epoch": 1.98, + "learning_rate": 3.1421061394170857e-06, + "loss": 0.005, + "step": 392270 + }, + { + "epoch": 1.98, + "learning_rate": 3.134538446403075e-06, + "loss": 0.0049, + "step": 392280 + }, + { + "epoch": 1.98, + "learning_rate": 3.126970753389065e-06, + "loss": 0.0052, + "step": 392290 + }, + { + "epoch": 1.98, + "learning_rate": 3.1194030603750546e-06, + "loss": 0.0047, + "step": 392300 + }, + { + "epoch": 1.98, + "learning_rate": 3.1118353673610445e-06, + "loss": 0.0059, + "step": 392310 + }, + { + "epoch": 1.98, + "learning_rate": 3.104267674347034e-06, + "loss": 0.0068, + "step": 392320 + }, + { + "epoch": 1.98, + "learning_rate": 3.096699981333024e-06, + "loss": 0.0064, + "step": 392330 + }, + { + "epoch": 1.98, + "learning_rate": 3.0891322883190134e-06, + "loss": 0.0061, + "step": 392340 + }, + { + "epoch": 1.98, + "learning_rate": 3.0815645953050033e-06, + "loss": 0.0046, + "step": 392350 + }, + { + "epoch": 1.98, + "learning_rate": 3.0739969022909924e-06, + "loss": 0.0095, + "step": 392360 + }, + { + "epoch": 1.98, + "learning_rate": 3.0664292092769827e-06, + "loss": 0.0051, + "step": 392370 + }, + { + "epoch": 1.98, + "learning_rate": 3.0588615162629718e-06, + "loss": 0.0036, + "step": 392380 + }, + { + "epoch": 1.98, + "learning_rate": 3.0512938232489617e-06, + "loss": 0.0042, + "step": 392390 + }, + { + "epoch": 1.98, + "learning_rate": 3.043726130234951e-06, + "loss": 0.0054, + "step": 392400 + }, + { + "epoch": 1.98, + "learning_rate": 3.036158437220941e-06, + "loss": 0.0077, + "step": 392410 + }, + { + "epoch": 1.98, + "learning_rate": 3.0285907442069306e-06, + "loss": 0.0063, + "step": 392420 + }, + { + "epoch": 1.98, + "learning_rate": 3.0210230511929205e-06, + "loss": 0.0034, + "step": 392430 + }, + { + "epoch": 1.98, + "learning_rate": 3.01345535817891e-06, + "loss": 0.0081, + "step": 392440 + }, + { + "epoch": 1.98, + "learning_rate": 3.0058876651649e-06, + "loss": 0.0055, + "step": 392450 + }, + { + "epoch": 1.98, + "learning_rate": 2.9983199721508894e-06, + "loss": 0.0056, + "step": 392460 + }, + { + "epoch": 1.98, + "learning_rate": 2.9907522791368793e-06, + "loss": 0.0046, + "step": 392470 + }, + { + "epoch": 1.98, + "learning_rate": 2.9831845861228688e-06, + "loss": 0.0063, + "step": 392480 + }, + { + "epoch": 1.98, + "learning_rate": 2.9756168931088587e-06, + "loss": 0.0078, + "step": 392490 + }, + { + "epoch": 1.98, + "learning_rate": 2.968049200094848e-06, + "loss": 0.0049, + "step": 392500 + }, + { + "epoch": 1.98, + "learning_rate": 2.960481507080838e-06, + "loss": 0.0044, + "step": 392510 + }, + { + "epoch": 1.98, + "learning_rate": 2.9529138140668276e-06, + "loss": 0.0063, + "step": 392520 + }, + { + "epoch": 1.98, + "learning_rate": 2.9453461210528175e-06, + "loss": 0.0051, + "step": 392530 + }, + { + "epoch": 1.98, + "learning_rate": 2.937778428038807e-06, + "loss": 0.0075, + "step": 392540 + }, + { + "epoch": 1.98, + "learning_rate": 2.930210735024797e-06, + "loss": 0.0053, + "step": 392550 + }, + { + "epoch": 1.98, + "learning_rate": 2.9226430420107864e-06, + "loss": 0.0042, + "step": 392560 + }, + { + "epoch": 1.98, + "learning_rate": 2.9150753489967763e-06, + "loss": 0.0062, + "step": 392570 + }, + { + "epoch": 1.98, + "learning_rate": 2.9075076559827658e-06, + "loss": 0.0094, + "step": 392580 + }, + { + "epoch": 1.98, + "learning_rate": 2.8999399629687557e-06, + "loss": 0.004, + "step": 392590 + }, + { + "epoch": 1.98, + "learning_rate": 2.8923722699547448e-06, + "loss": 0.0071, + "step": 392600 + }, + { + "epoch": 1.98, + "learning_rate": 2.8848045769407347e-06, + "loss": 0.0082, + "step": 392610 + }, + { + "epoch": 1.98, + "learning_rate": 2.877236883926724e-06, + "loss": 0.0052, + "step": 392620 + }, + { + "epoch": 1.98, + "learning_rate": 2.8696691909127136e-06, + "loss": 0.0043, + "step": 392630 + }, + { + "epoch": 1.98, + "learning_rate": 2.8621014978987036e-06, + "loss": 0.004, + "step": 392640 + }, + { + "epoch": 1.98, + "learning_rate": 2.854533804884693e-06, + "loss": 0.0063, + "step": 392650 + }, + { + "epoch": 1.98, + "learning_rate": 2.846966111870683e-06, + "loss": 0.0045, + "step": 392660 + }, + { + "epoch": 1.98, + "learning_rate": 2.8393984188566725e-06, + "loss": 0.0035, + "step": 392670 + }, + { + "epoch": 1.98, + "learning_rate": 2.8318307258426624e-06, + "loss": 0.0055, + "step": 392680 + }, + { + "epoch": 1.98, + "learning_rate": 2.824263032828652e-06, + "loss": 0.0048, + "step": 392690 + }, + { + "epoch": 1.98, + "learning_rate": 2.8166953398146418e-06, + "loss": 0.006, + "step": 392700 + }, + { + "epoch": 1.98, + "learning_rate": 2.8091276468006313e-06, + "loss": 0.0047, + "step": 392710 + }, + { + "epoch": 1.98, + "learning_rate": 2.801559953786621e-06, + "loss": 0.0072, + "step": 392720 + }, + { + "epoch": 1.98, + "learning_rate": 2.7939922607726107e-06, + "loss": 0.0072, + "step": 392730 + }, + { + "epoch": 1.98, + "learning_rate": 2.7864245677586006e-06, + "loss": 0.0058, + "step": 392740 + }, + { + "epoch": 1.98, + "learning_rate": 2.77885687474459e-06, + "loss": 0.0055, + "step": 392750 + }, + { + "epoch": 1.98, + "learning_rate": 2.77128918173058e-06, + "loss": 0.0057, + "step": 392760 + }, + { + "epoch": 1.98, + "learning_rate": 2.7637214887165695e-06, + "loss": 0.0065, + "step": 392770 + }, + { + "epoch": 1.98, + "learning_rate": 2.7561537957025594e-06, + "loss": 0.0039, + "step": 392780 + }, + { + "epoch": 1.98, + "learning_rate": 2.7485861026885484e-06, + "loss": 0.0066, + "step": 392790 + }, + { + "epoch": 1.98, + "learning_rate": 2.7410184096745388e-06, + "loss": 0.0073, + "step": 392800 + }, + { + "epoch": 1.98, + "learning_rate": 2.733450716660528e-06, + "loss": 0.0041, + "step": 392810 + }, + { + "epoch": 1.98, + "learning_rate": 2.7258830236465178e-06, + "loss": 0.0048, + "step": 392820 + }, + { + "epoch": 1.98, + "learning_rate": 2.7183153306325072e-06, + "loss": 0.0054, + "step": 392830 + }, + { + "epoch": 1.98, + "learning_rate": 2.710747637618497e-06, + "loss": 0.005, + "step": 392840 + }, + { + "epoch": 1.98, + "learning_rate": 2.7031799446044866e-06, + "loss": 0.0046, + "step": 392850 + }, + { + "epoch": 1.98, + "learning_rate": 2.6956122515904766e-06, + "loss": 0.0054, + "step": 392860 + }, + { + "epoch": 1.98, + "learning_rate": 2.688044558576466e-06, + "loss": 0.005, + "step": 392870 + }, + { + "epoch": 1.98, + "learning_rate": 2.680476865562456e-06, + "loss": 0.0038, + "step": 392880 + }, + { + "epoch": 1.98, + "learning_rate": 2.6729091725484455e-06, + "loss": 0.0049, + "step": 392890 + }, + { + "epoch": 1.98, + "learning_rate": 2.6653414795344354e-06, + "loss": 0.0053, + "step": 392900 + }, + { + "epoch": 1.98, + "learning_rate": 2.657773786520425e-06, + "loss": 0.006, + "step": 392910 + }, + { + "epoch": 1.98, + "learning_rate": 2.6502060935064148e-06, + "loss": 0.0067, + "step": 392920 + }, + { + "epoch": 1.98, + "learning_rate": 2.6426384004924043e-06, + "loss": 0.0068, + "step": 392930 + }, + { + "epoch": 1.98, + "learning_rate": 2.635070707478394e-06, + "loss": 0.0044, + "step": 392940 + }, + { + "epoch": 1.98, + "learning_rate": 2.6275030144643837e-06, + "loss": 0.0058, + "step": 392950 + }, + { + "epoch": 1.98, + "learning_rate": 2.6199353214503736e-06, + "loss": 0.0042, + "step": 392960 + }, + { + "epoch": 1.98, + "learning_rate": 2.612367628436363e-06, + "loss": 0.0049, + "step": 392970 + }, + { + "epoch": 1.98, + "learning_rate": 2.604799935422353e-06, + "loss": 0.005, + "step": 392980 + }, + { + "epoch": 1.98, + "learning_rate": 2.5972322424083425e-06, + "loss": 0.0045, + "step": 392990 + }, + { + "epoch": 1.98, + "learning_rate": 2.5896645493943324e-06, + "loss": 0.0069, + "step": 393000 + }, + { + "epoch": 1.98, + "eval_cer": 0.9144188249085159, + "eval_loss": 0.004126059357076883, + "eval_runtime": 116.0572, + "eval_samples_per_second": 17.233, + "eval_steps_per_second": 4.308, + "step": 393000 + }, + { + "epoch": 1.98, + "learning_rate": 2.582096856380322e-06, + "loss": 0.0053, + "step": 393010 + }, + { + "epoch": 1.98, + "learning_rate": 2.5745291633663118e-06, + "loss": 0.01, + "step": 393020 + }, + { + "epoch": 1.98, + "learning_rate": 2.566961470352301e-06, + "loss": 0.005, + "step": 393030 + }, + { + "epoch": 1.98, + "learning_rate": 2.559393777338291e-06, + "loss": 0.0069, + "step": 393040 + }, + { + "epoch": 1.98, + "learning_rate": 2.5518260843242802e-06, + "loss": 0.0043, + "step": 393050 + }, + { + "epoch": 1.98, + "learning_rate": 2.54425839131027e-06, + "loss": 0.0065, + "step": 393060 + }, + { + "epoch": 1.98, + "learning_rate": 2.5366906982962596e-06, + "loss": 0.0053, + "step": 393070 + }, + { + "epoch": 1.98, + "learning_rate": 2.5291230052822496e-06, + "loss": 0.0051, + "step": 393080 + }, + { + "epoch": 1.98, + "learning_rate": 2.521555312268239e-06, + "loss": 0.0072, + "step": 393090 + }, + { + "epoch": 1.98, + "learning_rate": 2.513987619254229e-06, + "loss": 0.005, + "step": 393100 + }, + { + "epoch": 1.98, + "learning_rate": 2.5064199262402185e-06, + "loss": 0.005, + "step": 393110 + }, + { + "epoch": 1.98, + "learning_rate": 2.4988522332262084e-06, + "loss": 0.006, + "step": 393120 + }, + { + "epoch": 1.98, + "learning_rate": 2.491284540212198e-06, + "loss": 0.005, + "step": 393130 + }, + { + "epoch": 1.98, + "learning_rate": 2.4837168471981878e-06, + "loss": 0.0049, + "step": 393140 + }, + { + "epoch": 1.98, + "learning_rate": 2.4761491541841773e-06, + "loss": 0.0053, + "step": 393150 + }, + { + "epoch": 1.98, + "learning_rate": 2.4685814611701667e-06, + "loss": 0.0042, + "step": 393160 + }, + { + "epoch": 1.98, + "learning_rate": 2.4610137681561567e-06, + "loss": 0.0057, + "step": 393170 + }, + { + "epoch": 1.98, + "learning_rate": 2.453446075142146e-06, + "loss": 0.0075, + "step": 393180 + }, + { + "epoch": 1.98, + "learning_rate": 2.445878382128136e-06, + "loss": 0.0069, + "step": 393190 + }, + { + "epoch": 1.98, + "learning_rate": 2.4383106891141256e-06, + "loss": 0.0038, + "step": 393200 + }, + { + "epoch": 1.98, + "learning_rate": 2.4307429961001155e-06, + "loss": 0.0048, + "step": 393210 + }, + { + "epoch": 1.98, + "learning_rate": 2.423175303086105e-06, + "loss": 0.007, + "step": 393220 + }, + { + "epoch": 1.98, + "learning_rate": 2.415607610072095e-06, + "loss": 0.0049, + "step": 393230 + }, + { + "epoch": 1.98, + "learning_rate": 2.408039917058084e-06, + "loss": 0.0062, + "step": 393240 + }, + { + "epoch": 1.98, + "learning_rate": 2.4004722240440743e-06, + "loss": 0.0051, + "step": 393250 + }, + { + "epoch": 1.98, + "learning_rate": 2.3929045310300633e-06, + "loss": 0.0052, + "step": 393260 + }, + { + "epoch": 1.98, + "learning_rate": 2.3853368380160532e-06, + "loss": 0.0055, + "step": 393270 + }, + { + "epoch": 1.98, + "learning_rate": 2.3777691450020427e-06, + "loss": 0.0047, + "step": 393280 + }, + { + "epoch": 1.98, + "learning_rate": 2.3702014519880327e-06, + "loss": 0.0045, + "step": 393290 + }, + { + "epoch": 1.98, + "learning_rate": 2.362633758974022e-06, + "loss": 0.0048, + "step": 393300 + }, + { + "epoch": 1.98, + "learning_rate": 2.355066065960012e-06, + "loss": 0.0052, + "step": 393310 + }, + { + "epoch": 1.98, + "learning_rate": 2.3474983729460015e-06, + "loss": 0.0064, + "step": 393320 + }, + { + "epoch": 1.98, + "learning_rate": 2.3399306799319915e-06, + "loss": 0.0075, + "step": 393330 + }, + { + "epoch": 1.98, + "learning_rate": 2.3323629869179814e-06, + "loss": 0.0049, + "step": 393340 + }, + { + "epoch": 1.98, + "learning_rate": 2.324795293903971e-06, + "loss": 0.0092, + "step": 393350 + }, + { + "epoch": 1.98, + "learning_rate": 2.3172276008899608e-06, + "loss": 0.0072, + "step": 393360 + }, + { + "epoch": 1.98, + "learning_rate": 2.3096599078759503e-06, + "loss": 0.0064, + "step": 393370 + }, + { + "epoch": 1.98, + "learning_rate": 2.3020922148619397e-06, + "loss": 0.008, + "step": 393380 + }, + { + "epoch": 1.98, + "learning_rate": 2.2945245218479297e-06, + "loss": 0.0091, + "step": 393390 + }, + { + "epoch": 1.98, + "learning_rate": 2.286956828833919e-06, + "loss": 0.0048, + "step": 393400 + }, + { + "epoch": 1.98, + "learning_rate": 2.279389135819909e-06, + "loss": 0.0055, + "step": 393410 + }, + { + "epoch": 1.98, + "learning_rate": 2.2718214428058986e-06, + "loss": 0.0047, + "step": 393420 + }, + { + "epoch": 1.98, + "learning_rate": 2.2642537497918885e-06, + "loss": 0.0053, + "step": 393430 + }, + { + "epoch": 1.98, + "learning_rate": 2.256686056777878e-06, + "loss": 0.0059, + "step": 393440 + }, + { + "epoch": 1.98, + "learning_rate": 2.2491183637638674e-06, + "loss": 0.0043, + "step": 393450 + }, + { + "epoch": 1.99, + "learning_rate": 2.2415506707498574e-06, + "loss": 0.006, + "step": 393460 + }, + { + "epoch": 1.99, + "learning_rate": 2.233982977735847e-06, + "loss": 0.0056, + "step": 393470 + }, + { + "epoch": 1.99, + "learning_rate": 2.2264152847218363e-06, + "loss": 0.0046, + "step": 393480 + }, + { + "epoch": 1.99, + "learning_rate": 2.2188475917078262e-06, + "loss": 0.0063, + "step": 393490 + }, + { + "epoch": 1.99, + "learning_rate": 2.2112798986938157e-06, + "loss": 0.0049, + "step": 393500 + }, + { + "epoch": 1.99, + "learning_rate": 2.2037122056798057e-06, + "loss": 0.0059, + "step": 393510 + }, + { + "epoch": 1.99, + "learning_rate": 2.196144512665795e-06, + "loss": 0.0071, + "step": 393520 + }, + { + "epoch": 1.99, + "learning_rate": 2.188576819651785e-06, + "loss": 0.0075, + "step": 393530 + }, + { + "epoch": 1.99, + "learning_rate": 2.1810091266377745e-06, + "loss": 0.0065, + "step": 393540 + }, + { + "epoch": 1.99, + "learning_rate": 2.1734414336237645e-06, + "loss": 0.007, + "step": 393550 + }, + { + "epoch": 1.99, + "learning_rate": 2.165873740609754e-06, + "loss": 0.007, + "step": 393560 + }, + { + "epoch": 1.99, + "learning_rate": 2.158306047595744e-06, + "loss": 0.0054, + "step": 393570 + }, + { + "epoch": 1.99, + "learning_rate": 2.1507383545817333e-06, + "loss": 0.0037, + "step": 393580 + }, + { + "epoch": 1.99, + "learning_rate": 2.143170661567723e-06, + "loss": 0.005, + "step": 393590 + }, + { + "epoch": 1.99, + "learning_rate": 2.1356029685537127e-06, + "loss": 0.0076, + "step": 393600 + }, + { + "epoch": 1.99, + "learning_rate": 2.1280352755397022e-06, + "loss": 0.0066, + "step": 393610 + }, + { + "epoch": 1.99, + "learning_rate": 2.120467582525692e-06, + "loss": 0.0054, + "step": 393620 + }, + { + "epoch": 1.99, + "learning_rate": 2.1128998895116816e-06, + "loss": 0.0048, + "step": 393630 + }, + { + "epoch": 1.99, + "learning_rate": 2.1053321964976716e-06, + "loss": 0.0085, + "step": 393640 + }, + { + "epoch": 1.99, + "learning_rate": 2.097764503483661e-06, + "loss": 0.0042, + "step": 393650 + }, + { + "epoch": 1.99, + "learning_rate": 2.090196810469651e-06, + "loss": 0.0063, + "step": 393660 + }, + { + "epoch": 1.99, + "learning_rate": 2.0826291174556404e-06, + "loss": 0.0067, + "step": 393670 + }, + { + "epoch": 1.99, + "learning_rate": 2.0750614244416304e-06, + "loss": 0.0048, + "step": 393680 + }, + { + "epoch": 1.99, + "learning_rate": 2.06749373142762e-06, + "loss": 0.0066, + "step": 393690 + }, + { + "epoch": 1.99, + "learning_rate": 2.0599260384136098e-06, + "loss": 0.0069, + "step": 393700 + }, + { + "epoch": 1.99, + "learning_rate": 2.0523583453995992e-06, + "loss": 0.0059, + "step": 393710 + }, + { + "epoch": 1.99, + "learning_rate": 2.0447906523855887e-06, + "loss": 0.0066, + "step": 393720 + }, + { + "epoch": 1.99, + "learning_rate": 2.0372229593715787e-06, + "loss": 0.007, + "step": 393730 + }, + { + "epoch": 1.99, + "learning_rate": 2.029655266357568e-06, + "loss": 0.0072, + "step": 393740 + }, + { + "epoch": 1.99, + "learning_rate": 2.022087573343558e-06, + "loss": 0.0047, + "step": 393750 + }, + { + "epoch": 1.99, + "learning_rate": 2.0145198803295475e-06, + "loss": 0.0066, + "step": 393760 + }, + { + "epoch": 1.99, + "learning_rate": 2.0069521873155375e-06, + "loss": 0.0054, + "step": 393770 + }, + { + "epoch": 1.99, + "learning_rate": 1.999384494301527e-06, + "loss": 0.0057, + "step": 393780 + }, + { + "epoch": 1.99, + "learning_rate": 1.991816801287517e-06, + "loss": 0.0039, + "step": 393790 + }, + { + "epoch": 1.99, + "learning_rate": 1.9842491082735063e-06, + "loss": 0.005, + "step": 393800 + }, + { + "epoch": 1.99, + "learning_rate": 1.9766814152594963e-06, + "loss": 0.0051, + "step": 393810 + }, + { + "epoch": 1.99, + "learning_rate": 1.9691137222454857e-06, + "loss": 0.006, + "step": 393820 + }, + { + "epoch": 1.99, + "learning_rate": 1.9615460292314752e-06, + "loss": 0.0049, + "step": 393830 + }, + { + "epoch": 1.99, + "learning_rate": 1.953978336217465e-06, + "loss": 0.0051, + "step": 393840 + }, + { + "epoch": 1.99, + "learning_rate": 1.9464106432034546e-06, + "loss": 0.0055, + "step": 393850 + }, + { + "epoch": 1.99, + "learning_rate": 1.9388429501894446e-06, + "loss": 0.0036, + "step": 393860 + }, + { + "epoch": 1.99, + "learning_rate": 1.931275257175434e-06, + "loss": 0.0066, + "step": 393870 + }, + { + "epoch": 1.99, + "learning_rate": 1.923707564161424e-06, + "loss": 0.0051, + "step": 393880 + }, + { + "epoch": 1.99, + "learning_rate": 1.9161398711474134e-06, + "loss": 0.0059, + "step": 393890 + }, + { + "epoch": 1.99, + "learning_rate": 1.9085721781334034e-06, + "loss": 0.0053, + "step": 393900 + }, + { + "epoch": 1.99, + "learning_rate": 1.9010044851193928e-06, + "loss": 0.007, + "step": 393910 + }, + { + "epoch": 1.99, + "learning_rate": 1.8934367921053825e-06, + "loss": 0.0079, + "step": 393920 + }, + { + "epoch": 1.99, + "learning_rate": 1.8858690990913722e-06, + "loss": 0.0077, + "step": 393930 + }, + { + "epoch": 1.99, + "learning_rate": 1.878301406077362e-06, + "loss": 0.0078, + "step": 393940 + }, + { + "epoch": 1.99, + "learning_rate": 1.8707337130633517e-06, + "loss": 0.006, + "step": 393950 + }, + { + "epoch": 1.99, + "learning_rate": 1.8631660200493414e-06, + "loss": 0.0053, + "step": 393960 + }, + { + "epoch": 1.99, + "learning_rate": 1.855598327035331e-06, + "loss": 0.0037, + "step": 393970 + }, + { + "epoch": 1.99, + "learning_rate": 1.8480306340213203e-06, + "loss": 0.0062, + "step": 393980 + }, + { + "epoch": 1.99, + "learning_rate": 1.84046294100731e-06, + "loss": 0.006, + "step": 393990 + }, + { + "epoch": 1.99, + "learning_rate": 1.8328952479932997e-06, + "loss": 0.0053, + "step": 394000 + }, + { + "epoch": 1.99, + "eval_cer": 0.9144168841162651, + "eval_loss": 0.004111087881028652, + "eval_runtime": 116.0484, + "eval_samples_per_second": 17.234, + "eval_steps_per_second": 4.309, + "step": 394000 + }, + { + "epoch": 1.99, + "learning_rate": 1.8253275549792894e-06, + "loss": 0.0062, + "step": 394010 + }, + { + "epoch": 1.99, + "learning_rate": 1.8177598619652791e-06, + "loss": 0.0054, + "step": 394020 + }, + { + "epoch": 1.99, + "learning_rate": 1.8101921689512688e-06, + "loss": 0.0059, + "step": 394030 + }, + { + "epoch": 1.99, + "learning_rate": 1.8026244759372585e-06, + "loss": 0.005, + "step": 394040 + }, + { + "epoch": 1.99, + "learning_rate": 1.7950567829232482e-06, + "loss": 0.0062, + "step": 394050 + }, + { + "epoch": 1.99, + "learning_rate": 1.787489089909238e-06, + "loss": 0.0051, + "step": 394060 + }, + { + "epoch": 1.99, + "learning_rate": 1.7799213968952276e-06, + "loss": 0.0051, + "step": 394070 + }, + { + "epoch": 1.99, + "learning_rate": 1.7723537038812173e-06, + "loss": 0.0047, + "step": 394080 + }, + { + "epoch": 1.99, + "learning_rate": 1.764786010867207e-06, + "loss": 0.0046, + "step": 394090 + }, + { + "epoch": 1.99, + "learning_rate": 1.7572183178531965e-06, + "loss": 0.0053, + "step": 394100 + }, + { + "epoch": 1.99, + "learning_rate": 1.7496506248391862e-06, + "loss": 0.0046, + "step": 394110 + }, + { + "epoch": 1.99, + "learning_rate": 1.742082931825176e-06, + "loss": 0.0062, + "step": 394120 + }, + { + "epoch": 1.99, + "learning_rate": 1.7345152388111656e-06, + "loss": 0.0045, + "step": 394130 + }, + { + "epoch": 1.99, + "learning_rate": 1.7269475457971553e-06, + "loss": 0.006, + "step": 394140 + }, + { + "epoch": 1.99, + "learning_rate": 1.719379852783145e-06, "loss": 0.0057, - "step": 184980 + "step": 394150 + }, + { + "epoch": 1.99, + "learning_rate": 1.7118121597691347e-06, + "loss": 0.0055, + "step": 394160 + }, + { + "epoch": 1.99, + "learning_rate": 1.7042444667551244e-06, + "loss": 0.0048, + "step": 394170 + }, + { + "epoch": 1.99, + "learning_rate": 1.6966767737411141e-06, + "loss": 0.0041, + "step": 394180 + }, + { + "epoch": 1.99, + "learning_rate": 1.6891090807271038e-06, + "loss": 0.0071, + "step": 394190 + }, + { + "epoch": 1.99, + "learning_rate": 1.6815413877130935e-06, + "loss": 0.0059, + "step": 394200 + }, + { + "epoch": 1.99, + "learning_rate": 1.673973694699083e-06, + "loss": 0.0045, + "step": 394210 + }, + { + "epoch": 1.99, + "learning_rate": 1.6664060016850727e-06, + "loss": 0.0053, + "step": 394220 + }, + { + "epoch": 1.99, + "learning_rate": 1.6588383086710624e-06, + "loss": 0.0075, + "step": 394230 + }, + { + "epoch": 1.99, + "learning_rate": 1.6512706156570521e-06, + "loss": 0.0047, + "step": 394240 + }, + { + "epoch": 1.99, + "learning_rate": 1.6437029226430418e-06, + "loss": 0.0053, + "step": 394250 + }, + { + "epoch": 1.99, + "learning_rate": 1.6361352296290315e-06, + "loss": 0.0046, + "step": 394260 + }, + { + "epoch": 1.99, + "learning_rate": 1.6285675366150212e-06, + "loss": 0.0049, + "step": 394270 + }, + { + "epoch": 1.99, + "learning_rate": 1.620999843601011e-06, + "loss": 0.007, + "step": 394280 + }, + { + "epoch": 1.99, + "learning_rate": 1.6134321505870006e-06, + "loss": 0.0071, + "step": 394290 + }, + { + "epoch": 1.99, + "learning_rate": 1.6058644575729903e-06, + "loss": 0.0059, + "step": 394300 + }, + { + "epoch": 1.99, + "learning_rate": 1.59829676455898e-06, + "loss": 0.0046, + "step": 394310 + }, + { + "epoch": 1.99, + "learning_rate": 1.5907290715449697e-06, + "loss": 0.0058, + "step": 394320 + }, + { + "epoch": 1.99, + "learning_rate": 1.5831613785309592e-06, + "loss": 0.0063, + "step": 394330 + }, + { + "epoch": 1.99, + "learning_rate": 1.575593685516949e-06, + "loss": 0.005, + "step": 394340 + }, + { + "epoch": 1.99, + "learning_rate": 1.5680259925029386e-06, + "loss": 0.0046, + "step": 394350 + }, + { + "epoch": 1.99, + "learning_rate": 1.5604582994889283e-06, + "loss": 0.0044, + "step": 394360 + }, + { + "epoch": 1.99, + "learning_rate": 1.552890606474918e-06, + "loss": 0.005, + "step": 394370 + }, + { + "epoch": 1.99, + "learning_rate": 1.5453229134609077e-06, + "loss": 0.0063, + "step": 394380 + }, + { + "epoch": 1.99, + "learning_rate": 1.5377552204468974e-06, + "loss": 0.0064, + "step": 394390 + }, + { + "epoch": 1.99, + "learning_rate": 1.5301875274328871e-06, + "loss": 0.0061, + "step": 394400 + }, + { + "epoch": 1.99, + "learning_rate": 1.5226198344188768e-06, + "loss": 0.0071, + "step": 394410 + }, + { + "epoch": 1.99, + "learning_rate": 1.5150521414048665e-06, + "loss": 0.006, + "step": 394420 + }, + { + "epoch": 1.99, + "learning_rate": 1.5074844483908562e-06, + "loss": 0.0063, + "step": 394430 + }, + { + "epoch": 1.99, + "learning_rate": 1.499916755376846e-06, + "loss": 0.0037, + "step": 394440 + }, + { + "epoch": 1.99, + "learning_rate": 1.4923490623628354e-06, + "loss": 0.0047, + "step": 394450 + }, + { + "epoch": 1.99, + "learning_rate": 1.4847813693488251e-06, + "loss": 0.0053, + "step": 394460 + }, + { + "epoch": 1.99, + "learning_rate": 1.4772136763348148e-06, + "loss": 0.0051, + "step": 394470 + }, + { + "epoch": 1.99, + "learning_rate": 1.4696459833208045e-06, + "loss": 0.005, + "step": 394480 + }, + { + "epoch": 1.99, + "learning_rate": 1.4620782903067942e-06, + "loss": 0.0075, + "step": 394490 + }, + { + "epoch": 1.99, + "learning_rate": 1.454510597292784e-06, + "loss": 0.0063, + "step": 394500 + }, + { + "epoch": 1.99, + "learning_rate": 1.4469429042787736e-06, + "loss": 0.0043, + "step": 394510 + }, + { + "epoch": 1.99, + "learning_rate": 1.4393752112647631e-06, + "loss": 0.0044, + "step": 394520 + }, + { + "epoch": 1.99, + "learning_rate": 1.4318075182507528e-06, + "loss": 0.0048, + "step": 394530 + }, + { + "epoch": 1.99, + "learning_rate": 1.4242398252367423e-06, + "loss": 0.0061, + "step": 394540 + }, + { + "epoch": 1.99, + "learning_rate": 1.416672132222732e-06, + "loss": 0.007, + "step": 394550 + }, + { + "epoch": 1.99, + "learning_rate": 1.4091044392087217e-06, + "loss": 0.0042, + "step": 394560 + }, + { + "epoch": 1.99, + "learning_rate": 1.4015367461947114e-06, + "loss": 0.0042, + "step": 394570 + }, + { + "epoch": 1.99, + "learning_rate": 1.3939690531807011e-06, + "loss": 0.005, + "step": 394580 + }, + { + "epoch": 1.99, + "learning_rate": 1.3864013601666908e-06, + "loss": 0.0062, + "step": 394590 + }, + { + "epoch": 1.99, + "learning_rate": 1.3788336671526805e-06, + "loss": 0.0074, + "step": 394600 + }, + { + "epoch": 1.99, + "learning_rate": 1.3712659741386702e-06, + "loss": 0.0055, + "step": 394610 + }, + { + "epoch": 1.99, + "learning_rate": 1.36369828112466e-06, + "loss": 0.0052, + "step": 394620 + }, + { + "epoch": 1.99, + "learning_rate": 1.3561305881106496e-06, + "loss": 0.004, + "step": 394630 + }, + { + "epoch": 1.99, + "learning_rate": 1.3485628950966393e-06, + "loss": 0.0093, + "step": 394640 + }, + { + "epoch": 1.99, + "learning_rate": 1.340995202082629e-06, + "loss": 0.0063, + "step": 394650 + }, + { + "epoch": 1.99, + "learning_rate": 1.3334275090686185e-06, + "loss": 0.0048, + "step": 394660 + }, + { + "epoch": 1.99, + "learning_rate": 1.3258598160546082e-06, + "loss": 0.0072, + "step": 394670 + }, + { + "epoch": 1.99, + "learning_rate": 1.318292123040598e-06, + "loss": 0.0054, + "step": 394680 + }, + { + "epoch": 1.99, + "learning_rate": 1.3107244300265876e-06, + "loss": 0.0043, + "step": 394690 + }, + { + "epoch": 1.99, + "learning_rate": 1.3031567370125773e-06, + "loss": 0.0046, + "step": 394700 + }, + { + "epoch": 1.99, + "learning_rate": 1.295589043998567e-06, + "loss": 0.0046, + "step": 394710 + }, + { + "epoch": 1.99, + "learning_rate": 1.2880213509845567e-06, + "loss": 0.0069, + "step": 394720 + }, + { + "epoch": 1.99, + "learning_rate": 1.2804536579705464e-06, + "loss": 0.0058, + "step": 394730 + }, + { + "epoch": 1.99, + "learning_rate": 1.2728859649565361e-06, + "loss": 0.0044, + "step": 394740 + }, + { + "epoch": 1.99, + "learning_rate": 1.2653182719425258e-06, + "loss": 0.0052, + "step": 394750 + }, + { + "epoch": 1.99, + "learning_rate": 1.2577505789285155e-06, + "loss": 0.0067, + "step": 394760 + }, + { + "epoch": 1.99, + "learning_rate": 1.2501828859145052e-06, + "loss": 0.0053, + "step": 394770 + }, + { + "epoch": 1.99, + "learning_rate": 1.2426151929004947e-06, + "loss": 0.0084, + "step": 394780 + }, + { + "epoch": 1.99, + "learning_rate": 1.2350474998864844e-06, + "loss": 0.0058, + "step": 394790 + }, + { + "epoch": 1.99, + "learning_rate": 1.2274798068724741e-06, + "loss": 0.0066, + "step": 394800 + }, + { + "epoch": 1.99, + "learning_rate": 1.2199121138584638e-06, + "loss": 0.0061, + "step": 394810 + }, + { + "epoch": 1.99, + "learning_rate": 1.2123444208444535e-06, + "loss": 0.0048, + "step": 394820 + }, + { + "epoch": 1.99, + "learning_rate": 1.2047767278304432e-06, + "loss": 0.0051, + "step": 394830 + }, + { + "epoch": 1.99, + "learning_rate": 1.197209034816433e-06, + "loss": 0.0089, + "step": 394840 + }, + { + "epoch": 1.99, + "learning_rate": 1.1896413418024226e-06, + "loss": 0.0069, + "step": 394850 + }, + { + "epoch": 1.99, + "learning_rate": 1.1820736487884123e-06, + "loss": 0.0043, + "step": 394860 + }, + { + "epoch": 1.99, + "learning_rate": 1.174505955774402e-06, + "loss": 0.0074, + "step": 394870 + }, + { + "epoch": 1.99, + "learning_rate": 1.1669382627603917e-06, + "loss": 0.0052, + "step": 394880 + }, + { + "epoch": 1.99, + "learning_rate": 1.1593705697463812e-06, + "loss": 0.0048, + "step": 394890 + }, + { + "epoch": 1.99, + "learning_rate": 1.151802876732371e-06, + "loss": 0.0045, + "step": 394900 + }, + { + "epoch": 1.99, + "learning_rate": 1.1442351837183606e-06, + "loss": 0.0047, + "step": 394910 + }, + { + "epoch": 1.99, + "learning_rate": 1.1366674907043503e-06, + "loss": 0.0048, + "step": 394920 + }, + { + "epoch": 1.99, + "learning_rate": 1.12909979769034e-06, + "loss": 0.0046, + "step": 394930 + }, + { + "epoch": 1.99, + "learning_rate": 1.1215321046763295e-06, + "loss": 0.0046, + "step": 394940 + }, + { + "epoch": 1.99, + "learning_rate": 1.1139644116623192e-06, + "loss": 0.0043, + "step": 394950 + }, + { + "epoch": 1.99, + "learning_rate": 1.106396718648309e-06, + "loss": 0.0062, + "step": 394960 + }, + { + "epoch": 1.99, + "learning_rate": 1.0988290256342986e-06, + "loss": 0.0056, + "step": 394970 + }, + { + "epoch": 1.99, + "learning_rate": 1.0912613326202883e-06, + "loss": 0.0034, + "step": 394980 + }, + { + "epoch": 1.99, + "learning_rate": 1.083693639606278e-06, + "loss": 0.0043, + "step": 394990 + }, + { + "epoch": 1.99, + "learning_rate": 1.0761259465922677e-06, + "loss": 0.0048, + "step": 395000 + }, + { + "epoch": 1.99, + "eval_cer": 0.9144168841162651, + "eval_loss": 0.004111517686396837, + "eval_runtime": 115.9763, + "eval_samples_per_second": 17.245, + "eval_steps_per_second": 4.311, + "step": 395000 + }, + { + "epoch": 1.99, + "learning_rate": 1.0685582535782574e-06, + "loss": 0.0043, + "step": 395010 + }, + { + "epoch": 1.99, + "learning_rate": 1.0609905605642471e-06, + "loss": 0.0083, + "step": 395020 + }, + { + "epoch": 1.99, + "learning_rate": 1.0534228675502368e-06, + "loss": 0.0055, + "step": 395030 + }, + { + "epoch": 1.99, + "learning_rate": 1.0458551745362265e-06, + "loss": 0.0054, + "step": 395040 + }, + { + "epoch": 1.99, + "learning_rate": 1.0382874815222162e-06, + "loss": 0.0062, + "step": 395050 + }, + { + "epoch": 1.99, + "learning_rate": 1.0307197885082057e-06, + "loss": 0.0048, + "step": 395060 + }, + { + "epoch": 1.99, + "learning_rate": 1.0231520954941954e-06, + "loss": 0.0065, + "step": 395070 + }, + { + "epoch": 1.99, + "learning_rate": 1.0155844024801851e-06, + "loss": 0.0055, + "step": 395080 + }, + { + "epoch": 1.99, + "learning_rate": 1.0080167094661748e-06, + "loss": 0.0058, + "step": 395090 + }, + { + "epoch": 1.99, + "learning_rate": 1.0004490164521645e-06, + "loss": 0.0066, + "step": 395100 + }, + { + "epoch": 1.99, + "learning_rate": 9.928813234381542e-07, + "loss": 0.0042, + "step": 395110 + }, + { + "epoch": 1.99, + "learning_rate": 9.85313630424144e-07, + "loss": 0.0051, + "step": 395120 + }, + { + "epoch": 1.99, + "learning_rate": 9.777459374101336e-07, + "loss": 0.0048, + "step": 395130 + }, + { + "epoch": 1.99, + "learning_rate": 9.701782443961233e-07, + "loss": 0.0041, + "step": 395140 + }, + { + "epoch": 1.99, + "learning_rate": 9.62610551382113e-07, + "loss": 0.0046, + "step": 395150 + }, + { + "epoch": 1.99, + "learning_rate": 9.550428583681027e-07, + "loss": 0.0058, + "step": 395160 + }, + { + "epoch": 1.99, + "learning_rate": 9.474751653540923e-07, + "loss": 0.0049, + "step": 395170 + }, + { + "epoch": 1.99, + "learning_rate": 9.39907472340082e-07, + "loss": 0.0058, + "step": 395180 + }, + { + "epoch": 1.99, + "learning_rate": 9.323397793260717e-07, + "loss": 0.0057, + "step": 395190 + }, + { + "epoch": 1.99, + "learning_rate": 9.247720863120612e-07, + "loss": 0.0089, + "step": 395200 + }, + { + "epoch": 1.99, + "learning_rate": 9.172043932980509e-07, + "loss": 0.006, + "step": 395210 + }, + { + "epoch": 1.99, + "learning_rate": 9.096367002840406e-07, + "loss": 0.005, + "step": 395220 + }, + { + "epoch": 1.99, + "learning_rate": 9.020690072700303e-07, + "loss": 0.0051, + "step": 395230 + }, + { + "epoch": 1.99, + "learning_rate": 8.9450131425602e-07, + "loss": 0.006, + "step": 395240 + }, + { + "epoch": 1.99, + "learning_rate": 8.869336212420096e-07, + "loss": 0.0049, + "step": 395250 + }, + { + "epoch": 1.99, + "learning_rate": 8.793659282279993e-07, + "loss": 0.0057, + "step": 395260 + }, + { + "epoch": 1.99, + "learning_rate": 8.71798235213989e-07, + "loss": 0.0048, + "step": 395270 + }, + { + "epoch": 1.99, + "learning_rate": 8.642305421999787e-07, + "loss": 0.004, + "step": 395280 + }, + { + "epoch": 1.99, + "learning_rate": 8.566628491859684e-07, + "loss": 0.0033, + "step": 395290 + }, + { + "epoch": 1.99, + "learning_rate": 8.490951561719581e-07, + "loss": 0.0053, + "step": 395300 + }, + { + "epoch": 1.99, + "learning_rate": 8.415274631579477e-07, + "loss": 0.0056, + "step": 395310 + }, + { + "epoch": 1.99, + "learning_rate": 8.339597701439374e-07, + "loss": 0.0054, + "step": 395320 + }, + { + "epoch": 1.99, + "learning_rate": 8.263920771299271e-07, + "loss": 0.0045, + "step": 395330 + }, + { + "epoch": 1.99, + "learning_rate": 8.188243841159168e-07, + "loss": 0.0059, + "step": 395340 + }, + { + "epoch": 1.99, + "learning_rate": 8.112566911019065e-07, + "loss": 0.0061, + "step": 395350 + }, + { + "epoch": 1.99, + "learning_rate": 8.036889980878962e-07, + "loss": 0.005, + "step": 395360 + }, + { + "epoch": 1.99, + "learning_rate": 7.961213050738858e-07, + "loss": 0.0051, + "step": 395370 + }, + { + "epoch": 1.99, + "learning_rate": 7.885536120598755e-07, + "loss": 0.0066, + "step": 395380 + }, + { + "epoch": 1.99, + "learning_rate": 7.809859190458652e-07, + "loss": 0.0048, + "step": 395390 + }, + { + "epoch": 1.99, + "learning_rate": 7.734182260318549e-07, + "loss": 0.0054, + "step": 395400 + }, + { + "epoch": 1.99, + "learning_rate": 7.658505330178446e-07, + "loss": 0.0068, + "step": 395410 + }, + { + "epoch": 1.99, + "learning_rate": 7.582828400038343e-07, + "loss": 0.0089, + "step": 395420 + }, + { + "epoch": 1.99, + "learning_rate": 7.507151469898239e-07, + "loss": 0.0066, + "step": 395430 + }, + { + "epoch": 2.0, + "learning_rate": 7.431474539758136e-07, + "loss": 0.0056, + "step": 395440 + }, + { + "epoch": 2.0, + "learning_rate": 7.355797609618033e-07, + "loss": 0.0045, + "step": 395450 + }, + { + "epoch": 2.0, + "learning_rate": 7.28012067947793e-07, + "loss": 0.0056, + "step": 395460 + }, + { + "epoch": 2.0, + "learning_rate": 7.204443749337827e-07, + "loss": 0.0042, + "step": 395470 + }, + { + "epoch": 2.0, + "learning_rate": 7.128766819197722e-07, + "loss": 0.0059, + "step": 395480 + }, + { + "epoch": 2.0, + "learning_rate": 7.053089889057619e-07, + "loss": 0.008, + "step": 395490 + }, + { + "epoch": 2.0, + "learning_rate": 6.977412958917516e-07, + "loss": 0.0062, + "step": 395500 + }, + { + "epoch": 2.0, + "learning_rate": 6.901736028777413e-07, + "loss": 0.0062, + "step": 395510 + }, + { + "epoch": 2.0, + "learning_rate": 6.82605909863731e-07, + "loss": 0.0042, + "step": 395520 + }, + { + "epoch": 2.0, + "learning_rate": 6.750382168497206e-07, + "loss": 0.004, + "step": 395530 + }, + { + "epoch": 2.0, + "learning_rate": 6.674705238357103e-07, + "loss": 0.0054, + "step": 395540 + }, + { + "epoch": 2.0, + "learning_rate": 6.599028308217e-07, + "loss": 0.0066, + "step": 395550 + }, + { + "epoch": 2.0, + "learning_rate": 6.523351378076897e-07, + "loss": 0.0051, + "step": 395560 + }, + { + "epoch": 2.0, + "learning_rate": 6.447674447936794e-07, + "loss": 0.0068, + "step": 395570 + }, + { + "epoch": 2.0, + "learning_rate": 6.371997517796691e-07, + "loss": 0.0058, + "step": 395580 + }, + { + "epoch": 2.0, + "learning_rate": 6.296320587656587e-07, + "loss": 0.0053, + "step": 395590 + }, + { + "epoch": 2.0, + "learning_rate": 6.220643657516484e-07, + "loss": 0.0043, + "step": 395600 + }, + { + "epoch": 2.0, + "learning_rate": 6.144966727376381e-07, + "loss": 0.0056, + "step": 395610 + }, + { + "epoch": 2.0, + "learning_rate": 6.069289797236278e-07, + "loss": 0.0036, + "step": 395620 + }, + { + "epoch": 2.0, + "learning_rate": 5.993612867096175e-07, + "loss": 0.0052, + "step": 395630 + }, + { + "epoch": 2.0, + "learning_rate": 5.917935936956072e-07, + "loss": 0.0069, + "step": 395640 + }, + { + "epoch": 2.0, + "learning_rate": 5.842259006815968e-07, + "loss": 0.0048, + "step": 395650 + }, + { + "epoch": 2.0, + "learning_rate": 5.766582076675865e-07, + "loss": 0.0064, + "step": 395660 + }, + { + "epoch": 2.0, + "learning_rate": 5.690905146535762e-07, + "loss": 0.005, + "step": 395670 + }, + { + "epoch": 2.0, + "learning_rate": 5.615228216395658e-07, + "loss": 0.0061, + "step": 395680 + }, + { + "epoch": 2.0, + "learning_rate": 5.539551286255555e-07, + "loss": 0.0051, + "step": 395690 + }, + { + "epoch": 2.0, + "learning_rate": 5.463874356115452e-07, + "loss": 0.0065, + "step": 395700 + }, + { + "epoch": 2.0, + "learning_rate": 5.388197425975349e-07, + "loss": 0.0054, + "step": 395710 + }, + { + "epoch": 2.0, + "learning_rate": 5.312520495835246e-07, + "loss": 0.0042, + "step": 395720 + }, + { + "epoch": 2.0, + "learning_rate": 5.236843565695142e-07, + "loss": 0.0079, + "step": 395730 + }, + { + "epoch": 2.0, + "learning_rate": 5.161166635555039e-07, + "loss": 0.0063, + "step": 395740 + }, + { + "epoch": 2.0, + "learning_rate": 5.085489705414936e-07, + "loss": 0.0047, + "step": 395750 + }, + { + "epoch": 2.0, + "learning_rate": 5.009812775274833e-07, + "loss": 0.0086, + "step": 395760 + }, + { + "epoch": 2.0, + "learning_rate": 4.93413584513473e-07, + "loss": 0.0062, + "step": 395770 + }, + { + "epoch": 2.0, + "learning_rate": 4.858458914994627e-07, + "loss": 0.0044, + "step": 395780 + }, + { + "epoch": 2.0, + "learning_rate": 4.782781984854523e-07, + "loss": 0.0036, + "step": 395790 + }, + { + "epoch": 2.0, + "learning_rate": 4.70710505471442e-07, + "loss": 0.0067, + "step": 395800 + }, + { + "epoch": 2.0, + "learning_rate": 4.631428124574317e-07, + "loss": 0.0058, + "step": 395810 + }, + { + "epoch": 2.0, + "learning_rate": 4.5557511944342136e-07, + "loss": 0.0068, + "step": 395820 + }, + { + "epoch": 2.0, + "learning_rate": 4.48007426429411e-07, + "loss": 0.0067, + "step": 395830 + }, + { + "epoch": 2.0, + "learning_rate": 4.404397334154007e-07, + "loss": 0.0083, + "step": 395840 + }, + { + "epoch": 2.0, + "learning_rate": 4.328720404013904e-07, + "loss": 0.005, + "step": 395850 + }, + { + "epoch": 2.0, + "learning_rate": 4.2530434738738006e-07, + "loss": 0.006, + "step": 395860 + }, + { + "epoch": 2.0, + "learning_rate": 4.1773665437336976e-07, + "loss": 0.0043, + "step": 395870 + }, + { + "epoch": 2.0, + "learning_rate": 4.1016896135935946e-07, + "loss": 0.0056, + "step": 395880 + }, + { + "epoch": 2.0, + "learning_rate": 4.026012683453491e-07, + "loss": 0.0065, + "step": 395890 + }, + { + "epoch": 2.0, + "learning_rate": 3.950335753313388e-07, + "loss": 0.0047, + "step": 395900 + }, + { + "epoch": 2.0, + "learning_rate": 3.8746588231732846e-07, + "loss": 0.0051, + "step": 395910 + }, + { + "epoch": 2.0, + "learning_rate": 3.7989818930331816e-07, + "loss": 0.0048, + "step": 395920 + }, + { + "epoch": 2.0, + "learning_rate": 3.7233049628930786e-07, + "loss": 0.0056, + "step": 395930 + }, + { + "epoch": 2.0, + "learning_rate": 3.647628032752975e-07, + "loss": 0.0061, + "step": 395940 + }, + { + "epoch": 2.0, + "learning_rate": 3.5719511026128716e-07, + "loss": 0.004, + "step": 395950 + }, + { + "epoch": 2.0, + "learning_rate": 3.4962741724727686e-07, + "loss": 0.0052, + "step": 395960 + }, + { + "epoch": 2.0, + "learning_rate": 3.420597242332665e-07, + "loss": 0.0054, + "step": 395970 + }, + { + "epoch": 2.0, + "learning_rate": 3.344920312192562e-07, + "loss": 0.0061, + "step": 395980 + }, + { + "epoch": 2.0, + "learning_rate": 3.269243382052459e-07, + "loss": 0.005, + "step": 395990 + }, + { + "epoch": 2.0, + "learning_rate": 3.1935664519123556e-07, + "loss": 0.0044, + "step": 396000 + }, + { + "epoch": 2.0, + "eval_cer": 0.9144159137201398, + "eval_loss": 0.004107584245502949, + "eval_runtime": 116.1979, + "eval_samples_per_second": 17.212, + "eval_steps_per_second": 4.303, + "step": 396000 }, { "epoch": 2.0, - "learning_rate": 2.2702211844068234e-08, + "learning_rate": 3.1178895217722526e-07, + "loss": 0.0042, + "step": 396010 + }, + { + "epoch": 2.0, + "learning_rate": 3.0422125916321496e-07, + "loss": 0.0065, + "step": 396020 + }, + { + "epoch": 2.0, + "learning_rate": 2.966535661492046e-07, + "loss": 0.0079, + "step": 396030 + }, + { + "epoch": 2.0, + "learning_rate": 2.890858731351943e-07, + "loss": 0.0049, + "step": 396040 + }, + { + "epoch": 2.0, + "learning_rate": 2.8151818012118396e-07, + "loss": 0.0066, + "step": 396050 + }, + { + "epoch": 2.0, + "learning_rate": 2.7395048710717366e-07, "loss": 0.0055, - "step": 184990 + "step": 396060 + }, + { + "epoch": 2.0, + "learning_rate": 2.663827940931633e-07, + "loss": 0.0048, + "step": 396070 + }, + { + "epoch": 2.0, + "learning_rate": 2.58815101079153e-07, + "loss": 0.0059, + "step": 396080 + }, + { + "epoch": 2.0, + "learning_rate": 2.512474080651427e-07, + "loss": 0.0055, + "step": 396090 + }, + { + "epoch": 2.0, + "learning_rate": 2.4367971505113236e-07, + "loss": 0.0039, + "step": 396100 + }, + { + "epoch": 2.0, + "learning_rate": 2.3611202203712206e-07, + "loss": 0.0043, + "step": 396110 + }, + { + "epoch": 2.0, + "learning_rate": 2.285443290231117e-07, + "loss": 0.0069, + "step": 396120 + }, + { + "epoch": 2.0, + "learning_rate": 2.2097663600910138e-07, + "loss": 0.0048, + "step": 396130 + }, + { + "epoch": 2.0, + "learning_rate": 2.1340894299509105e-07, + "loss": 0.0041, + "step": 396140 + }, + { + "epoch": 2.0, + "learning_rate": 2.0584124998108076e-07, + "loss": 0.0069, + "step": 396150 + }, + { + "epoch": 2.0, + "learning_rate": 1.9827355696707043e-07, + "loss": 0.0048, + "step": 396160 + }, + { + "epoch": 2.0, + "learning_rate": 1.907058639530601e-07, + "loss": 0.0061, + "step": 396170 + }, + { + "epoch": 2.0, + "learning_rate": 1.831381709390498e-07, + "loss": 0.0049, + "step": 396180 + }, + { + "epoch": 2.0, + "learning_rate": 1.7557047792503945e-07, + "loss": 0.0058, + "step": 396190 + }, + { + "epoch": 2.0, + "learning_rate": 1.6800278491102913e-07, + "loss": 0.0052, + "step": 396200 + }, + { + "epoch": 2.0, + "learning_rate": 1.604350918970188e-07, + "loss": 0.0048, + "step": 396210 + }, + { + "epoch": 2.0, + "learning_rate": 1.528673988830085e-07, + "loss": 0.0044, + "step": 396220 + }, + { + "epoch": 2.0, + "learning_rate": 1.4529970586899818e-07, + "loss": 0.0069, + "step": 396230 + }, + { + "epoch": 2.0, + "learning_rate": 1.3773201285498785e-07, + "loss": 0.0053, + "step": 396240 + }, + { + "epoch": 2.0, + "learning_rate": 1.3016431984097753e-07, + "loss": 0.0071, + "step": 396250 }, { "epoch": 2.0, - "learning_rate": 6.486346241162353e-09, + "learning_rate": 1.225966268269672e-07, "loss": 0.0066, - "step": 185000 + "step": 396260 }, { "epoch": 2.0, - "eval_cer": 0.9215104310529031, - "eval_loss": 0.005186900030821562, - "eval_runtime": 121.1763, - "eval_samples_per_second": 16.505, - "eval_steps_per_second": 4.126, - "step": 185000 + "learning_rate": 1.1502893381295688e-07, + "loss": 0.0054, + "step": 396270 + }, + { + "epoch": 2.0, + "learning_rate": 1.0746124079894656e-07, + "loss": 0.006, + "step": 396280 + }, + { + "epoch": 2.0, + "learning_rate": 9.989354778493625e-08, + "loss": 0.0061, + "step": 396290 + }, + { + "epoch": 2.0, + "learning_rate": 9.232585477092593e-08, + "loss": 0.0059, + "step": 396300 + }, + { + "epoch": 2.0, + "learning_rate": 8.47581617569156e-08, + "loss": 0.0049, + "step": 396310 + }, + { + "epoch": 2.0, + "learning_rate": 7.719046874290528e-08, + "loss": 0.0063, + "step": 396320 + }, + { + "epoch": 2.0, + "learning_rate": 6.962277572889495e-08, + "loss": 0.0069, + "step": 396330 + }, + { + "epoch": 2.0, + "learning_rate": 6.205508271488464e-08, + "loss": 0.0054, + "step": 396340 + }, + { + "epoch": 2.0, + "learning_rate": 5.4487389700874314e-08, + "loss": 0.0046, + "step": 396350 + }, + { + "epoch": 2.0, + "learning_rate": 4.6919696686863995e-08, + "loss": 0.0044, + "step": 396360 + }, + { + "epoch": 2.0, + "learning_rate": 3.935200367285367e-08, + "loss": 0.0049, + "step": 396370 + }, + { + "epoch": 2.0, + "learning_rate": 3.178431065884335e-08, + "loss": 0.0076, + "step": 396380 + }, + { + "epoch": 2.0, + "learning_rate": 2.421661764483303e-08, + "loss": 0.0049, + "step": 396390 + }, + { + "epoch": 2.0, + "learning_rate": 1.6648924630822707e-08, + "loss": 0.007, + "step": 396400 + }, + { + "epoch": 2.0, + "learning_rate": 9.081231616812386e-09, + "loss": 0.0071, + "step": 396410 + }, + { + "epoch": 2.0, + "learning_rate": 1.5135386028020643e-09, + "loss": 0.0046, + "step": 396420 }, { "epoch": 2.0, - "step": 185004, - "total_flos": 9.988292384850125e+17, - "train_loss": 0.016045775709704408, - "train_runtime": 206173.8627, - "train_samples_per_second": 28.714, - "train_steps_per_second": 0.897 + "step": 396422, + "total_flos": 1.969031441954304e+18, + "train_loss": 0.013614018808192265, + "train_runtime": 415192.129, + "train_samples_per_second": 30.553, + "train_steps_per_second": 0.955 } ], - "max_steps": 185004, + "max_steps": 396422, "num_train_epochs": 2, - "total_flos": 9.988292384850125e+17, + "total_flos": 1.969031441954304e+18, "trial_name": null, "trial_params": null } diff --git a/training_args.bin b/training_args.bin index ad985175243904ba448e09c2eda08617f5466325..dd7ed437e2e51efe83f1dc0ea00a5bbae4a92271 100644 --- a/training_args.bin +++ b/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e466518c4579bd6bee53fdf30377e705184fd9f7e036056a6b09423ab880b7fd -size 3707 +oid sha256:1cd15191290a2c0e137c6f35a6f650076ece6690fadfa42b7621140db2393fbb +size 4155